os_solaris.cpp revision 269:850fdf70db2b
1/*
2 * Copyright 1997-2008 Sun Microsystems, Inc.  All Rights Reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation.
8 *
9 * This code is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
12 * version 2 for more details (a copy is included in the LICENSE file that
13 * accompanied this code).
14 *
15 * You should have received a copy of the GNU General Public License version
16 * 2 along with this work; if not, write to the Free Software Foundation,
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18 *
19 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
20 * CA 95054 USA or visit www.sun.com if you need additional information or
21 * have any questions.
22 *
23 */
24
25// do not include  precompiled  header file
26# include "incls/_os_solaris.cpp.incl"
27
28// put OS-includes here
29# include <dlfcn.h>
30# include <errno.h>
31# include <link.h>
32# include <poll.h>
33# include <pthread.h>
34# include <pwd.h>
35# include <schedctl.h>
36# include <setjmp.h>
37# include <signal.h>
38# include <stdio.h>
39# include <alloca.h>
40# include <sys/filio.h>
41# include <sys/ipc.h>
42# include <sys/lwp.h>
43# include <sys/machelf.h>     // for elf Sym structure used by dladdr1
44# include <sys/mman.h>
45# include <sys/processor.h>
46# include <sys/procset.h>
47# include <sys/pset.h>
48# include <sys/resource.h>
49# include <sys/shm.h>
50# include <sys/socket.h>
51# include <sys/stat.h>
52# include <sys/systeminfo.h>
53# include <sys/time.h>
54# include <sys/times.h>
55# include <sys/types.h>
56# include <sys/wait.h>
57# include <sys/utsname.h>
58# include <thread.h>
59# include <unistd.h>
60# include <sys/priocntl.h>
61# include <sys/rtpriocntl.h>
62# include <sys/tspriocntl.h>
63# include <sys/iapriocntl.h>
64# include <sys/loadavg.h>
65# include <string.h>
66
67# define _STRUCTURED_PROC 1  //  this gets us the new structured proc interfaces of 5.6 & later
68# include <sys/procfs.h>     //  see comment in <sys/procfs.h>
69
70#define MAX_PATH (2 * K)
71
72// for timer info max values which include all bits
73#define ALL_64_BITS CONST64(0xFFFFFFFFFFFFFFFF)
74
75#ifdef _GNU_SOURCE
76// See bug #6514594
77extern "C" int madvise(caddr_t, size_t, int);
78extern "C"  int memcntl(caddr_t addr, size_t len, int cmd, caddr_t  arg,
79     int attr, int mask);
80#endif //_GNU_SOURCE
81
82/*
83  MPSS Changes Start.
84  The JVM binary needs to be built and run on pre-Solaris 9
85  systems, but the constants needed by MPSS are only in Solaris 9
86  header files.  They are textually replicated here to allow
87  building on earlier systems.  Once building on Solaris 8 is
88  no longer a requirement, these #defines can be replaced by ordinary
89  system .h inclusion.
90
91  In earlier versions of the  JDK and Solaris, we used ISM for large pages.
92  But ISM requires shared memory to achieve this and thus has many caveats.
93  MPSS is a fully transparent and is a cleaner way to get large pages.
94  Although we still require keeping ISM for backward compatiblitiy as well as
95  giving the opportunity to use large pages on older systems it is
96  recommended that MPSS be used for Solaris 9 and above.
97
98*/
99
100#ifndef MC_HAT_ADVISE
101
102struct memcntl_mha {
103  uint_t          mha_cmd;        /* command(s) */
104  uint_t          mha_flags;
105  size_t          mha_pagesize;
106};
107#define MC_HAT_ADVISE   7       /* advise hat map size */
108#define MHA_MAPSIZE_VA  0x1     /* set preferred page size */
109#define MAP_ALIGN       0x200   /* addr specifies alignment */
110
111#endif
112// MPSS Changes End.
113
114
115// Here are some liblgrp types from sys/lgrp_user.h to be able to
116// compile on older systems without this header file.
117
118#ifndef MADV_ACCESS_LWP
119# define  MADV_ACCESS_LWP         7       /* next LWP to access heavily */
120#endif
121#ifndef MADV_ACCESS_MANY
122# define  MADV_ACCESS_MANY        8       /* many processes to access heavily */
123#endif
124
125#ifndef LGRP_RSRC_CPU
126# define LGRP_RSRC_CPU           0       /* CPU resources */
127#endif
128#ifndef LGRP_RSRC_MEM
129# define LGRP_RSRC_MEM           1       /* memory resources */
130#endif
131
132// Some more macros from sys/mman.h that are not present in Solaris 8.
133
134#ifndef MAX_MEMINFO_CNT
135/*
136 * info_req request type definitions for meminfo
137 * request types starting with MEMINFO_V are used for Virtual addresses
138 * and should not be mixed with MEMINFO_PLGRP which is targeted for Physical
139 * addresses
140 */
141# define MEMINFO_SHIFT           16
142# define MEMINFO_MASK            (0xFF << MEMINFO_SHIFT)
143# define MEMINFO_VPHYSICAL       (0x01 << MEMINFO_SHIFT) /* get physical addr */
144# define MEMINFO_VLGRP           (0x02 << MEMINFO_SHIFT) /* get lgroup */
145# define MEMINFO_VPAGESIZE       (0x03 << MEMINFO_SHIFT) /* size of phys page */
146# define MEMINFO_VREPLCNT        (0x04 << MEMINFO_SHIFT) /* no. of replica */
147# define MEMINFO_VREPL           (0x05 << MEMINFO_SHIFT) /* physical replica */
148# define MEMINFO_VREPL_LGRP      (0x06 << MEMINFO_SHIFT) /* lgrp of replica */
149# define MEMINFO_PLGRP           (0x07 << MEMINFO_SHIFT) /* lgroup for paddr */
150
151/* maximum number of addresses meminfo() can process at a time */
152# define MAX_MEMINFO_CNT 256
153
154/* maximum number of request types */
155# define MAX_MEMINFO_REQ 31
156#endif
157
158// see thr_setprio(3T) for the basis of these numbers
159#define MinimumPriority 0
160#define NormalPriority  64
161#define MaximumPriority 127
162
163// Values for ThreadPriorityPolicy == 1
164int prio_policy1[MaxPriority+1] = { -99999, 0, 16, 32, 48, 64,
165                                        80, 96, 112, 124, 127 };
166
167// System parameters used internally
168static clock_t clock_tics_per_sec = 100;
169
170// For diagnostics to print a message once. see run_periodic_checks
171static bool check_addr0_done = false;
172static sigset_t check_signal_done;
173static bool check_signals = true;
174
175address os::Solaris::handler_start;  // start pc of thr_sighndlrinfo
176address os::Solaris::handler_end;    // end pc of thr_sighndlrinfo
177
178address os::Solaris::_main_stack_base = NULL;  // 4352906 workaround
179
180
181// "default" initializers for missing libc APIs
182extern "C" {
183  static int lwp_mutex_init(mutex_t *mx, int scope, void *arg) { memset(mx, 0, sizeof(mutex_t)); return 0; }
184  static int lwp_mutex_destroy(mutex_t *mx)                 { return 0; }
185
186  static int lwp_cond_init(cond_t *cv, int scope, void *arg){ memset(cv, 0, sizeof(cond_t)); return 0; }
187  static int lwp_cond_destroy(cond_t *cv)                   { return 0; }
188}
189
190// "default" initializers for pthread-based synchronization
191extern "C" {
192  static int pthread_mutex_default_init(mutex_t *mx, int scope, void *arg) { memset(mx, 0, sizeof(mutex_t)); return 0; }
193  static int pthread_cond_default_init(cond_t *cv, int scope, void *arg){ memset(cv, 0, sizeof(cond_t)); return 0; }
194}
195
196// Thread Local Storage
197// This is common to all Solaris platforms so it is defined here,
198// in this common file.
199// The declarations are in the os_cpu threadLS*.hpp files.
200//
201// Static member initialization for TLS
202Thread* ThreadLocalStorage::_get_thread_cache[ThreadLocalStorage::_pd_cache_size] = {NULL};
203
204#ifndef PRODUCT
205#define _PCT(n,d)       ((100.0*(double)(n))/(double)(d))
206
207int ThreadLocalStorage::_tcacheHit = 0;
208int ThreadLocalStorage::_tcacheMiss = 0;
209
210void ThreadLocalStorage::print_statistics() {
211  int total = _tcacheMiss+_tcacheHit;
212  tty->print_cr("Thread cache hits %d misses %d total %d percent %f\n",
213                _tcacheHit, _tcacheMiss, total, _PCT(_tcacheHit, total));
214}
215#undef _PCT
216#endif // PRODUCT
217
218Thread* ThreadLocalStorage::get_thread_via_cache_slowly(uintptr_t raw_id,
219                                                        int index) {
220  Thread *thread = get_thread_slow();
221  if (thread != NULL) {
222    address sp = os::current_stack_pointer();
223    guarantee(thread->_stack_base == NULL ||
224              (sp <= thread->_stack_base &&
225                 sp >= thread->_stack_base - thread->_stack_size) ||
226               is_error_reported(),
227              "sp must be inside of selected thread stack");
228
229    thread->_self_raw_id = raw_id;  // mark for quick retrieval
230    _get_thread_cache[ index ] = thread;
231  }
232  return thread;
233}
234
235
236static const double all_zero[ sizeof(Thread) / sizeof(double) + 1 ] = {0};
237#define NO_CACHED_THREAD ((Thread*)all_zero)
238
239void ThreadLocalStorage::pd_set_thread(Thread* thread) {
240
241  // Store the new value before updating the cache to prevent a race
242  // between get_thread_via_cache_slowly() and this store operation.
243  os::thread_local_storage_at_put(ThreadLocalStorage::thread_index(), thread);
244
245  // Update thread cache with new thread if setting on thread create,
246  // or NO_CACHED_THREAD (zeroed) thread if resetting thread on exit.
247  uintptr_t raw = pd_raw_thread_id();
248  int ix = pd_cache_index(raw);
249  _get_thread_cache[ix] = thread == NULL ? NO_CACHED_THREAD : thread;
250}
251
252void ThreadLocalStorage::pd_init() {
253  for (int i = 0; i < _pd_cache_size; i++) {
254    _get_thread_cache[i] = NO_CACHED_THREAD;
255  }
256}
257
258// Invalidate all the caches (happens to be the same as pd_init).
259void ThreadLocalStorage::pd_invalidate_all() { pd_init(); }
260
261#undef NO_CACHED_THREAD
262
263// END Thread Local Storage
264
265static inline size_t adjust_stack_size(address base, size_t size) {
266  if ((ssize_t)size < 0) {
267    // 4759953: Compensate for ridiculous stack size.
268    size = max_intx;
269  }
270  if (size > (size_t)base) {
271    // 4812466: Make sure size doesn't allow the stack to wrap the address space.
272    size = (size_t)base;
273  }
274  return size;
275}
276
277static inline stack_t get_stack_info() {
278  stack_t st;
279  int retval = thr_stksegment(&st);
280  st.ss_size = adjust_stack_size((address)st.ss_sp, st.ss_size);
281  assert(retval == 0, "incorrect return value from thr_stksegment");
282  assert((address)&st < (address)st.ss_sp, "Invalid stack base returned");
283  assert((address)&st > (address)st.ss_sp-st.ss_size, "Invalid stack size returned");
284  return st;
285}
286
287address os::current_stack_base() {
288  int r = thr_main() ;
289  guarantee (r == 0 || r == 1, "CR6501650 or CR6493689") ;
290  bool is_primordial_thread = r;
291
292  // Workaround 4352906, avoid calls to thr_stksegment by
293  // thr_main after the first one (it looks like we trash
294  // some data, causing the value for ss_sp to be incorrect).
295  if (!is_primordial_thread || os::Solaris::_main_stack_base == NULL) {
296    stack_t st = get_stack_info();
297    if (is_primordial_thread) {
298      // cache initial value of stack base
299      os::Solaris::_main_stack_base = (address)st.ss_sp;
300    }
301    return (address)st.ss_sp;
302  } else {
303    guarantee(os::Solaris::_main_stack_base != NULL, "Attempt to use null cached stack base");
304    return os::Solaris::_main_stack_base;
305  }
306}
307
308size_t os::current_stack_size() {
309  size_t size;
310
311  int r = thr_main() ;
312  guarantee (r == 0 || r == 1, "CR6501650 or CR6493689") ;
313  if(!r) {
314    size = get_stack_info().ss_size;
315  } else {
316    struct rlimit limits;
317    getrlimit(RLIMIT_STACK, &limits);
318    size = adjust_stack_size(os::Solaris::_main_stack_base, (size_t)limits.rlim_cur);
319  }
320  // base may not be page aligned
321  address base = current_stack_base();
322  address bottom = (address)align_size_up((intptr_t)(base - size), os::vm_page_size());;
323  return (size_t)(base - bottom);
324}
325
326// interruptible infrastructure
327
328// setup_interruptible saves the thread state before going into an
329// interruptible system call.
330// The saved state is used to restore the thread to
331// its former state whether or not an interrupt is received.
332// Used by classloader os::read
333// hpi calls skip this layer and stay in _thread_in_native
334
335void os::Solaris::setup_interruptible(JavaThread* thread) {
336
337  JavaThreadState thread_state = thread->thread_state();
338
339  assert(thread_state != _thread_blocked, "Coming from the wrong thread");
340  assert(thread_state != _thread_in_native, "Native threads skip setup_interruptible");
341  OSThread* osthread = thread->osthread();
342  osthread->set_saved_interrupt_thread_state(thread_state);
343  thread->frame_anchor()->make_walkable(thread);
344  ThreadStateTransition::transition(thread, thread_state, _thread_blocked);
345}
346
347// Version of setup_interruptible() for threads that are already in
348// _thread_blocked. Used by os_sleep().
349void os::Solaris::setup_interruptible_already_blocked(JavaThread* thread) {
350  thread->frame_anchor()->make_walkable(thread);
351}
352
353JavaThread* os::Solaris::setup_interruptible() {
354  JavaThread* thread = (JavaThread*)ThreadLocalStorage::thread();
355  setup_interruptible(thread);
356  return thread;
357}
358
359void os::Solaris::try_enable_extended_io() {
360  typedef int (*enable_extended_FILE_stdio_t)(int, int);
361
362  if (!UseExtendedFileIO) {
363    return;
364  }
365
366  enable_extended_FILE_stdio_t enabler =
367    (enable_extended_FILE_stdio_t) dlsym(RTLD_DEFAULT,
368                                         "enable_extended_FILE_stdio");
369  if (enabler) {
370    enabler(-1, -1);
371  }
372}
373
374
375#ifdef ASSERT
376
377JavaThread* os::Solaris::setup_interruptible_native() {
378  JavaThread* thread = (JavaThread*)ThreadLocalStorage::thread();
379  JavaThreadState thread_state = thread->thread_state();
380  assert(thread_state == _thread_in_native, "Assumed thread_in_native");
381  return thread;
382}
383
384void os::Solaris::cleanup_interruptible_native(JavaThread* thread) {
385  JavaThreadState thread_state = thread->thread_state();
386  assert(thread_state == _thread_in_native, "Assumed thread_in_native");
387}
388#endif
389
390// cleanup_interruptible reverses the effects of setup_interruptible
391// setup_interruptible_already_blocked() does not need any cleanup.
392
393void os::Solaris::cleanup_interruptible(JavaThread* thread) {
394  OSThread* osthread = thread->osthread();
395
396  ThreadStateTransition::transition(thread, _thread_blocked, osthread->saved_interrupt_thread_state());
397}
398
399// I/O interruption related counters called in _INTERRUPTIBLE
400
401void os::Solaris::bump_interrupted_before_count() {
402  RuntimeService::record_interrupted_before_count();
403}
404
405void os::Solaris::bump_interrupted_during_count() {
406  RuntimeService::record_interrupted_during_count();
407}
408
409static int _processors_online = 0;
410
411         jint os::Solaris::_os_thread_limit = 0;
412volatile jint os::Solaris::_os_thread_count = 0;
413
414julong os::available_memory() {
415  return Solaris::available_memory();
416}
417
418julong os::Solaris::available_memory() {
419  return (julong)sysconf(_SC_AVPHYS_PAGES) * os::vm_page_size();
420}
421
422julong os::Solaris::_physical_memory = 0;
423
424julong os::physical_memory() {
425   return Solaris::physical_memory();
426}
427
428julong os::allocatable_physical_memory(julong size) {
429#ifdef _LP64
430   return size;
431#else
432   julong result = MIN2(size, (julong)3835*M);
433   if (!is_allocatable(result)) {
434     // Memory allocations will be aligned but the alignment
435     // is not known at this point.  Alignments will
436     // be at most to LargePageSizeInBytes.  Protect
437     // allocations from alignments up to illegal
438     // values. If at this point 2G is illegal.
439     julong reasonable_size = (julong)2*G - 2 * LargePageSizeInBytes;
440     result =  MIN2(size, reasonable_size);
441   }
442   return result;
443#endif
444}
445
446static hrtime_t first_hrtime = 0;
447static const hrtime_t hrtime_hz = 1000*1000*1000;
448const int LOCK_BUSY = 1;
449const int LOCK_FREE = 0;
450const int LOCK_INVALID = -1;
451static volatile hrtime_t max_hrtime = 0;
452static volatile int max_hrtime_lock = LOCK_FREE;     // Update counter with LSB as lock-in-progress
453
454
455void os::Solaris::initialize_system_info() {
456  _processor_count = sysconf(_SC_NPROCESSORS_CONF);
457  _processors_online = sysconf (_SC_NPROCESSORS_ONLN);
458  _physical_memory = (julong)sysconf(_SC_PHYS_PAGES) * (julong)sysconf(_SC_PAGESIZE);
459}
460
461int os::active_processor_count() {
462  int online_cpus = sysconf(_SC_NPROCESSORS_ONLN);
463  pid_t pid = getpid();
464  psetid_t pset = PS_NONE;
465  // Are we running in a processor set?
466  if (pset_bind(PS_QUERY, P_PID, pid, &pset) == 0) {
467    if (pset != PS_NONE) {
468      uint_t pset_cpus;
469      // Query number of cpus in processor set
470      if (pset_info(pset, NULL, &pset_cpus, NULL) == 0) {
471        assert(pset_cpus > 0 && pset_cpus <= online_cpus, "sanity check");
472        _processors_online = pset_cpus;
473        return pset_cpus;
474      }
475    }
476  }
477  // Otherwise return number of online cpus
478  return online_cpus;
479}
480
481static bool find_processors_in_pset(psetid_t        pset,
482                                    processorid_t** id_array,
483                                    uint_t*         id_length) {
484  bool result = false;
485  // Find the number of processors in the processor set.
486  if (pset_info(pset, NULL, id_length, NULL) == 0) {
487    // Make up an array to hold their ids.
488    *id_array = NEW_C_HEAP_ARRAY(processorid_t, *id_length);
489    // Fill in the array with their processor ids.
490    if (pset_info(pset, NULL, id_length, *id_array) == 0) {
491      result = true;
492    }
493  }
494  return result;
495}
496
497// Callers of find_processors_online() must tolerate imprecise results --
498// the system configuration can change asynchronously because of DR
499// or explicit psradm operations.
500//
501// We also need to take care that the loop (below) terminates as the
502// number of processors online can change between the _SC_NPROCESSORS_ONLN
503// request and the loop that builds the list of processor ids.   Unfortunately
504// there's no reliable way to determine the maximum valid processor id,
505// so we use a manifest constant, MAX_PROCESSOR_ID, instead.  See p_online
506// man pages, which claim the processor id set is "sparse, but
507// not too sparse".  MAX_PROCESSOR_ID is used to ensure that we eventually
508// exit the loop.
509//
510// In the future we'll be able to use sysconf(_SC_CPUID_MAX), but that's
511// not available on S8.0.
512
513static bool find_processors_online(processorid_t** id_array,
514                                   uint*           id_length) {
515  const processorid_t MAX_PROCESSOR_ID = 100000 ;
516  // Find the number of processors online.
517  *id_length = sysconf(_SC_NPROCESSORS_ONLN);
518  // Make up an array to hold their ids.
519  *id_array = NEW_C_HEAP_ARRAY(processorid_t, *id_length);
520  // Processors need not be numbered consecutively.
521  long found = 0;
522  processorid_t next = 0;
523  while (found < *id_length && next < MAX_PROCESSOR_ID) {
524    processor_info_t info;
525    if (processor_info(next, &info) == 0) {
526      // NB, PI_NOINTR processors are effectively online ...
527      if (info.pi_state == P_ONLINE || info.pi_state == P_NOINTR) {
528        (*id_array)[found] = next;
529        found += 1;
530      }
531    }
532    next += 1;
533  }
534  if (found < *id_length) {
535      // The loop above didn't identify the expected number of processors.
536      // We could always retry the operation, calling sysconf(_SC_NPROCESSORS_ONLN)
537      // and re-running the loop, above, but there's no guarantee of progress
538      // if the system configuration is in flux.  Instead, we just return what
539      // we've got.  Note that in the worst case find_processors_online() could
540      // return an empty set.  (As a fall-back in the case of the empty set we
541      // could just return the ID of the current processor).
542      *id_length = found ;
543  }
544
545  return true;
546}
547
548static bool assign_distribution(processorid_t* id_array,
549                                uint           id_length,
550                                uint*          distribution,
551                                uint           distribution_length) {
552  // We assume we can assign processorid_t's to uint's.
553  assert(sizeof(processorid_t) == sizeof(uint),
554         "can't convert processorid_t to uint");
555  // Quick check to see if we won't succeed.
556  if (id_length < distribution_length) {
557    return false;
558  }
559  // Assign processor ids to the distribution.
560  // Try to shuffle processors to distribute work across boards,
561  // assuming 4 processors per board.
562  const uint processors_per_board = ProcessDistributionStride;
563  // Find the maximum processor id.
564  processorid_t max_id = 0;
565  for (uint m = 0; m < id_length; m += 1) {
566    max_id = MAX2(max_id, id_array[m]);
567  }
568  // The next id, to limit loops.
569  const processorid_t limit_id = max_id + 1;
570  // Make up markers for available processors.
571  bool* available_id = NEW_C_HEAP_ARRAY(bool, limit_id);
572  for (uint c = 0; c < limit_id; c += 1) {
573    available_id[c] = false;
574  }
575  for (uint a = 0; a < id_length; a += 1) {
576    available_id[id_array[a]] = true;
577  }
578  // Step by "boards", then by "slot", copying to "assigned".
579  // NEEDS_CLEANUP: The assignment of processors should be stateful,
580  //                remembering which processors have been assigned by
581  //                previous calls, etc., so as to distribute several
582  //                independent calls of this method.  What we'd like is
583  //                It would be nice to have an API that let us ask
584  //                how many processes are bound to a processor,
585  //                but we don't have that, either.
586  //                In the short term, "board" is static so that
587  //                subsequent distributions don't all start at board 0.
588  static uint board = 0;
589  uint assigned = 0;
590  // Until we've found enough processors ....
591  while (assigned < distribution_length) {
592    // ... find the next available processor in the board.
593    for (uint slot = 0; slot < processors_per_board; slot += 1) {
594      uint try_id = board * processors_per_board + slot;
595      if ((try_id < limit_id) && (available_id[try_id] == true)) {
596        distribution[assigned] = try_id;
597        available_id[try_id] = false;
598        assigned += 1;
599        break;
600      }
601    }
602    board += 1;
603    if (board * processors_per_board + 0 >= limit_id) {
604      board = 0;
605    }
606  }
607  if (available_id != NULL) {
608    FREE_C_HEAP_ARRAY(bool, available_id);
609  }
610  return true;
611}
612
613bool os::distribute_processes(uint length, uint* distribution) {
614  bool result = false;
615  // Find the processor id's of all the available CPUs.
616  processorid_t* id_array  = NULL;
617  uint           id_length = 0;
618  // There are some races between querying information and using it,
619  // since processor sets can change dynamically.
620  psetid_t pset = PS_NONE;
621  // Are we running in a processor set?
622  if ((pset_bind(PS_QUERY, P_PID, P_MYID, &pset) == 0) && pset != PS_NONE) {
623    result = find_processors_in_pset(pset, &id_array, &id_length);
624  } else {
625    result = find_processors_online(&id_array, &id_length);
626  }
627  if (result == true) {
628    if (id_length >= length) {
629      result = assign_distribution(id_array, id_length, distribution, length);
630    } else {
631      result = false;
632    }
633  }
634  if (id_array != NULL) {
635    FREE_C_HEAP_ARRAY(processorid_t, id_array);
636  }
637  return result;
638}
639
640bool os::bind_to_processor(uint processor_id) {
641  // We assume that a processorid_t can be stored in a uint.
642  assert(sizeof(uint) == sizeof(processorid_t),
643         "can't convert uint to processorid_t");
644  int bind_result =
645    processor_bind(P_LWPID,                       // bind LWP.
646                   P_MYID,                        // bind current LWP.
647                   (processorid_t) processor_id,  // id.
648                   NULL);                         // don't return old binding.
649  return (bind_result == 0);
650}
651
652bool os::getenv(const char* name, char* buffer, int len) {
653  char* val = ::getenv( name );
654  if ( val == NULL
655  ||   strlen(val) + 1  >  len ) {
656    if (len > 0)  buffer[0] = 0; // return a null string
657    return false;
658  }
659  strcpy( buffer, val );
660  return true;
661}
662
663
664// Return true if user is running as root.
665
666bool os::have_special_privileges() {
667  static bool init = false;
668  static bool privileges = false;
669  if (!init) {
670    privileges = (getuid() != geteuid()) || (getgid() != getegid());
671    init = true;
672  }
673  return privileges;
674}
675
676
677static char* get_property(char* name, char* buffer, int buffer_size) {
678  if (os::getenv(name, buffer, buffer_size)) {
679    return buffer;
680  }
681  static char empty[] = "";
682  return empty;
683}
684
685
686void os::init_system_properties_values() {
687  char arch[12];
688  sysinfo(SI_ARCHITECTURE, arch, sizeof(arch));
689
690  // The next steps are taken in the product version:
691  //
692  // Obtain the JAVA_HOME value from the location of libjvm[_g].so.
693  // This library should be located at:
694  // <JAVA_HOME>/jre/lib/<arch>/{client|server}/libjvm[_g].so.
695  //
696  // If "/jre/lib/" appears at the right place in the path, then we
697  // assume libjvm[_g].so is installed in a JDK and we use this path.
698  //
699  // Otherwise exit with message: "Could not create the Java virtual machine."
700  //
701  // The following extra steps are taken in the debugging version:
702  //
703  // If "/jre/lib/" does NOT appear at the right place in the path
704  // instead of exit check for $JAVA_HOME environment variable.
705  //
706  // If it is defined and we are able to locate $JAVA_HOME/jre/lib/<arch>,
707  // then we append a fake suffix "hotspot/libjvm[_g].so" to this path so
708  // it looks like libjvm[_g].so is installed there
709  // <JAVA_HOME>/jre/lib/<arch>/hotspot/libjvm[_g].so.
710  //
711  // Otherwise exit.
712  //
713  // Important note: if the location of libjvm.so changes this
714  // code needs to be changed accordingly.
715
716  // The next few definitions allow the code to be verbatim:
717#define malloc(n) (char*)NEW_C_HEAP_ARRAY(char, (n))
718#define free(p) FREE_C_HEAP_ARRAY(char, p)
719#define getenv(n) ::getenv(n)
720
721#define EXTENSIONS_DIR  "/lib/ext"
722#define ENDORSED_DIR    "/lib/endorsed"
723#define COMMON_DIR      "/usr/jdk/packages"
724
725  {
726    /* sysclasspath, java_home, dll_dir */
727    {
728        char *home_path;
729        char *dll_path;
730        char *pslash;
731        char buf[MAXPATHLEN];
732        os::jvm_path(buf, sizeof(buf));
733
734        // Found the full path to libjvm.so.
735        // Now cut the path to <java_home>/jre if we can.
736        *(strrchr(buf, '/')) = '\0';  /* get rid of /libjvm.so */
737        pslash = strrchr(buf, '/');
738        if (pslash != NULL)
739            *pslash = '\0';           /* get rid of /{client|server|hotspot} */
740        dll_path = malloc(strlen(buf) + 1);
741        if (dll_path == NULL)
742            return;
743        strcpy(dll_path, buf);
744        Arguments::set_dll_dir(dll_path);
745
746        if (pslash != NULL) {
747            pslash = strrchr(buf, '/');
748            if (pslash != NULL) {
749                *pslash = '\0';       /* get rid of /<arch> */
750                pslash = strrchr(buf, '/');
751                if (pslash != NULL)
752                    *pslash = '\0';   /* get rid of /lib */
753            }
754        }
755
756        home_path = malloc(strlen(buf) + 1);
757        if (home_path == NULL)
758            return;
759        strcpy(home_path, buf);
760        Arguments::set_java_home(home_path);
761
762        if (!set_boot_path('/', ':'))
763            return;
764    }
765
766    /*
767     * Where to look for native libraries
768     */
769    {
770      // Use dlinfo() to determine the correct java.library.path.
771      //
772      // If we're launched by the Java launcher, and the user
773      // does not set java.library.path explicitly on the commandline,
774      // the Java launcher sets LD_LIBRARY_PATH for us and unsets
775      // LD_LIBRARY_PATH_32 and LD_LIBRARY_PATH_64.  In this case
776      // dlinfo returns LD_LIBRARY_PATH + crle settings (including
777      // /usr/lib), which is exactly what we want.
778      //
779      // If the user does set java.library.path, it completely
780      // overwrites this setting, and always has.
781      //
782      // If we're not launched by the Java launcher, we may
783      // get here with any/all of the LD_LIBRARY_PATH[_32|64]
784      // settings.  Again, dlinfo does exactly what we want.
785
786      Dl_serinfo     _info, *info = &_info;
787      Dl_serpath     *path;
788      char*          library_path;
789      char           *common_path;
790      int            i;
791
792      // determine search path count and required buffer size
793      if (dlinfo(RTLD_SELF, RTLD_DI_SERINFOSIZE, (void *)info) == -1) {
794        vm_exit_during_initialization("dlinfo SERINFOSIZE request", dlerror());
795      }
796
797      // allocate new buffer and initialize
798      info = (Dl_serinfo*)malloc(_info.dls_size);
799      if (info == NULL) {
800        vm_exit_out_of_memory(_info.dls_size,
801                              "init_system_properties_values info");
802      }
803      info->dls_size = _info.dls_size;
804      info->dls_cnt = _info.dls_cnt;
805
806      // obtain search path information
807      if (dlinfo(RTLD_SELF, RTLD_DI_SERINFO, (void *)info) == -1) {
808        free(info);
809        vm_exit_during_initialization("dlinfo SERINFO request", dlerror());
810      }
811
812      path = &info->dls_serpath[0];
813
814      // Note: Due to a legacy implementation, most of the library path
815      // is set in the launcher.  This was to accomodate linking restrictions
816      // on legacy Solaris implementations (which are no longer supported).
817      // Eventually, all the library path setting will be done here.
818      //
819      // However, to prevent the proliferation of improperly built native
820      // libraries, the new path component /usr/jdk/packages is added here.
821
822      // Determine the actual CPU architecture.
823      char cpu_arch[12];
824      sysinfo(SI_ARCHITECTURE, cpu_arch, sizeof(cpu_arch));
825#ifdef _LP64
826      // If we are a 64-bit vm, perform the following translations:
827      //   sparc   -> sparcv9
828      //   i386    -> amd64
829      if (strcmp(cpu_arch, "sparc") == 0)
830        strcat(cpu_arch, "v9");
831      else if (strcmp(cpu_arch, "i386") == 0)
832        strcpy(cpu_arch, "amd64");
833#endif
834
835      // Construct the invariant part of ld_library_path. Note that the
836      // space for the colon and the trailing null are provided by the
837      // nulls included by the sizeof operator.
838      size_t bufsize = sizeof(COMMON_DIR) + sizeof("/lib/") + strlen(cpu_arch);
839      common_path = malloc(bufsize);
840      if (common_path == NULL) {
841        free(info);
842        vm_exit_out_of_memory(bufsize,
843                              "init_system_properties_values common_path");
844      }
845      sprintf(common_path, COMMON_DIR "/lib/%s", cpu_arch);
846
847      // struct size is more than sufficient for the path components obtained
848      // through the dlinfo() call, so only add additional space for the path
849      // components explicitly added here.
850      bufsize = info->dls_size + strlen(common_path);
851      library_path = malloc(bufsize);
852      if (library_path == NULL) {
853        free(info);
854        free(common_path);
855        vm_exit_out_of_memory(bufsize,
856                              "init_system_properties_values library_path");
857      }
858      library_path[0] = '\0';
859
860      // Construct the desired Java library path from the linker's library
861      // search path.
862      //
863      // For compatibility, it is optimal that we insert the additional path
864      // components specific to the Java VM after those components specified
865      // in LD_LIBRARY_PATH (if any) but before those added by the ld.so
866      // infrastructure.
867      if (info->dls_cnt == 0) { // Not sure this can happen, but allow for it
868        strcpy(library_path, common_path);
869      } else {
870        int inserted = 0;
871        for (i = 0; i < info->dls_cnt; i++, path++) {
872          uint_t flags = path->dls_flags & LA_SER_MASK;
873          if (((flags & LA_SER_LIBPATH) == 0) && !inserted) {
874            strcat(library_path, common_path);
875            strcat(library_path, os::path_separator());
876            inserted = 1;
877          }
878          strcat(library_path, path->dls_name);
879          strcat(library_path, os::path_separator());
880        }
881        // eliminate trailing path separator
882        library_path[strlen(library_path)-1] = '\0';
883      }
884
885      // happens before argument parsing - can't use a trace flag
886      // tty->print_raw("init_system_properties_values: native lib path: ");
887      // tty->print_raw_cr(library_path);
888
889      // callee copies into its own buffer
890      Arguments::set_library_path(library_path);
891
892      free(common_path);
893      free(library_path);
894      free(info);
895    }
896
897    /*
898     * Extensions directories.
899     *
900     * Note that the space for the colon and the trailing null are provided
901     * by the nulls included by the sizeof operator (so actually one byte more
902     * than necessary is allocated).
903     */
904    {
905        char *buf = (char *) malloc(strlen(Arguments::get_java_home()) +
906            sizeof(EXTENSIONS_DIR) + sizeof(COMMON_DIR) +
907            sizeof(EXTENSIONS_DIR));
908        sprintf(buf, "%s" EXTENSIONS_DIR ":" COMMON_DIR EXTENSIONS_DIR,
909            Arguments::get_java_home());
910        Arguments::set_ext_dirs(buf);
911    }
912
913    /* Endorsed standards default directory. */
914    {
915        char * buf = malloc(strlen(Arguments::get_java_home()) + sizeof(ENDORSED_DIR));
916        sprintf(buf, "%s" ENDORSED_DIR, Arguments::get_java_home());
917        Arguments::set_endorsed_dirs(buf);
918    }
919  }
920
921#undef malloc
922#undef free
923#undef getenv
924#undef EXTENSIONS_DIR
925#undef ENDORSED_DIR
926#undef COMMON_DIR
927
928}
929
930void os::breakpoint() {
931  BREAKPOINT;
932}
933
934bool os::obsolete_option(const JavaVMOption *option)
935{
936  if (!strncmp(option->optionString, "-Xt", 3)) {
937    return true;
938  } else if (!strncmp(option->optionString, "-Xtm", 4)) {
939    return true;
940  } else if (!strncmp(option->optionString, "-Xverifyheap", 12)) {
941    return true;
942  } else if (!strncmp(option->optionString, "-Xmaxjitcodesize", 16)) {
943    return true;
944  }
945  return false;
946}
947
948bool os::Solaris::valid_stack_address(Thread* thread, address sp) {
949  address  stackStart  = (address)thread->stack_base();
950  address  stackEnd    = (address)(stackStart - (address)thread->stack_size());
951  if (sp < stackStart && sp >= stackEnd ) return true;
952  return false;
953}
954
955extern "C" void breakpoint() {
956  // use debugger to set breakpoint here
957}
958
959// Returns an estimate of the current stack pointer. Result must be guaranteed to
960// point into the calling threads stack, and be no lower than the current stack
961// pointer.
962address os::current_stack_pointer() {
963  volatile int dummy;
964  address sp = (address)&dummy + 8;     // %%%% need to confirm if this is right
965  return sp;
966}
967
968static thread_t main_thread;
969
970// Thread start routine for all new Java threads
971extern "C" void* java_start(void* thread_addr) {
972  // Try to randomize the cache line index of hot stack frames.
973  // This helps when threads of the same stack traces evict each other's
974  // cache lines. The threads can be either from the same JVM instance, or
975  // from different JVM instances. The benefit is especially true for
976  // processors with hyperthreading technology.
977  static int counter = 0;
978  int pid = os::current_process_id();
979  alloca(((pid ^ counter++) & 7) * 128);
980
981  int prio;
982  Thread* thread = (Thread*)thread_addr;
983  OSThread* osthr = thread->osthread();
984
985  osthr->set_lwp_id( _lwp_self() );  // Store lwp in case we are bound
986  thread->_schedctl = (void *) schedctl_init () ;
987
988  if (UseNUMA) {
989    int lgrp_id = os::numa_get_group_id();
990    if (lgrp_id != -1) {
991      thread->set_lgrp_id(lgrp_id);
992    }
993  }
994
995  // If the creator called set priority before we started,
996  // we need to call set priority now that we have an lwp.
997  // Get the priority from libthread and set the priority
998  // for the new Solaris lwp.
999  if ( osthr->thread_id() != -1 ) {
1000    if ( UseThreadPriorities ) {
1001      thr_getprio(osthr->thread_id(), &prio);
1002      if (ThreadPriorityVerbose) {
1003        tty->print_cr("Starting Thread " INTPTR_FORMAT ", LWP is " INTPTR_FORMAT ", setting priority: %d\n",
1004                      osthr->thread_id(), osthr->lwp_id(), prio );
1005      }
1006      os::set_native_priority(thread, prio);
1007    }
1008  } else if (ThreadPriorityVerbose) {
1009    warning("Can't set priority in _start routine, thread id hasn't been set\n");
1010  }
1011
1012  assert(osthr->get_state() == RUNNABLE, "invalid os thread state");
1013
1014  // initialize signal mask for this thread
1015  os::Solaris::hotspot_sigmask(thread);
1016
1017  thread->run();
1018
1019  // One less thread is executing
1020  // When the VMThread gets here, the main thread may have already exited
1021  // which frees the CodeHeap containing the Atomic::dec code
1022  if (thread != VMThread::vm_thread() && VMThread::vm_thread() != NULL) {
1023    Atomic::dec(&os::Solaris::_os_thread_count);
1024  }
1025
1026  if (UseDetachedThreads) {
1027    thr_exit(NULL);
1028    ShouldNotReachHere();
1029  }
1030  return NULL;
1031}
1032
1033static OSThread* create_os_thread(Thread* thread, thread_t thread_id) {
1034  // Allocate the OSThread object
1035  OSThread* osthread = new OSThread(NULL, NULL);
1036  if (osthread == NULL) return NULL;
1037
1038  // Store info on the Solaris thread into the OSThread
1039  osthread->set_thread_id(thread_id);
1040  osthread->set_lwp_id(_lwp_self());
1041  thread->_schedctl = (void *) schedctl_init () ;
1042
1043  if (UseNUMA) {
1044    int lgrp_id = os::numa_get_group_id();
1045    if (lgrp_id != -1) {
1046      thread->set_lgrp_id(lgrp_id);
1047    }
1048  }
1049
1050  if ( ThreadPriorityVerbose ) {
1051    tty->print_cr("In create_os_thread, Thread " INTPTR_FORMAT ", LWP is " INTPTR_FORMAT "\n",
1052                  osthread->thread_id(), osthread->lwp_id() );
1053  }
1054
1055  // Initial thread state is INITIALIZED, not SUSPENDED
1056  osthread->set_state(INITIALIZED);
1057
1058  return osthread;
1059}
1060
1061void os::Solaris::hotspot_sigmask(Thread* thread) {
1062
1063  //Save caller's signal mask
1064  sigset_t sigmask;
1065  thr_sigsetmask(SIG_SETMASK, NULL, &sigmask);
1066  OSThread *osthread = thread->osthread();
1067  osthread->set_caller_sigmask(sigmask);
1068
1069  thr_sigsetmask(SIG_UNBLOCK, os::Solaris::unblocked_signals(), NULL);
1070  if (!ReduceSignalUsage) {
1071    if (thread->is_VM_thread()) {
1072      // Only the VM thread handles BREAK_SIGNAL ...
1073      thr_sigsetmask(SIG_UNBLOCK, vm_signals(), NULL);
1074    } else {
1075      // ... all other threads block BREAK_SIGNAL
1076      assert(!sigismember(vm_signals(), SIGINT), "SIGINT should not be blocked");
1077      thr_sigsetmask(SIG_BLOCK, vm_signals(), NULL);
1078    }
1079  }
1080}
1081
1082bool os::create_attached_thread(JavaThread* thread) {
1083#ifdef ASSERT
1084  thread->verify_not_published();
1085#endif
1086  OSThread* osthread = create_os_thread(thread, thr_self());
1087  if (osthread == NULL) {
1088     return false;
1089  }
1090
1091  // Initial thread state is RUNNABLE
1092  osthread->set_state(RUNNABLE);
1093  thread->set_osthread(osthread);
1094
1095  // initialize signal mask for this thread
1096  // and save the caller's signal mask
1097  os::Solaris::hotspot_sigmask(thread);
1098
1099  return true;
1100}
1101
1102bool os::create_main_thread(JavaThread* thread) {
1103#ifdef ASSERT
1104  thread->verify_not_published();
1105#endif
1106  if (_starting_thread == NULL) {
1107    _starting_thread = create_os_thread(thread, main_thread);
1108     if (_starting_thread == NULL) {
1109        return false;
1110     }
1111  }
1112
1113  // The primodial thread is runnable from the start
1114  _starting_thread->set_state(RUNNABLE);
1115
1116  thread->set_osthread(_starting_thread);
1117
1118  // initialize signal mask for this thread
1119  // and save the caller's signal mask
1120  os::Solaris::hotspot_sigmask(thread);
1121
1122  return true;
1123}
1124
1125// _T2_libthread is true if we believe we are running with the newer
1126// SunSoft lwp/libthread.so (2.8 patch, 2.9 default)
1127bool os::Solaris::_T2_libthread = false;
1128
1129bool os::create_thread(Thread* thread, ThreadType thr_type, size_t stack_size) {
1130  // Allocate the OSThread object
1131  OSThread* osthread = new OSThread(NULL, NULL);
1132  if (osthread == NULL) {
1133    return false;
1134  }
1135
1136  if ( ThreadPriorityVerbose ) {
1137    char *thrtyp;
1138    switch ( thr_type ) {
1139      case vm_thread:
1140        thrtyp = (char *)"vm";
1141        break;
1142      case cgc_thread:
1143        thrtyp = (char *)"cgc";
1144        break;
1145      case pgc_thread:
1146        thrtyp = (char *)"pgc";
1147        break;
1148      case java_thread:
1149        thrtyp = (char *)"java";
1150        break;
1151      case compiler_thread:
1152        thrtyp = (char *)"compiler";
1153        break;
1154      case watcher_thread:
1155        thrtyp = (char *)"watcher";
1156        break;
1157      default:
1158        thrtyp = (char *)"unknown";
1159        break;
1160    }
1161    tty->print_cr("In create_thread, creating a %s thread\n", thrtyp);
1162  }
1163
1164  // Calculate stack size if it's not specified by caller.
1165  if (stack_size == 0) {
1166    // The default stack size 1M (2M for LP64).
1167    stack_size = (BytesPerWord >> 2) * K * K;
1168
1169    switch (thr_type) {
1170    case os::java_thread:
1171      // Java threads use ThreadStackSize which default value can be changed with the flag -Xss
1172      if (JavaThread::stack_size_at_create() > 0) stack_size = JavaThread::stack_size_at_create();
1173      break;
1174    case os::compiler_thread:
1175      if (CompilerThreadStackSize > 0) {
1176        stack_size = (size_t)(CompilerThreadStackSize * K);
1177        break;
1178      } // else fall through:
1179        // use VMThreadStackSize if CompilerThreadStackSize is not defined
1180    case os::vm_thread:
1181    case os::pgc_thread:
1182    case os::cgc_thread:
1183    case os::watcher_thread:
1184      if (VMThreadStackSize > 0) stack_size = (size_t)(VMThreadStackSize * K);
1185      break;
1186    }
1187  }
1188  stack_size = MAX2(stack_size, os::Solaris::min_stack_allowed);
1189
1190  // Initial state is ALLOCATED but not INITIALIZED
1191  osthread->set_state(ALLOCATED);
1192
1193  if (os::Solaris::_os_thread_count > os::Solaris::_os_thread_limit) {
1194    // We got lots of threads. Check if we still have some address space left.
1195    // Need to be at least 5Mb of unreserved address space. We do check by
1196    // trying to reserve some.
1197    const size_t VirtualMemoryBangSize = 20*K*K;
1198    char* mem = os::reserve_memory(VirtualMemoryBangSize);
1199    if (mem == NULL) {
1200      delete osthread;
1201      return false;
1202    } else {
1203      // Release the memory again
1204      os::release_memory(mem, VirtualMemoryBangSize);
1205    }
1206  }
1207
1208  // Setup osthread because the child thread may need it.
1209  thread->set_osthread(osthread);
1210
1211  // Create the Solaris thread
1212  // explicit THR_BOUND for T2_libthread case in case
1213  // that assumption is not accurate, but our alternate signal stack
1214  // handling is based on it which must have bound threads
1215  thread_t tid = 0;
1216  long     flags = (UseDetachedThreads ? THR_DETACHED : 0) | THR_SUSPENDED
1217                   | ((UseBoundThreads || os::Solaris::T2_libthread() ||
1218                       (thr_type == vm_thread) ||
1219                       (thr_type == cgc_thread) ||
1220                       (thr_type == pgc_thread) ||
1221                       (thr_type == compiler_thread && BackgroundCompilation)) ?
1222                      THR_BOUND : 0);
1223  int      status;
1224
1225  // 4376845 -- libthread/kernel don't provide enough LWPs to utilize all CPUs.
1226  //
1227  // On multiprocessors systems, libthread sometimes under-provisions our
1228  // process with LWPs.  On a 30-way systems, for instance, we could have
1229  // 50 user-level threads in ready state and only 2 or 3 LWPs assigned
1230  // to our process.  This can result in under utilization of PEs.
1231  // I suspect the problem is related to libthread's LWP
1232  // pool management and to the kernel's SIGBLOCKING "last LWP parked"
1233  // upcall policy.
1234  //
1235  // The following code is palliative -- it attempts to ensure that our
1236  // process has sufficient LWPs to take advantage of multiple PEs.
1237  // Proper long-term cures include using user-level threads bound to LWPs
1238  // (THR_BOUND) or using LWP-based synchronization.  Note that there is a
1239  // slight timing window with respect to sampling _os_thread_count, but
1240  // the race is benign.  Also, we should periodically recompute
1241  // _processors_online as the min of SC_NPROCESSORS_ONLN and the
1242  // the number of PEs in our partition.  You might be tempted to use
1243  // THR_NEW_LWP here, but I'd recommend against it as that could
1244  // result in undesirable growth of the libthread's LWP pool.
1245  // The fix below isn't sufficient; for instance, it doesn't take into count
1246  // LWPs parked on IO.  It does, however, help certain CPU-bound benchmarks.
1247  //
1248  // Some pathologies this scheme doesn't handle:
1249  // *  Threads can block, releasing the LWPs.  The LWPs can age out.
1250  //    When a large number of threads become ready again there aren't
1251  //    enough LWPs available to service them.  This can occur when the
1252  //    number of ready threads oscillates.
1253  // *  LWPs/Threads park on IO, thus taking the LWP out of circulation.
1254  //
1255  // Finally, we should call thr_setconcurrency() periodically to refresh
1256  // the LWP pool and thwart the LWP age-out mechanism.
1257  // The "+3" term provides a little slop -- we want to slightly overprovision.
1258
1259  if (AdjustConcurrency && os::Solaris::_os_thread_count < (_processors_online+3)) {
1260    if (!(flags & THR_BOUND)) {
1261      thr_setconcurrency (os::Solaris::_os_thread_count);       // avoid starvation
1262    }
1263  }
1264  // Although this doesn't hurt, we should warn of undefined behavior
1265  // when using unbound T1 threads with schedctl().  This should never
1266  // happen, as the compiler and VM threads are always created bound
1267  DEBUG_ONLY(
1268      if ((VMThreadHintNoPreempt || CompilerThreadHintNoPreempt) &&
1269          (!os::Solaris::T2_libthread() && (!(flags & THR_BOUND))) &&
1270          ((thr_type == vm_thread) || (thr_type == cgc_thread) ||
1271           (thr_type == pgc_thread) || (thr_type == compiler_thread && BackgroundCompilation))) {
1272         warning("schedctl behavior undefined when Compiler/VM/GC Threads are Unbound");
1273      }
1274  );
1275
1276
1277  // Mark that we don't have an lwp or thread id yet.
1278  // In case we attempt to set the priority before the thread starts.
1279  osthread->set_lwp_id(-1);
1280  osthread->set_thread_id(-1);
1281
1282  status = thr_create(NULL, stack_size, java_start, thread, flags, &tid);
1283  if (status != 0) {
1284    if (PrintMiscellaneous && (Verbose || WizardMode)) {
1285      perror("os::create_thread");
1286    }
1287    thread->set_osthread(NULL);
1288    // Need to clean up stuff we've allocated so far
1289    delete osthread;
1290    return false;
1291  }
1292
1293  Atomic::inc(&os::Solaris::_os_thread_count);
1294
1295  // Store info on the Solaris thread into the OSThread
1296  osthread->set_thread_id(tid);
1297
1298  // Remember that we created this thread so we can set priority on it
1299  osthread->set_vm_created();
1300
1301  // Set the default thread priority otherwise use NormalPriority
1302
1303  if ( UseThreadPriorities ) {
1304     thr_setprio(tid, (DefaultThreadPriority == -1) ?
1305                        java_to_os_priority[NormPriority] :
1306                        DefaultThreadPriority);
1307  }
1308
1309  // Initial thread state is INITIALIZED, not SUSPENDED
1310  osthread->set_state(INITIALIZED);
1311
1312  // The thread is returned suspended (in state INITIALIZED), and is started higher up in the call chain
1313  return true;
1314}
1315
1316/* defined for >= Solaris 10. This allows builds on earlier versions
1317 *  of Solaris to take advantage of the newly reserved Solaris JVM signals
1318 *  With SIGJVM1, SIGJVM2, INTERRUPT_SIGNAL is SIGJVM1, ASYNC_SIGNAL is SIGJVM2
1319 *  and -XX:+UseAltSigs does nothing since these should have no conflict
1320 */
1321#if !defined(SIGJVM1)
1322#define SIGJVM1 39
1323#define SIGJVM2 40
1324#endif
1325
1326debug_only(static bool signal_sets_initialized = false);
1327static sigset_t unblocked_sigs, vm_sigs, allowdebug_blocked_sigs;
1328int os::Solaris::_SIGinterrupt = INTERRUPT_SIGNAL;
1329int os::Solaris::_SIGasync = ASYNC_SIGNAL;
1330
1331bool os::Solaris::is_sig_ignored(int sig) {
1332      struct sigaction oact;
1333      sigaction(sig, (struct sigaction*)NULL, &oact);
1334      void* ohlr = oact.sa_sigaction ? CAST_FROM_FN_PTR(void*,  oact.sa_sigaction)
1335                                     : CAST_FROM_FN_PTR(void*,  oact.sa_handler);
1336      if (ohlr == CAST_FROM_FN_PTR(void*, SIG_IGN))
1337           return true;
1338      else
1339           return false;
1340}
1341
1342// Note: SIGRTMIN is a macro that calls sysconf() so it will
1343// dynamically detect SIGRTMIN value for the system at runtime, not buildtime
1344static bool isJVM1available() {
1345  return SIGJVM1 < SIGRTMIN;
1346}
1347
1348void os::Solaris::signal_sets_init() {
1349  // Should also have an assertion stating we are still single-threaded.
1350  assert(!signal_sets_initialized, "Already initialized");
1351  // Fill in signals that are necessarily unblocked for all threads in
1352  // the VM. Currently, we unblock the following signals:
1353  // SHUTDOWN{1,2,3}_SIGNAL: for shutdown hooks support (unless over-ridden
1354  //                         by -Xrs (=ReduceSignalUsage));
1355  // BREAK_SIGNAL which is unblocked only by the VM thread and blocked by all
1356  // other threads. The "ReduceSignalUsage" boolean tells us not to alter
1357  // the dispositions or masks wrt these signals.
1358  // Programs embedding the VM that want to use the above signals for their
1359  // own purposes must, at this time, use the "-Xrs" option to prevent
1360  // interference with shutdown hooks and BREAK_SIGNAL thread dumping.
1361  // (See bug 4345157, and other related bugs).
1362  // In reality, though, unblocking these signals is really a nop, since
1363  // these signals are not blocked by default.
1364  sigemptyset(&unblocked_sigs);
1365  sigemptyset(&allowdebug_blocked_sigs);
1366  sigaddset(&unblocked_sigs, SIGILL);
1367  sigaddset(&unblocked_sigs, SIGSEGV);
1368  sigaddset(&unblocked_sigs, SIGBUS);
1369  sigaddset(&unblocked_sigs, SIGFPE);
1370
1371  if (isJVM1available) {
1372    os::Solaris::set_SIGinterrupt(SIGJVM1);
1373    os::Solaris::set_SIGasync(SIGJVM2);
1374  } else if (UseAltSigs) {
1375    os::Solaris::set_SIGinterrupt(ALT_INTERRUPT_SIGNAL);
1376    os::Solaris::set_SIGasync(ALT_ASYNC_SIGNAL);
1377  } else {
1378    os::Solaris::set_SIGinterrupt(INTERRUPT_SIGNAL);
1379    os::Solaris::set_SIGasync(ASYNC_SIGNAL);
1380  }
1381
1382  sigaddset(&unblocked_sigs, os::Solaris::SIGinterrupt());
1383  sigaddset(&unblocked_sigs, os::Solaris::SIGasync());
1384
1385  if (!ReduceSignalUsage) {
1386   if (!os::Solaris::is_sig_ignored(SHUTDOWN1_SIGNAL)) {
1387      sigaddset(&unblocked_sigs, SHUTDOWN1_SIGNAL);
1388      sigaddset(&allowdebug_blocked_sigs, SHUTDOWN1_SIGNAL);
1389   }
1390   if (!os::Solaris::is_sig_ignored(SHUTDOWN2_SIGNAL)) {
1391      sigaddset(&unblocked_sigs, SHUTDOWN2_SIGNAL);
1392      sigaddset(&allowdebug_blocked_sigs, SHUTDOWN2_SIGNAL);
1393   }
1394   if (!os::Solaris::is_sig_ignored(SHUTDOWN3_SIGNAL)) {
1395      sigaddset(&unblocked_sigs, SHUTDOWN3_SIGNAL);
1396      sigaddset(&allowdebug_blocked_sigs, SHUTDOWN3_SIGNAL);
1397   }
1398  }
1399  // Fill in signals that are blocked by all but the VM thread.
1400  sigemptyset(&vm_sigs);
1401  if (!ReduceSignalUsage)
1402    sigaddset(&vm_sigs, BREAK_SIGNAL);
1403  debug_only(signal_sets_initialized = true);
1404
1405  // For diagnostics only used in run_periodic_checks
1406  sigemptyset(&check_signal_done);
1407}
1408
1409// These are signals that are unblocked while a thread is running Java.
1410// (For some reason, they get blocked by default.)
1411sigset_t* os::Solaris::unblocked_signals() {
1412  assert(signal_sets_initialized, "Not initialized");
1413  return &unblocked_sigs;
1414}
1415
1416// These are the signals that are blocked while a (non-VM) thread is
1417// running Java. Only the VM thread handles these signals.
1418sigset_t* os::Solaris::vm_signals() {
1419  assert(signal_sets_initialized, "Not initialized");
1420  return &vm_sigs;
1421}
1422
1423// These are signals that are blocked during cond_wait to allow debugger in
1424sigset_t* os::Solaris::allowdebug_blocked_signals() {
1425  assert(signal_sets_initialized, "Not initialized");
1426  return &allowdebug_blocked_sigs;
1427}
1428
1429// First crack at OS-specific initialization, from inside the new thread.
1430void os::initialize_thread() {
1431  int r = thr_main() ;
1432  guarantee (r == 0 || r == 1, "CR6501650 or CR6493689") ;
1433  if (r) {
1434    JavaThread* jt = (JavaThread *)Thread::current();
1435    assert(jt != NULL,"Sanity check");
1436    size_t stack_size;
1437    address base = jt->stack_base();
1438    if (Arguments::created_by_java_launcher()) {
1439      // Use 2MB to allow for Solaris 7 64 bit mode.
1440      stack_size = JavaThread::stack_size_at_create() == 0
1441        ? 2048*K : JavaThread::stack_size_at_create();
1442
1443      // There are rare cases when we may have already used more than
1444      // the basic stack size allotment before this method is invoked.
1445      // Attempt to allow for a normally sized java_stack.
1446      size_t current_stack_offset = (size_t)(base - (address)&stack_size);
1447      stack_size += ReservedSpace::page_align_size_down(current_stack_offset);
1448    } else {
1449      // 6269555: If we were not created by a Java launcher, i.e. if we are
1450      // running embedded in a native application, treat the primordial thread
1451      // as much like a native attached thread as possible.  This means using
1452      // the current stack size from thr_stksegment(), unless it is too large
1453      // to reliably setup guard pages.  A reasonable max size is 8MB.
1454      size_t current_size = current_stack_size();
1455      // This should never happen, but just in case....
1456      if (current_size == 0) current_size = 2 * K * K;
1457      stack_size = current_size > (8 * K * K) ? (8 * K * K) : current_size;
1458    }
1459    address bottom = (address)align_size_up((intptr_t)(base - stack_size), os::vm_page_size());;
1460    stack_size = (size_t)(base - bottom);
1461
1462    assert(stack_size > 0, "Stack size calculation problem");
1463
1464    if (stack_size > jt->stack_size()) {
1465      NOT_PRODUCT(
1466        struct rlimit limits;
1467        getrlimit(RLIMIT_STACK, &limits);
1468        size_t size = adjust_stack_size(base, (size_t)limits.rlim_cur);
1469        assert(size >= jt->stack_size(), "Stack size problem in main thread");
1470      )
1471      tty->print_cr(
1472        "Stack size of %d Kb exceeds current limit of %d Kb.\n"
1473        "(Stack sizes are rounded up to a multiple of the system page size.)\n"
1474        "See limit(1) to increase the stack size limit.",
1475        stack_size / K, jt->stack_size() / K);
1476      vm_exit(1);
1477    }
1478    assert(jt->stack_size() >= stack_size,
1479          "Attempt to map more stack than was allocated");
1480    jt->set_stack_size(stack_size);
1481  }
1482
1483   // 5/22/01: Right now alternate signal stacks do not handle
1484   // throwing stack overflow exceptions, see bug 4463178
1485   // Until a fix is found for this, T2 will NOT imply alternate signal
1486   // stacks.
1487   // If using T2 libthread threads, install an alternate signal stack.
1488   // Because alternate stacks associate with LWPs on Solaris,
1489   // see sigaltstack(2), if using UNBOUND threads, or if UseBoundThreads
1490   // we prefer to explicitly stack bang.
1491   // If not using T2 libthread, but using UseBoundThreads any threads
1492   // (primordial thread, jni_attachCurrentThread) we do not create,
1493   // probably are not bound, therefore they can not have an alternate
1494   // signal stack. Since our stack banging code is generated and
1495   // is shared across threads, all threads must be bound to allow
1496   // using alternate signal stacks.  The alternative is to interpose
1497   // on _lwp_create to associate an alt sig stack with each LWP,
1498   // and this could be a problem when the JVM is embedded.
1499   // We would prefer to use alternate signal stacks with T2
1500   // Since there is currently no accurate way to detect T2
1501   // we do not. Assuming T2 when running T1 causes sig 11s or assertions
1502   // on installing alternate signal stacks
1503
1504
1505   // 05/09/03: removed alternate signal stack support for Solaris
1506   // The alternate signal stack mechanism is no longer needed to
1507   // handle stack overflow. This is now handled by allocating
1508   // guard pages (red zone) and stackbanging.
1509   // Initially the alternate signal stack mechanism was removed because
1510   // it did not work with T1 llibthread. Alternate
1511   // signal stacks MUST have all threads bound to lwps. Applications
1512   // can create their own threads and attach them without their being
1513   // bound under T1. This is frequently the case for the primordial thread.
1514   // If we were ever to reenable this mechanism we would need to
1515   // use the dynamic check for T2 libthread.
1516
1517  os::Solaris::init_thread_fpu_state();
1518}
1519
1520
1521
1522// Free Solaris resources related to the OSThread
1523void os::free_thread(OSThread* osthread) {
1524  assert(osthread != NULL, "os::free_thread but osthread not set");
1525
1526
1527  // We are told to free resources of the argument thread,
1528  // but we can only really operate on the current thread.
1529  // The main thread must take the VMThread down synchronously
1530  // before the main thread exits and frees up CodeHeap
1531  guarantee((Thread::current()->osthread() == osthread
1532     || (osthread == VMThread::vm_thread()->osthread())), "os::free_thread but not current thread");
1533  if (Thread::current()->osthread() == osthread) {
1534    // Restore caller's signal mask
1535    sigset_t sigmask = osthread->caller_sigmask();
1536    thr_sigsetmask(SIG_SETMASK, &sigmask, NULL);
1537  }
1538  delete osthread;
1539}
1540
1541void os::pd_start_thread(Thread* thread) {
1542  int status = thr_continue(thread->osthread()->thread_id());
1543  assert_status(status == 0, status, "thr_continue failed");
1544}
1545
1546
1547intx os::current_thread_id() {
1548  return (intx)thr_self();
1549}
1550
1551static pid_t _initial_pid = 0;
1552
1553int os::current_process_id() {
1554  return (int)(_initial_pid ? _initial_pid : getpid());
1555}
1556
1557int os::allocate_thread_local_storage() {
1558  // %%%       in Win32 this allocates a memory segment pointed to by a
1559  //           register.  Dan Stein can implement a similar feature in
1560  //           Solaris.  Alternatively, the VM can do the same thing
1561  //           explicitly: malloc some storage and keep the pointer in a
1562  //           register (which is part of the thread's context) (or keep it
1563  //           in TLS).
1564  // %%%       In current versions of Solaris, thr_self and TSD can
1565  //           be accessed via short sequences of displaced indirections.
1566  //           The value of thr_self is available as %g7(36).
1567  //           The value of thr_getspecific(k) is stored in %g7(12)(4)(k*4-4),
1568  //           assuming that the current thread already has a value bound to k.
1569  //           It may be worth experimenting with such access patterns,
1570  //           and later having the parameters formally exported from a Solaris
1571  //           interface.  I think, however, that it will be faster to
1572  //           maintain the invariant that %g2 always contains the
1573  //           JavaThread in Java code, and have stubs simply
1574  //           treat %g2 as a caller-save register, preserving it in a %lN.
1575  thread_key_t tk;
1576  if (thr_keycreate( &tk, NULL ) )
1577    fatal1("os::allocate_thread_local_storage: thr_keycreate failed (%s)", strerror(errno));
1578  return int(tk);
1579}
1580
1581void os::free_thread_local_storage(int index) {
1582  // %%% don't think we need anything here
1583  // if ( pthread_key_delete((pthread_key_t) tk) )
1584  //   fatal("os::free_thread_local_storage: pthread_key_delete failed");
1585}
1586
1587#define SMALLINT 32   // libthread allocate for tsd_common is a version specific
1588                      // small number - point is NO swap space available
1589void os::thread_local_storage_at_put(int index, void* value) {
1590  // %%% this is used only in threadLocalStorage.cpp
1591  if (thr_setspecific((thread_key_t)index, value)) {
1592    if (errno == ENOMEM) {
1593       vm_exit_out_of_memory(SMALLINT, "thr_setspecific: out of swap space");
1594    } else {
1595      fatal1("os::thread_local_storage_at_put: thr_setspecific failed (%s)", strerror(errno));
1596    }
1597  } else {
1598      ThreadLocalStorage::set_thread_in_slot ((Thread *) value) ;
1599  }
1600}
1601
1602// This function could be called before TLS is initialized, for example, when
1603// VM receives an async signal or when VM causes a fatal error during
1604// initialization. Return NULL if thr_getspecific() fails.
1605void* os::thread_local_storage_at(int index) {
1606  // %%% this is used only in threadLocalStorage.cpp
1607  void* r = NULL;
1608  return thr_getspecific((thread_key_t)index, &r) != 0 ? NULL : r;
1609}
1610
1611
1612const int NANOSECS_PER_MILLISECS = 1000000;
1613// gethrtime can move backwards if read from one cpu and then a different cpu
1614// getTimeNanos is guaranteed to not move backward on Solaris
1615// local spinloop created as faster for a CAS on an int than
1616// a CAS on a 64bit jlong. Also Atomic::cmpxchg for jlong is not
1617// supported on sparc v8 or pre supports_cx8 intel boxes.
1618// oldgetTimeNanos for systems which do not support CAS on 64bit jlong
1619// i.e. sparc v8 and pre supports_cx8 (i486) intel boxes
1620inline hrtime_t oldgetTimeNanos() {
1621  int gotlock = LOCK_INVALID;
1622  hrtime_t newtime = gethrtime();
1623
1624  for (;;) {
1625// grab lock for max_hrtime
1626    int curlock = max_hrtime_lock;
1627    if (curlock & LOCK_BUSY)  continue;
1628    if (gotlock = Atomic::cmpxchg(LOCK_BUSY, &max_hrtime_lock, LOCK_FREE) != LOCK_FREE) continue;
1629    if (newtime > max_hrtime) {
1630      max_hrtime = newtime;
1631    } else {
1632      newtime = max_hrtime;
1633    }
1634    // release lock
1635    max_hrtime_lock = LOCK_FREE;
1636    return newtime;
1637  }
1638}
1639// gethrtime can move backwards if read from one cpu and then a different cpu
1640// getTimeNanos is guaranteed to not move backward on Solaris
1641inline hrtime_t getTimeNanos() {
1642  if (VM_Version::supports_cx8()) {
1643    bool retry = false;
1644    hrtime_t newtime = gethrtime();
1645    hrtime_t oldmaxtime = max_hrtime;
1646    hrtime_t retmaxtime = oldmaxtime;
1647    while ((newtime > retmaxtime) && (retry == false || retmaxtime != oldmaxtime)) {
1648      oldmaxtime = retmaxtime;
1649      retmaxtime = Atomic::cmpxchg(newtime, (volatile jlong *)&max_hrtime, oldmaxtime);
1650      retry = true;
1651    }
1652    return (newtime > retmaxtime) ? newtime : retmaxtime;
1653  } else {
1654    return oldgetTimeNanos();
1655  }
1656}
1657
1658// Time since start-up in seconds to a fine granularity.
1659// Used by VMSelfDestructTimer and the MemProfiler.
1660double os::elapsedTime() {
1661  return (double)(getTimeNanos() - first_hrtime) / (double)hrtime_hz;
1662}
1663
1664jlong os::elapsed_counter() {
1665  return (jlong)(getTimeNanos() - first_hrtime);
1666}
1667
1668jlong os::elapsed_frequency() {
1669   return hrtime_hz;
1670}
1671
1672// Return the real, user, and system times in seconds from an
1673// arbitrary fixed point in the past.
1674bool os::getTimesSecs(double* process_real_time,
1675                  double* process_user_time,
1676                  double* process_system_time) {
1677  struct tms ticks;
1678  clock_t real_ticks = times(&ticks);
1679
1680  if (real_ticks == (clock_t) (-1)) {
1681    return false;
1682  } else {
1683    double ticks_per_second = (double) clock_tics_per_sec;
1684    *process_user_time = ((double) ticks.tms_utime) / ticks_per_second;
1685    *process_system_time = ((double) ticks.tms_stime) / ticks_per_second;
1686    // For consistency return the real time from getTimeNanos()
1687    // converted to seconds.
1688    *process_real_time = ((double) getTimeNanos()) / ((double) NANOUNITS);
1689
1690    return true;
1691  }
1692}
1693
1694// Used internally for comparisons only
1695// getTimeMillis guaranteed to not move backwards on Solaris
1696jlong getTimeMillis() {
1697  jlong nanotime = getTimeNanos();
1698  return (jlong)(nanotime / NANOSECS_PER_MILLISECS);
1699}
1700
1701// Must return millis since Jan 1 1970 for JVM_CurrentTimeMillis
1702jlong os::javaTimeMillis() {
1703  timeval t;
1704  if (gettimeofday( &t, NULL) == -1)
1705    fatal1("os::javaTimeMillis: gettimeofday (%s)", strerror(errno));
1706  return jlong(t.tv_sec) * 1000  +  jlong(t.tv_usec) / 1000;
1707}
1708
1709jlong os::javaTimeNanos() {
1710  return (jlong)getTimeNanos();
1711}
1712
1713void os::javaTimeNanos_info(jvmtiTimerInfo *info_ptr) {
1714  info_ptr->max_value = ALL_64_BITS;      // gethrtime() uses all 64 bits
1715  info_ptr->may_skip_backward = false;    // not subject to resetting or drifting
1716  info_ptr->may_skip_forward = false;     // not subject to resetting or drifting
1717  info_ptr->kind = JVMTI_TIMER_ELAPSED;   // elapsed not CPU time
1718}
1719
1720char * os::local_time_string(char *buf, size_t buflen) {
1721  struct tm t;
1722  time_t long_time;
1723  time(&long_time);
1724  localtime_r(&long_time, &t);
1725  jio_snprintf(buf, buflen, "%d-%02d-%02d %02d:%02d:%02d",
1726               t.tm_year + 1900, t.tm_mon + 1, t.tm_mday,
1727               t.tm_hour, t.tm_min, t.tm_sec);
1728  return buf;
1729}
1730
1731// Note: os::shutdown() might be called very early during initialization, or
1732// called from signal handler. Before adding something to os::shutdown(), make
1733// sure it is async-safe and can handle partially initialized VM.
1734void os::shutdown() {
1735
1736  // allow PerfMemory to attempt cleanup of any persistent resources
1737  perfMemory_exit();
1738
1739  // needs to remove object in file system
1740  AttachListener::abort();
1741
1742  // flush buffered output, finish log files
1743  ostream_abort();
1744
1745  // Check for abort hook
1746  abort_hook_t abort_hook = Arguments::abort_hook();
1747  if (abort_hook != NULL) {
1748    abort_hook();
1749  }
1750}
1751
1752// Note: os::abort() might be called very early during initialization, or
1753// called from signal handler. Before adding something to os::abort(), make
1754// sure it is async-safe and can handle partially initialized VM.
1755void os::abort(bool dump_core) {
1756  os::shutdown();
1757  if (dump_core) {
1758#ifndef PRODUCT
1759    fdStream out(defaultStream::output_fd());
1760    out.print_raw("Current thread is ");
1761    char buf[16];
1762    jio_snprintf(buf, sizeof(buf), UINTX_FORMAT, os::current_thread_id());
1763    out.print_raw_cr(buf);
1764    out.print_raw_cr("Dumping core ...");
1765#endif
1766    ::abort(); // dump core (for debugging)
1767  }
1768
1769  ::exit(1);
1770}
1771
1772// Die immediately, no exit hook, no abort hook, no cleanup.
1773void os::die() {
1774  _exit(-1);
1775}
1776
1777// unused
1778void os::set_error_file(const char *logfile) {}
1779
1780// DLL functions
1781
1782const char* os::dll_file_extension() { return ".so"; }
1783
1784const char* os::get_temp_directory() { return "/tmp/"; }
1785
1786const char* os::get_current_directory(char *buf, int buflen) {
1787  return getcwd(buf, buflen);
1788}
1789
1790// check if addr is inside libjvm[_g].so
1791bool os::address_is_in_vm(address addr) {
1792  static address libjvm_base_addr;
1793  Dl_info dlinfo;
1794
1795  if (libjvm_base_addr == NULL) {
1796    dladdr(CAST_FROM_FN_PTR(void *, os::address_is_in_vm), &dlinfo);
1797    libjvm_base_addr = (address)dlinfo.dli_fbase;
1798    assert(libjvm_base_addr !=NULL, "Cannot obtain base address for libjvm");
1799  }
1800
1801  if (dladdr((void *)addr, &dlinfo)) {
1802    if (libjvm_base_addr == (address)dlinfo.dli_fbase) return true;
1803  }
1804
1805  return false;
1806}
1807
1808typedef int (*dladdr1_func_type) (void *, Dl_info *, void **, int);
1809static dladdr1_func_type dladdr1_func = NULL;
1810
1811bool os::dll_address_to_function_name(address addr, char *buf,
1812                                      int buflen, int * offset) {
1813  Dl_info dlinfo;
1814
1815  // dladdr1_func was initialized in os::init()
1816  if (dladdr1_func){
1817      // yes, we have dladdr1
1818
1819      // Support for dladdr1 is checked at runtime; it may be
1820      // available even if the vm is built on a machine that does
1821      // not have dladdr1 support.  Make sure there is a value for
1822      // RTLD_DL_SYMENT.
1823      #ifndef RTLD_DL_SYMENT
1824      #define RTLD_DL_SYMENT 1
1825      #endif
1826      Sym * info;
1827      if (dladdr1_func((void *)addr, &dlinfo, (void **)&info,
1828                       RTLD_DL_SYMENT)) {
1829          if (buf) jio_snprintf(buf, buflen, "%s", dlinfo.dli_sname);
1830          if (offset) *offset = addr - (address)dlinfo.dli_saddr;
1831
1832          // check if the returned symbol really covers addr
1833          return ((char *)dlinfo.dli_saddr + info->st_size > (char *)addr);
1834      } else {
1835          if (buf) buf[0] = '\0';
1836          if (offset) *offset  = -1;
1837          return false;
1838      }
1839  } else {
1840      // no, only dladdr is available
1841      if(dladdr((void *)addr, &dlinfo)) {
1842          if (buf) jio_snprintf(buf, buflen, dlinfo.dli_sname);
1843          if (offset) *offset = addr - (address)dlinfo.dli_saddr;
1844          return true;
1845      } else {
1846          if (buf) buf[0] = '\0';
1847          if (offset) *offset  = -1;
1848          return false;
1849      }
1850  }
1851}
1852
1853bool os::dll_address_to_library_name(address addr, char* buf,
1854                                     int buflen, int* offset) {
1855  Dl_info dlinfo;
1856
1857  if (dladdr((void*)addr, &dlinfo)){
1858     if (buf) jio_snprintf(buf, buflen, "%s", dlinfo.dli_fname);
1859     if (offset) *offset = addr - (address)dlinfo.dli_fbase;
1860     return true;
1861  } else {
1862     if (buf) buf[0] = '\0';
1863     if (offset) *offset = -1;
1864     return false;
1865  }
1866}
1867
1868// Prints the names and full paths of all opened dynamic libraries
1869// for current process
1870void os::print_dll_info(outputStream * st) {
1871    Dl_info dli;
1872    void *handle;
1873    Link_map *map;
1874    Link_map *p;
1875
1876    st->print_cr("Dynamic libraries:"); st->flush();
1877
1878    if (!dladdr(CAST_FROM_FN_PTR(void *, os::print_dll_info), &dli)) {
1879        st->print_cr("Error: Cannot print dynamic libraries.");
1880        return;
1881    }
1882    handle = dlopen(dli.dli_fname, RTLD_LAZY);
1883    if (handle == NULL) {
1884        st->print_cr("Error: Cannot print dynamic libraries.");
1885        return;
1886    }
1887    dlinfo(handle, RTLD_DI_LINKMAP, &map);
1888    if (map == NULL) {
1889        st->print_cr("Error: Cannot print dynamic libraries.");
1890        return;
1891    }
1892
1893    while (map->l_prev != NULL)
1894        map = map->l_prev;
1895
1896    while (map != NULL) {
1897        st->print_cr(PTR_FORMAT " \t%s", map->l_addr, map->l_name);
1898        map = map->l_next;
1899    }
1900
1901    dlclose(handle);
1902}
1903
1904  // Loads .dll/.so and
1905  // in case of error it checks if .dll/.so was built for the
1906  // same architecture as Hotspot is running on
1907
1908void * os::dll_load(const char *filename, char *ebuf, int ebuflen)
1909{
1910  void * result= ::dlopen(filename, RTLD_LAZY);
1911  if (result != NULL) {
1912    // Successful loading
1913    return result;
1914  }
1915
1916  Elf32_Ehdr elf_head;
1917
1918  // Read system error message into ebuf
1919  // It may or may not be overwritten below
1920  ::strncpy(ebuf, ::dlerror(), ebuflen-1);
1921  ebuf[ebuflen-1]='\0';
1922  int diag_msg_max_length=ebuflen-strlen(ebuf);
1923  char* diag_msg_buf=ebuf+strlen(ebuf);
1924
1925  if (diag_msg_max_length==0) {
1926    // No more space in ebuf for additional diagnostics message
1927    return NULL;
1928  }
1929
1930
1931  int file_descriptor= ::open(filename, O_RDONLY | O_NONBLOCK);
1932
1933  if (file_descriptor < 0) {
1934    // Can't open library, report dlerror() message
1935    return NULL;
1936  }
1937
1938  bool failed_to_read_elf_head=
1939    (sizeof(elf_head)!=
1940        (::read(file_descriptor, &elf_head,sizeof(elf_head)))) ;
1941
1942  ::close(file_descriptor);
1943  if (failed_to_read_elf_head) {
1944    // file i/o error - report dlerror() msg
1945    return NULL;
1946  }
1947
1948  typedef struct {
1949    Elf32_Half  code;         // Actual value as defined in elf.h
1950    Elf32_Half  compat_class; // Compatibility of archs at VM's sense
1951    char        elf_class;    // 32 or 64 bit
1952    char        endianess;    // MSB or LSB
1953    char*       name;         // String representation
1954  } arch_t;
1955
1956  static const arch_t arch_array[]={
1957    {EM_386,         EM_386,     ELFCLASS32, ELFDATA2LSB, (char*)"IA 32"},
1958    {EM_486,         EM_386,     ELFCLASS32, ELFDATA2LSB, (char*)"IA 32"},
1959    {EM_IA_64,       EM_IA_64,   ELFCLASS64, ELFDATA2LSB, (char*)"IA 64"},
1960    {EM_X86_64,      EM_X86_64,  ELFCLASS64, ELFDATA2LSB, (char*)"AMD 64"},
1961    {EM_SPARC,       EM_SPARC,   ELFCLASS32, ELFDATA2MSB, (char*)"Sparc 32"},
1962    {EM_SPARC32PLUS, EM_SPARC,   ELFCLASS32, ELFDATA2MSB, (char*)"Sparc 32"},
1963    {EM_SPARCV9,     EM_SPARCV9, ELFCLASS64, ELFDATA2MSB, (char*)"Sparc v9 64"},
1964    {EM_PPC,         EM_PPC,     ELFCLASS32, ELFDATA2MSB, (char*)"Power PC 32"},
1965    {EM_PPC64,       EM_PPC64,   ELFCLASS64, ELFDATA2MSB, (char*)"Power PC 64"}
1966  };
1967
1968  #if  (defined IA32)
1969    static  Elf32_Half running_arch_code=EM_386;
1970  #elif   (defined AMD64)
1971    static  Elf32_Half running_arch_code=EM_X86_64;
1972  #elif  (defined IA64)
1973    static  Elf32_Half running_arch_code=EM_IA_64;
1974  #elif  (defined __sparc) && (defined _LP64)
1975    static  Elf32_Half running_arch_code=EM_SPARCV9;
1976  #elif  (defined __sparc) && (!defined _LP64)
1977    static  Elf32_Half running_arch_code=EM_SPARC;
1978  #elif  (defined __powerpc64__)
1979    static  Elf32_Half running_arch_code=EM_PPC64;
1980  #elif  (defined __powerpc__)
1981    static  Elf32_Half running_arch_code=EM_PPC;
1982  #else
1983    #error Method os::dll_load requires that one of following is defined:\
1984         IA32, AMD64, IA64, __sparc, __powerpc__
1985  #endif
1986
1987  // Identify compatability class for VM's architecture and library's architecture
1988  // Obtain string descriptions for architectures
1989
1990  arch_t lib_arch={elf_head.e_machine,0,elf_head.e_ident[EI_CLASS], elf_head.e_ident[EI_DATA], NULL};
1991  int running_arch_index=-1;
1992
1993  for (unsigned int i=0 ; i < ARRAY_SIZE(arch_array) ; i++ ) {
1994    if (running_arch_code == arch_array[i].code) {
1995      running_arch_index    = i;
1996    }
1997    if (lib_arch.code == arch_array[i].code) {
1998      lib_arch.compat_class = arch_array[i].compat_class;
1999      lib_arch.name         = arch_array[i].name;
2000    }
2001  }
2002
2003  assert(running_arch_index != -1,
2004    "Didn't find running architecture code (running_arch_code) in arch_array");
2005  if (running_arch_index == -1) {
2006    // Even though running architecture detection failed
2007    // we may still continue with reporting dlerror() message
2008    return NULL;
2009  }
2010
2011  if (lib_arch.endianess != arch_array[running_arch_index].endianess) {
2012    ::snprintf(diag_msg_buf, diag_msg_max_length-1," (Possible cause: endianness mismatch)");
2013    return NULL;
2014  }
2015
2016  if (lib_arch.elf_class != arch_array[running_arch_index].elf_class) {
2017    ::snprintf(diag_msg_buf, diag_msg_max_length-1," (Possible cause: architecture word width mismatch)");
2018    return NULL;
2019  }
2020
2021  if (lib_arch.compat_class != arch_array[running_arch_index].compat_class) {
2022    if ( lib_arch.name!=NULL ) {
2023      ::snprintf(diag_msg_buf, diag_msg_max_length-1,
2024        " (Possible cause: can't load %s-bit .so on a %s-bit platform)",
2025        lib_arch.name, arch_array[running_arch_index].name);
2026    } else {
2027      ::snprintf(diag_msg_buf, diag_msg_max_length-1,
2028      " (Possible cause: can't load this .so (machine code=0x%x) on a %s-bit platform)",
2029        lib_arch.code,
2030        arch_array[running_arch_index].name);
2031    }
2032  }
2033
2034  return NULL;
2035}
2036
2037
2038
2039bool _print_ascii_file(const char* filename, outputStream* st) {
2040  int fd = open(filename, O_RDONLY);
2041  if (fd == -1) {
2042     return false;
2043  }
2044
2045  char buf[32];
2046  int bytes;
2047  while ((bytes = read(fd, buf, sizeof(buf))) > 0) {
2048    st->print_raw(buf, bytes);
2049  }
2050
2051  close(fd);
2052
2053  return true;
2054}
2055
2056void os::print_os_info(outputStream* st) {
2057  st->print("OS:");
2058
2059  if (!_print_ascii_file("/etc/release", st)) {
2060    st->print("Solaris");
2061  }
2062  st->cr();
2063
2064  // kernel
2065  st->print("uname:");
2066  struct utsname name;
2067  uname(&name);
2068  st->print(name.sysname); st->print(" ");
2069  st->print(name.release); st->print(" ");
2070  st->print(name.version); st->print(" ");
2071  st->print(name.machine);
2072
2073  // libthread
2074  if (os::Solaris::T2_libthread()) st->print("  (T2 libthread)");
2075  else st->print("  (T1 libthread)");
2076  st->cr();
2077
2078  // rlimit
2079  st->print("rlimit:");
2080  struct rlimit rlim;
2081
2082  st->print(" STACK ");
2083  getrlimit(RLIMIT_STACK, &rlim);
2084  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2085  else st->print("%uk", rlim.rlim_cur >> 10);
2086
2087  st->print(", CORE ");
2088  getrlimit(RLIMIT_CORE, &rlim);
2089  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2090  else st->print("%uk", rlim.rlim_cur >> 10);
2091
2092  st->print(", NOFILE ");
2093  getrlimit(RLIMIT_NOFILE, &rlim);
2094  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2095  else st->print("%d", rlim.rlim_cur);
2096
2097  st->print(", AS ");
2098  getrlimit(RLIMIT_AS, &rlim);
2099  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2100  else st->print("%uk", rlim.rlim_cur >> 10);
2101  st->cr();
2102
2103  // load average
2104  st->print("load average:");
2105  double loadavg[3];
2106  os::loadavg(loadavg, 3);
2107  st->print("%0.02f %0.02f %0.02f", loadavg[0], loadavg[1], loadavg[2]);
2108  st->cr();
2109}
2110
2111
2112static bool check_addr0(outputStream* st) {
2113  jboolean status = false;
2114  int fd = open("/proc/self/map",O_RDONLY);
2115  if (fd >= 0) {
2116    prmap_t p;
2117    while(read(fd, &p, sizeof(p)) > 0) {
2118      if (p.pr_vaddr == 0x0) {
2119        st->print("Warning: Address: 0x%x, Size: %dK, ",p.pr_vaddr, p.pr_size/1024, p.pr_mapname);
2120        st->print("Mapped file: %s, ", p.pr_mapname[0] == '\0' ? "None" : p.pr_mapname);
2121        st->print("Access:");
2122        st->print("%s",(p.pr_mflags & MA_READ)  ? "r" : "-");
2123        st->print("%s",(p.pr_mflags & MA_WRITE) ? "w" : "-");
2124        st->print("%s",(p.pr_mflags & MA_EXEC)  ? "x" : "-");
2125        st->cr();
2126        status = true;
2127      }
2128      close(fd);
2129    }
2130  }
2131  return status;
2132}
2133
2134void os::print_memory_info(outputStream* st) {
2135  st->print("Memory:");
2136  st->print(" %dk page", os::vm_page_size()>>10);
2137  st->print(", physical " UINT64_FORMAT "k", os::physical_memory()>>10);
2138  st->print("(" UINT64_FORMAT "k free)", os::available_memory() >> 10);
2139  st->cr();
2140  (void) check_addr0(st);
2141}
2142
2143// Taken from /usr/include/sys/machsig.h  Supposed to be architecture specific
2144// but they're the same for all the solaris architectures that we support.
2145const char *ill_names[] = { "ILL0", "ILL_ILLOPC", "ILL_ILLOPN", "ILL_ILLADR",
2146                          "ILL_ILLTRP", "ILL_PRVOPC", "ILL_PRVREG",
2147                          "ILL_COPROC", "ILL_BADSTK" };
2148
2149const char *fpe_names[] = { "FPE0", "FPE_INTDIV", "FPE_INTOVF", "FPE_FLTDIV",
2150                          "FPE_FLTOVF", "FPE_FLTUND", "FPE_FLTRES",
2151                          "FPE_FLTINV", "FPE_FLTSUB" };
2152
2153const char *segv_names[] = { "SEGV0", "SEGV_MAPERR", "SEGV_ACCERR" };
2154
2155const char *bus_names[] = { "BUS0", "BUS_ADRALN", "BUS_ADRERR", "BUS_OBJERR" };
2156
2157void os::print_siginfo(outputStream* st, void* siginfo) {
2158  st->print("siginfo:");
2159
2160  const int buflen = 100;
2161  char buf[buflen];
2162  siginfo_t *si = (siginfo_t*)siginfo;
2163  st->print("si_signo=%s: ", os::exception_name(si->si_signo, buf, buflen));
2164  char *err = strerror(si->si_errno);
2165  if (si->si_errno != 0 && err != NULL) {
2166    st->print("si_errno=%s", err);
2167  } else {
2168    st->print("si_errno=%d", si->si_errno);
2169  }
2170  const int c = si->si_code;
2171  assert(c > 0, "unexpected si_code");
2172  switch (si->si_signo) {
2173  case SIGILL:
2174    st->print(", si_code=%d (%s)", c, c > 8 ? "" : ill_names[c]);
2175    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2176    break;
2177  case SIGFPE:
2178    st->print(", si_code=%d (%s)", c, c > 9 ? "" : fpe_names[c]);
2179    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2180    break;
2181  case SIGSEGV:
2182    st->print(", si_code=%d (%s)", c, c > 2 ? "" : segv_names[c]);
2183    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2184    break;
2185  case SIGBUS:
2186    st->print(", si_code=%d (%s)", c, c > 3 ? "" : bus_names[c]);
2187    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2188    break;
2189  default:
2190    st->print(", si_code=%d", si->si_code);
2191    // no si_addr
2192  }
2193
2194  if ((si->si_signo == SIGBUS || si->si_signo == SIGSEGV) &&
2195      UseSharedSpaces) {
2196    FileMapInfo* mapinfo = FileMapInfo::current_info();
2197    if (mapinfo->is_in_shared_space(si->si_addr)) {
2198      st->print("\n\nError accessing class data sharing archive."   \
2199                " Mapped file inaccessible during execution, "      \
2200                " possible disk/network problem.");
2201    }
2202  }
2203  st->cr();
2204}
2205
2206// Moved from whole group, because we need them here for diagnostic
2207// prints.
2208#define OLDMAXSIGNUM 32
2209static int Maxsignum = 0;
2210static int *ourSigFlags = NULL;
2211
2212extern "C" void sigINTRHandler(int, siginfo_t*, void*);
2213
2214int os::Solaris::get_our_sigflags(int sig) {
2215  assert(ourSigFlags!=NULL, "signal data structure not initialized");
2216  assert(sig > 0 && sig < Maxsignum, "vm signal out of expected range");
2217  return ourSigFlags[sig];
2218}
2219
2220void os::Solaris::set_our_sigflags(int sig, int flags) {
2221  assert(ourSigFlags!=NULL, "signal data structure not initialized");
2222  assert(sig > 0 && sig < Maxsignum, "vm signal out of expected range");
2223  ourSigFlags[sig] = flags;
2224}
2225
2226
2227static const char* get_signal_handler_name(address handler,
2228                                           char* buf, int buflen) {
2229  int offset;
2230  bool found = os::dll_address_to_library_name(handler, buf, buflen, &offset);
2231  if (found) {
2232    // skip directory names
2233    const char *p1, *p2;
2234    p1 = buf;
2235    size_t len = strlen(os::file_separator());
2236    while ((p2 = strstr(p1, os::file_separator())) != NULL) p1 = p2 + len;
2237    jio_snprintf(buf, buflen, "%s+0x%x", p1, offset);
2238  } else {
2239    jio_snprintf(buf, buflen, PTR_FORMAT, handler);
2240  }
2241  return buf;
2242}
2243
2244static void print_signal_handler(outputStream* st, int sig,
2245                                  char* buf, size_t buflen) {
2246  struct sigaction sa;
2247
2248  sigaction(sig, NULL, &sa);
2249
2250  st->print("%s: ", os::exception_name(sig, buf, buflen));
2251
2252  address handler = (sa.sa_flags & SA_SIGINFO)
2253                  ? CAST_FROM_FN_PTR(address, sa.sa_sigaction)
2254                  : CAST_FROM_FN_PTR(address, sa.sa_handler);
2255
2256  if (handler == CAST_FROM_FN_PTR(address, SIG_DFL)) {
2257    st->print("SIG_DFL");
2258  } else if (handler == CAST_FROM_FN_PTR(address, SIG_IGN)) {
2259    st->print("SIG_IGN");
2260  } else {
2261    st->print("[%s]", get_signal_handler_name(handler, buf, buflen));
2262  }
2263
2264  st->print(", sa_mask[0]=" PTR32_FORMAT, *(uint32_t*)&sa.sa_mask);
2265
2266  address rh = VMError::get_resetted_sighandler(sig);
2267  // May be, handler was resetted by VMError?
2268  if(rh != NULL) {
2269    handler = rh;
2270    sa.sa_flags = VMError::get_resetted_sigflags(sig);
2271  }
2272
2273  st->print(", sa_flags="   PTR32_FORMAT, sa.sa_flags);
2274
2275  // Check: is it our handler?
2276  if(handler == CAST_FROM_FN_PTR(address, signalHandler) ||
2277     handler == CAST_FROM_FN_PTR(address, sigINTRHandler)) {
2278    // It is our signal handler
2279    // check for flags
2280    if(sa.sa_flags != os::Solaris::get_our_sigflags(sig)) {
2281      st->print(
2282        ", flags was changed from " PTR32_FORMAT ", consider using jsig library",
2283        os::Solaris::get_our_sigflags(sig));
2284    }
2285  }
2286  st->cr();
2287}
2288
2289void os::print_signal_handlers(outputStream* st, char* buf, size_t buflen) {
2290  st->print_cr("Signal Handlers:");
2291  print_signal_handler(st, SIGSEGV, buf, buflen);
2292  print_signal_handler(st, SIGBUS , buf, buflen);
2293  print_signal_handler(st, SIGFPE , buf, buflen);
2294  print_signal_handler(st, SIGPIPE, buf, buflen);
2295  print_signal_handler(st, SIGXFSZ, buf, buflen);
2296  print_signal_handler(st, SIGILL , buf, buflen);
2297  print_signal_handler(st, INTERRUPT_SIGNAL, buf, buflen);
2298  print_signal_handler(st, ASYNC_SIGNAL, buf, buflen);
2299  print_signal_handler(st, BREAK_SIGNAL, buf, buflen);
2300  print_signal_handler(st, SHUTDOWN1_SIGNAL , buf, buflen);
2301  print_signal_handler(st, SHUTDOWN2_SIGNAL , buf, buflen);
2302  print_signal_handler(st, SHUTDOWN3_SIGNAL, buf, buflen);
2303  print_signal_handler(st, os::Solaris::SIGinterrupt(), buf, buflen);
2304  print_signal_handler(st, os::Solaris::SIGasync(), buf, buflen);
2305}
2306
2307static char saved_jvm_path[MAXPATHLEN] = { 0 };
2308
2309// Find the full path to the current module, libjvm.so or libjvm_g.so
2310void os::jvm_path(char *buf, jint buflen) {
2311  // Error checking.
2312  if (buflen < MAXPATHLEN) {
2313    assert(false, "must use a large-enough buffer");
2314    buf[0] = '\0';
2315    return;
2316  }
2317  // Lazy resolve the path to current module.
2318  if (saved_jvm_path[0] != 0) {
2319    strcpy(buf, saved_jvm_path);
2320    return;
2321  }
2322
2323  Dl_info dlinfo;
2324  int ret = dladdr(CAST_FROM_FN_PTR(void *, os::jvm_path), &dlinfo);
2325  assert(ret != 0, "cannot locate libjvm");
2326  realpath((char *)dlinfo.dli_fname, buf);
2327
2328  if (strcmp(Arguments::sun_java_launcher(), "gamma") == 0) {
2329    // Support for the gamma launcher.  Typical value for buf is
2330    // "<JAVA_HOME>/jre/lib/<arch>/<vmtype>/libjvm.so".  If "/jre/lib/" appears at
2331    // the right place in the string, then assume we are installed in a JDK and
2332    // we're done.  Otherwise, check for a JAVA_HOME environment variable and fix
2333    // up the path so it looks like libjvm.so is installed there (append a
2334    // fake suffix hotspot/libjvm.so).
2335    const char *p = buf + strlen(buf) - 1;
2336    for (int count = 0; p > buf && count < 5; ++count) {
2337      for (--p; p > buf && *p != '/'; --p)
2338        /* empty */ ;
2339    }
2340
2341    if (strncmp(p, "/jre/lib/", 9) != 0) {
2342      // Look for JAVA_HOME in the environment.
2343      char* java_home_var = ::getenv("JAVA_HOME");
2344      if (java_home_var != NULL && java_home_var[0] != 0) {
2345        char cpu_arch[12];
2346        sysinfo(SI_ARCHITECTURE, cpu_arch, sizeof(cpu_arch));
2347#ifdef _LP64
2348        // If we are on sparc running a 64-bit vm, look in jre/lib/sparcv9.
2349        if (strcmp(cpu_arch, "sparc") == 0) {
2350          strcat(cpu_arch, "v9");
2351        } else if (strcmp(cpu_arch, "i386") == 0) {
2352          strcpy(cpu_arch, "amd64");
2353        }
2354#endif
2355        // Check the current module name "libjvm.so" or "libjvm_g.so".
2356        p = strrchr(buf, '/');
2357        assert(strstr(p, "/libjvm") == p, "invalid library name");
2358        p = strstr(p, "_g") ? "_g" : "";
2359
2360        realpath(java_home_var, buf);
2361        sprintf(buf + strlen(buf), "/jre/lib/%s", cpu_arch);
2362        if (0 == access(buf, F_OK)) {
2363          // Use current module name "libjvm[_g].so" instead of
2364          // "libjvm"debug_only("_g")".so" since for fastdebug version
2365          // we should have "libjvm.so" but debug_only("_g") adds "_g"!
2366          // It is used when we are choosing the HPI library's name
2367          // "libhpi[_g].so" in hpi::initialize_get_interface().
2368          sprintf(buf + strlen(buf), "/hotspot/libjvm%s.so", p);
2369        } else {
2370          // Go back to path of .so
2371          realpath((char *)dlinfo.dli_fname, buf);
2372        }
2373      }
2374    }
2375  }
2376
2377  strcpy(saved_jvm_path, buf);
2378}
2379
2380
2381void os::print_jni_name_prefix_on(outputStream* st, int args_size) {
2382  // no prefix required, not even "_"
2383}
2384
2385
2386void os::print_jni_name_suffix_on(outputStream* st, int args_size) {
2387  // no suffix required
2388}
2389
2390
2391// sun.misc.Signal
2392
2393extern "C" {
2394  static void UserHandler(int sig, void *siginfo, void *context) {
2395    // Ctrl-C is pressed during error reporting, likely because the error
2396    // handler fails to abort. Let VM die immediately.
2397    if (sig == SIGINT && is_error_reported()) {
2398       os::die();
2399    }
2400
2401    os::signal_notify(sig);
2402    // We do not need to reinstate the signal handler each time...
2403  }
2404}
2405
2406void* os::user_handler() {
2407  return CAST_FROM_FN_PTR(void*, UserHandler);
2408}
2409
2410extern "C" {
2411  typedef void (*sa_handler_t)(int);
2412  typedef void (*sa_sigaction_t)(int, siginfo_t *, void *);
2413}
2414
2415void* os::signal(int signal_number, void* handler) {
2416  struct sigaction sigAct, oldSigAct;
2417  sigfillset(&(sigAct.sa_mask));
2418  sigAct.sa_flags = SA_RESTART & ~SA_RESETHAND;
2419  sigAct.sa_handler = CAST_TO_FN_PTR(sa_handler_t, handler);
2420
2421  if (sigaction(signal_number, &sigAct, &oldSigAct))
2422    // -1 means registration failed
2423    return (void *)-1;
2424
2425  return CAST_FROM_FN_PTR(void*, oldSigAct.sa_handler);
2426}
2427
2428void os::signal_raise(int signal_number) {
2429  raise(signal_number);
2430}
2431
2432/*
2433 * The following code is moved from os.cpp for making this
2434 * code platform specific, which it is by its very nature.
2435 */
2436
2437// a counter for each possible signal value
2438static int Sigexit = 0;
2439static int Maxlibjsigsigs;
2440static jint *pending_signals = NULL;
2441static int *preinstalled_sigs = NULL;
2442static struct sigaction *chainedsigactions = NULL;
2443static sema_t sig_sem;
2444typedef int (*version_getting_t)();
2445version_getting_t os::Solaris::get_libjsig_version = NULL;
2446static int libjsigversion = NULL;
2447
2448int os::sigexitnum_pd() {
2449  assert(Sigexit > 0, "signal memory not yet initialized");
2450  return Sigexit;
2451}
2452
2453void os::Solaris::init_signal_mem() {
2454  // Initialize signal structures
2455  Maxsignum = SIGRTMAX;
2456  Sigexit = Maxsignum+1;
2457  assert(Maxsignum >0, "Unable to obtain max signal number");
2458
2459  Maxlibjsigsigs = Maxsignum;
2460
2461  // pending_signals has one int per signal
2462  // The additional signal is for SIGEXIT - exit signal to signal_thread
2463  pending_signals = (jint *)os::malloc(sizeof(jint) * (Sigexit+1));
2464  memset(pending_signals, 0, (sizeof(jint) * (Sigexit+1)));
2465
2466  if (UseSignalChaining) {
2467     chainedsigactions = (struct sigaction *)malloc(sizeof(struct sigaction)
2468       * (Maxsignum + 1));
2469     memset(chainedsigactions, 0, (sizeof(struct sigaction) * (Maxsignum + 1)));
2470     preinstalled_sigs = (int *)os::malloc(sizeof(int) * (Maxsignum + 1));
2471     memset(preinstalled_sigs, 0, (sizeof(int) * (Maxsignum + 1)));
2472  }
2473  ourSigFlags = (int*)malloc(sizeof(int) * (Maxsignum + 1 ));
2474  memset(ourSigFlags, 0, sizeof(int) * (Maxsignum + 1));
2475}
2476
2477void os::signal_init_pd() {
2478  int ret;
2479
2480  ret = ::sema_init(&sig_sem, 0, NULL, NULL);
2481  assert(ret == 0, "sema_init() failed");
2482}
2483
2484void os::signal_notify(int signal_number) {
2485  int ret;
2486
2487  Atomic::inc(&pending_signals[signal_number]);
2488  ret = ::sema_post(&sig_sem);
2489  assert(ret == 0, "sema_post() failed");
2490}
2491
2492static int check_pending_signals(bool wait_for_signal) {
2493  int ret;
2494  while (true) {
2495    for (int i = 0; i < Sigexit + 1; i++) {
2496      jint n = pending_signals[i];
2497      if (n > 0 && n == Atomic::cmpxchg(n - 1, &pending_signals[i], n)) {
2498        return i;
2499      }
2500    }
2501    if (!wait_for_signal) {
2502      return -1;
2503    }
2504    JavaThread *thread = JavaThread::current();
2505    ThreadBlockInVM tbivm(thread);
2506
2507    bool threadIsSuspended;
2508    do {
2509      thread->set_suspend_equivalent();
2510      // cleared by handle_special_suspend_equivalent_condition() or java_suspend_self()
2511      while((ret = ::sema_wait(&sig_sem)) == EINTR)
2512          ;
2513      assert(ret == 0, "sema_wait() failed");
2514
2515      // were we externally suspended while we were waiting?
2516      threadIsSuspended = thread->handle_special_suspend_equivalent_condition();
2517      if (threadIsSuspended) {
2518        //
2519        // The semaphore has been incremented, but while we were waiting
2520        // another thread suspended us. We don't want to continue running
2521        // while suspended because that would surprise the thread that
2522        // suspended us.
2523        //
2524        ret = ::sema_post(&sig_sem);
2525        assert(ret == 0, "sema_post() failed");
2526
2527        thread->java_suspend_self();
2528      }
2529    } while (threadIsSuspended);
2530  }
2531}
2532
2533int os::signal_lookup() {
2534  return check_pending_signals(false);
2535}
2536
2537int os::signal_wait() {
2538  return check_pending_signals(true);
2539}
2540
2541////////////////////////////////////////////////////////////////////////////////
2542// Virtual Memory
2543
2544static int page_size = -1;
2545
2546// The mmap MAP_ALIGN flag is supported on Solaris 9 and later.  init_2() will
2547// clear this var if support is not available.
2548static bool has_map_align = true;
2549
2550int os::vm_page_size() {
2551  assert(page_size != -1, "must call os::init");
2552  return page_size;
2553}
2554
2555// Solaris allocates memory by pages.
2556int os::vm_allocation_granularity() {
2557  assert(page_size != -1, "must call os::init");
2558  return page_size;
2559}
2560
2561bool os::commit_memory(char* addr, size_t bytes) {
2562  size_t size = bytes;
2563  return
2564     NULL != Solaris::mmap_chunk(addr, size, MAP_PRIVATE|MAP_FIXED,
2565                                 PROT_READ | PROT_WRITE | PROT_EXEC);
2566}
2567
2568bool os::commit_memory(char* addr, size_t bytes, size_t alignment_hint) {
2569  if (commit_memory(addr, bytes)) {
2570    if (UseMPSS && alignment_hint > (size_t)vm_page_size()) {
2571      // If the large page size has been set and the VM
2572      // is using large pages, use the large page size
2573      // if it is smaller than the alignment hint. This is
2574      // a case where the VM wants to use a larger alignment size
2575      // for its own reasons but still want to use large pages
2576      // (which is what matters to setting the mpss range.
2577      size_t page_size = 0;
2578      if (large_page_size() < alignment_hint) {
2579        assert(UseLargePages, "Expected to be here for large page use only");
2580        page_size = large_page_size();
2581      } else {
2582        // If the alignment hint is less than the large page
2583        // size, the VM wants a particular alignment (thus the hint)
2584        // for internal reasons.  Try to set the mpss range using
2585        // the alignment_hint.
2586        page_size = alignment_hint;
2587      }
2588      // Since this is a hint, ignore any failures.
2589      (void)Solaris::set_mpss_range(addr, bytes, page_size);
2590    }
2591    return true;
2592  }
2593  return false;
2594}
2595
2596// Uncommit the pages in a specified region.
2597void os::free_memory(char* addr, size_t bytes) {
2598  if (madvise(addr, bytes, MADV_FREE) < 0) {
2599    debug_only(warning("MADV_FREE failed."));
2600    return;
2601  }
2602}
2603
2604// Change the page size in a given range.
2605void os::realign_memory(char *addr, size_t bytes, size_t alignment_hint) {
2606  assert((intptr_t)addr % alignment_hint == 0, "Address should be aligned.");
2607  assert((intptr_t)(addr + bytes) % alignment_hint == 0, "End should be aligned.");
2608  Solaris::set_mpss_range(addr, bytes, alignment_hint);
2609}
2610
2611// Tell the OS to make the range local to the first-touching LWP
2612void os::numa_make_local(char *addr, size_t bytes, int lgrp_hint) {
2613  assert((intptr_t)addr % os::vm_page_size() == 0, "Address should be page-aligned.");
2614  if (madvise(addr, bytes, MADV_ACCESS_LWP) < 0) {
2615    debug_only(warning("MADV_ACCESS_LWP failed."));
2616  }
2617}
2618
2619// Tell the OS that this range would be accessed from different LWPs.
2620void os::numa_make_global(char *addr, size_t bytes) {
2621  assert((intptr_t)addr % os::vm_page_size() == 0, "Address should be page-aligned.");
2622  if (madvise(addr, bytes, MADV_ACCESS_MANY) < 0) {
2623    debug_only(warning("MADV_ACCESS_MANY failed."));
2624  }
2625}
2626
2627// Get the number of the locality groups.
2628size_t os::numa_get_groups_num() {
2629  size_t n = Solaris::lgrp_nlgrps(Solaris::lgrp_cookie());
2630  return n != -1 ? n : 1;
2631}
2632
2633// Get a list of leaf locality groups. A leaf lgroup is group that
2634// doesn't have any children. Typical leaf group is a CPU or a CPU/memory
2635// board. An LWP is assigned to one of these groups upon creation.
2636size_t os::numa_get_leaf_groups(int *ids, size_t size) {
2637   if ((ids[0] = Solaris::lgrp_root(Solaris::lgrp_cookie())) == -1) {
2638     ids[0] = 0;
2639     return 1;
2640   }
2641   int result_size = 0, top = 1, bottom = 0, cur = 0;
2642   for (int k = 0; k < size; k++) {
2643     int r = Solaris::lgrp_children(Solaris::lgrp_cookie(), ids[cur],
2644                                    (Solaris::lgrp_id_t*)&ids[top], size - top);
2645     if (r == -1) {
2646       ids[0] = 0;
2647       return 1;
2648     }
2649     if (!r) {
2650       // That's a leaf node.
2651       assert (bottom <= cur, "Sanity check");
2652       // Check if the node has memory
2653       if (Solaris::lgrp_resources(Solaris::lgrp_cookie(), ids[cur],
2654                                   NULL, 0, LGRP_RSRC_MEM) > 0) {
2655         ids[bottom++] = ids[cur];
2656       }
2657     }
2658     top += r;
2659     cur++;
2660   }
2661   if (bottom == 0) {
2662     // Handle a situation, when the OS reports no memory available.
2663     // Assume UMA architecture.
2664     ids[0] = 0;
2665     return 1;
2666   }
2667   return bottom;
2668}
2669
2670// Detect the topology change. Typically happens during CPU pluggin-unplugging.
2671bool os::numa_topology_changed() {
2672  int is_stale = Solaris::lgrp_cookie_stale(Solaris::lgrp_cookie());
2673  if (is_stale != -1 && is_stale) {
2674    Solaris::lgrp_fini(Solaris::lgrp_cookie());
2675    Solaris::lgrp_cookie_t c = Solaris::lgrp_init(Solaris::LGRP_VIEW_CALLER);
2676    assert(c != 0, "Failure to initialize LGRP API");
2677    Solaris::set_lgrp_cookie(c);
2678    return true;
2679  }
2680  return false;
2681}
2682
2683// Get the group id of the current LWP.
2684int os::numa_get_group_id() {
2685  int lgrp_id = Solaris::lgrp_home(P_LWPID, P_MYID);
2686  if (lgrp_id == -1) {
2687    return 0;
2688  }
2689  const int size = os::numa_get_groups_num();
2690  int *ids = (int*)alloca(size * sizeof(int));
2691
2692  // Get the ids of all lgroups with memory; r is the count.
2693  int r = Solaris::lgrp_resources(Solaris::lgrp_cookie(), lgrp_id,
2694                                  (Solaris::lgrp_id_t*)ids, size, LGRP_RSRC_MEM);
2695  if (r <= 0) {
2696    return 0;
2697  }
2698  return ids[os::random() % r];
2699}
2700
2701// Request information about the page.
2702bool os::get_page_info(char *start, page_info* info) {
2703  const uint_t info_types[] = { MEMINFO_VLGRP, MEMINFO_VPAGESIZE };
2704  uint64_t addr = (uintptr_t)start;
2705  uint64_t outdata[2];
2706  uint_t validity = 0;
2707
2708  if (os::Solaris::meminfo(&addr, 1, info_types, 2, outdata, &validity) < 0) {
2709    return false;
2710  }
2711
2712  info->size = 0;
2713  info->lgrp_id = -1;
2714
2715  if ((validity & 1) != 0) {
2716    if ((validity & 2) != 0) {
2717      info->lgrp_id = outdata[0];
2718    }
2719    if ((validity & 4) != 0) {
2720      info->size = outdata[1];
2721    }
2722    return true;
2723  }
2724  return false;
2725}
2726
2727// Scan the pages from start to end until a page different than
2728// the one described in the info parameter is encountered.
2729char *os::scan_pages(char *start, char* end, page_info* page_expected, page_info* page_found) {
2730  const uint_t info_types[] = { MEMINFO_VLGRP, MEMINFO_VPAGESIZE };
2731  const size_t types = sizeof(info_types) / sizeof(info_types[0]);
2732  uint64_t addrs[MAX_MEMINFO_CNT], outdata[types * MAX_MEMINFO_CNT];
2733  uint_t validity[MAX_MEMINFO_CNT];
2734
2735  size_t page_size = MAX2((size_t)os::vm_page_size(), page_expected->size);
2736  uint64_t p = (uint64_t)start;
2737  while (p < (uint64_t)end) {
2738    addrs[0] = p;
2739    size_t addrs_count = 1;
2740    while (addrs_count < MAX_MEMINFO_CNT && addrs[addrs_count - 1] < (uint64_t)end) {
2741      addrs[addrs_count] = addrs[addrs_count - 1] + page_size;
2742      addrs_count++;
2743    }
2744
2745    if (os::Solaris::meminfo(addrs, addrs_count, info_types, types, outdata, validity) < 0) {
2746      return NULL;
2747    }
2748
2749    size_t i = 0;
2750    for (; i < addrs_count; i++) {
2751      if ((validity[i] & 1) != 0) {
2752        if ((validity[i] & 4) != 0) {
2753          if (outdata[types * i + 1] != page_expected->size) {
2754            break;
2755          }
2756        } else
2757          if (page_expected->size != 0) {
2758            break;
2759          }
2760
2761        if ((validity[i] & 2) != 0 && page_expected->lgrp_id > 0) {
2762          if (outdata[types * i] != page_expected->lgrp_id) {
2763            break;
2764          }
2765        }
2766      } else {
2767        return NULL;
2768      }
2769    }
2770
2771    if (i != addrs_count) {
2772      if ((validity[i] & 2) != 0) {
2773        page_found->lgrp_id = outdata[types * i];
2774      } else {
2775        page_found->lgrp_id = -1;
2776      }
2777      if ((validity[i] & 4) != 0) {
2778        page_found->size = outdata[types * i + 1];
2779      } else {
2780        page_found->size = 0;
2781      }
2782      return (char*)addrs[i];
2783    }
2784
2785    p = addrs[addrs_count - 1] + page_size;
2786  }
2787  return end;
2788}
2789
2790bool os::uncommit_memory(char* addr, size_t bytes) {
2791  size_t size = bytes;
2792  // Map uncommitted pages PROT_NONE so we fail early if we touch an
2793  // uncommitted page. Otherwise, the read/write might succeed if we
2794  // have enough swap space to back the physical page.
2795  return
2796    NULL != Solaris::mmap_chunk(addr, size,
2797                                MAP_PRIVATE|MAP_FIXED|MAP_NORESERVE,
2798                                PROT_NONE);
2799}
2800
2801char* os::Solaris::mmap_chunk(char *addr, size_t size, int flags, int prot) {
2802  char *b = (char *)mmap(addr, size, prot, flags, os::Solaris::_dev_zero_fd, 0);
2803
2804  if (b == MAP_FAILED) {
2805    return NULL;
2806  }
2807  return b;
2808}
2809
2810char* os::Solaris::anon_mmap(char* requested_addr, size_t bytes, size_t alignment_hint, bool fixed) {
2811  char* addr = requested_addr;
2812  int flags = MAP_PRIVATE | MAP_NORESERVE;
2813
2814  assert(!(fixed && (alignment_hint > 0)), "alignment hint meaningless with fixed mmap");
2815
2816  if (fixed) {
2817    flags |= MAP_FIXED;
2818  } else if (has_map_align && (alignment_hint > (size_t) vm_page_size())) {
2819    flags |= MAP_ALIGN;
2820    addr = (char*) alignment_hint;
2821  }
2822
2823  // Map uncommitted pages PROT_NONE so we fail early if we touch an
2824  // uncommitted page. Otherwise, the read/write might succeed if we
2825  // have enough swap space to back the physical page.
2826  return mmap_chunk(addr, bytes, flags, PROT_NONE);
2827}
2828
2829char* os::reserve_memory(size_t bytes, char* requested_addr, size_t alignment_hint) {
2830  char* addr = Solaris::anon_mmap(requested_addr, bytes, alignment_hint, (requested_addr != NULL));
2831
2832  guarantee(requested_addr == NULL || requested_addr == addr,
2833            "OS failed to return requested mmap address.");
2834  return addr;
2835}
2836
2837// Reserve memory at an arbitrary address, only if that area is
2838// available (and not reserved for something else).
2839
2840char* os::attempt_reserve_memory_at(size_t bytes, char* requested_addr) {
2841  const int max_tries = 10;
2842  char* base[max_tries];
2843  size_t size[max_tries];
2844
2845  // Solaris adds a gap between mmap'ed regions.  The size of the gap
2846  // is dependent on the requested size and the MMU.  Our initial gap
2847  // value here is just a guess and will be corrected later.
2848  bool had_top_overlap = false;
2849  bool have_adjusted_gap = false;
2850  size_t gap = 0x400000;
2851
2852  // Assert only that the size is a multiple of the page size, since
2853  // that's all that mmap requires, and since that's all we really know
2854  // about at this low abstraction level.  If we need higher alignment,
2855  // we can either pass an alignment to this method or verify alignment
2856  // in one of the methods further up the call chain.  See bug 5044738.
2857  assert(bytes % os::vm_page_size() == 0, "reserving unexpected size block");
2858
2859  // Since snv_84, Solaris attempts to honor the address hint - see 5003415.
2860  // Give it a try, if the kernel honors the hint we can return immediately.
2861  char* addr = Solaris::anon_mmap(requested_addr, bytes, 0, false);
2862  volatile int err = errno;
2863  if (addr == requested_addr) {
2864    return addr;
2865  } else if (addr != NULL) {
2866    unmap_memory(addr, bytes);
2867  }
2868
2869  if (PrintMiscellaneous && Verbose) {
2870    char buf[256];
2871    buf[0] = '\0';
2872    if (addr == NULL) {
2873      jio_snprintf(buf, sizeof(buf), ": %s", strerror(err));
2874    }
2875    warning("attempt_reserve_memory_at: couldn't reserve %d bytes at "
2876            PTR_FORMAT ": reserve_memory_helper returned " PTR_FORMAT
2877            "%s", bytes, requested_addr, addr, buf);
2878  }
2879
2880  // Address hint method didn't work.  Fall back to the old method.
2881  // In theory, once SNV becomes our oldest supported platform, this
2882  // code will no longer be needed.
2883  //
2884  // Repeatedly allocate blocks until the block is allocated at the
2885  // right spot. Give up after max_tries.
2886  int i;
2887  for (i = 0; i < max_tries; ++i) {
2888    base[i] = reserve_memory(bytes);
2889
2890    if (base[i] != NULL) {
2891      // Is this the block we wanted?
2892      if (base[i] == requested_addr) {
2893        size[i] = bytes;
2894        break;
2895      }
2896
2897      // check that the gap value is right
2898      if (had_top_overlap && !have_adjusted_gap) {
2899        size_t actual_gap = base[i-1] - base[i] - bytes;
2900        if (gap != actual_gap) {
2901          // adjust the gap value and retry the last 2 allocations
2902          assert(i > 0, "gap adjustment code problem");
2903          have_adjusted_gap = true;  // adjust the gap only once, just in case
2904          gap = actual_gap;
2905          if (PrintMiscellaneous && Verbose) {
2906            warning("attempt_reserve_memory_at: adjusted gap to 0x%lx", gap);
2907          }
2908          unmap_memory(base[i], bytes);
2909          unmap_memory(base[i-1], size[i-1]);
2910          i-=2;
2911          continue;
2912        }
2913      }
2914
2915      // Does this overlap the block we wanted? Give back the overlapped
2916      // parts and try again.
2917      //
2918      // There is still a bug in this code: if top_overlap == bytes,
2919      // the overlap is offset from requested region by the value of gap.
2920      // In this case giving back the overlapped part will not work,
2921      // because we'll give back the entire block at base[i] and
2922      // therefore the subsequent allocation will not generate a new gap.
2923      // This could be fixed with a new algorithm that used larger
2924      // or variable size chunks to find the requested region -
2925      // but such a change would introduce additional complications.
2926      // It's rare enough that the planets align for this bug,
2927      // so we'll just wait for a fix for 6204603/5003415 which
2928      // will provide a mmap flag to allow us to avoid this business.
2929
2930      size_t top_overlap = requested_addr + (bytes + gap) - base[i];
2931      if (top_overlap >= 0 && top_overlap < bytes) {
2932        had_top_overlap = true;
2933        unmap_memory(base[i], top_overlap);
2934        base[i] += top_overlap;
2935        size[i] = bytes - top_overlap;
2936      } else {
2937        size_t bottom_overlap = base[i] + bytes - requested_addr;
2938        if (bottom_overlap >= 0 && bottom_overlap < bytes) {
2939          if (PrintMiscellaneous && Verbose && bottom_overlap == 0) {
2940            warning("attempt_reserve_memory_at: possible alignment bug");
2941          }
2942          unmap_memory(requested_addr, bottom_overlap);
2943          size[i] = bytes - bottom_overlap;
2944        } else {
2945          size[i] = bytes;
2946        }
2947      }
2948    }
2949  }
2950
2951  // Give back the unused reserved pieces.
2952
2953  for (int j = 0; j < i; ++j) {
2954    if (base[j] != NULL) {
2955      unmap_memory(base[j], size[j]);
2956    }
2957  }
2958
2959  return (i < max_tries) ? requested_addr : NULL;
2960}
2961
2962bool os::release_memory(char* addr, size_t bytes) {
2963  size_t size = bytes;
2964  return munmap(addr, size) == 0;
2965}
2966
2967static bool solaris_mprotect(char* addr, size_t bytes, int prot) {
2968  assert(addr == (char*)align_size_down((uintptr_t)addr, os::vm_page_size()),
2969         "addr must be page aligned");
2970  int retVal = mprotect(addr, bytes, prot);
2971  return retVal == 0;
2972}
2973
2974// Protect memory (Used to pass readonly pages through
2975// JNI GetArray<type>Elements with empty arrays.)
2976bool os::protect_memory(char* addr, size_t bytes, ProtType prot,
2977                        bool is_committed) {
2978  unsigned int p = 0;
2979  switch (prot) {
2980  case MEM_PROT_NONE: p = PROT_NONE; break;
2981  case MEM_PROT_READ: p = PROT_READ; break;
2982  case MEM_PROT_RW:   p = PROT_READ|PROT_WRITE; break;
2983  case MEM_PROT_RWX:  p = PROT_READ|PROT_WRITE|PROT_EXEC; break;
2984  default:
2985    ShouldNotReachHere();
2986  }
2987  // is_committed is unused.
2988  return solaris_mprotect(addr, bytes, p);
2989}
2990
2991// guard_memory and unguard_memory only happens within stack guard pages.
2992// Since ISM pertains only to the heap, guard and unguard memory should not
2993/// happen with an ISM region.
2994bool os::guard_memory(char* addr, size_t bytes) {
2995  return solaris_mprotect(addr, bytes, PROT_NONE);
2996}
2997
2998bool os::unguard_memory(char* addr, size_t bytes) {
2999  return solaris_mprotect(addr, bytes, PROT_READ|PROT_WRITE|PROT_EXEC);
3000}
3001
3002// Large page support
3003
3004// UseLargePages is the master flag to enable/disable large page memory.
3005// UseMPSS and UseISM are supported for compatibility reasons. Their combined
3006// effects can be described in the following table:
3007//
3008// UseLargePages UseMPSS UseISM
3009//    false         *       *   => UseLargePages is the master switch, turning
3010//                                 it off will turn off both UseMPSS and
3011//                                 UseISM. VM will not use large page memory
3012//                                 regardless the settings of UseMPSS/UseISM.
3013//     true      false    false => Unless future Solaris provides other
3014//                                 mechanism to use large page memory, this
3015//                                 combination is equivalent to -UseLargePages,
3016//                                 VM will not use large page memory
3017//     true      true     false => JVM will use MPSS for large page memory.
3018//                                 This is the default behavior.
3019//     true      false    true  => JVM will use ISM for large page memory.
3020//     true      true     true  => JVM will use ISM if it is available.
3021//                                 Otherwise, JVM will fall back to MPSS.
3022//                                 Becaues ISM is now available on all
3023//                                 supported Solaris versions, this combination
3024//                                 is equivalent to +UseISM -UseMPSS.
3025
3026typedef int (*getpagesizes_func_type) (size_t[], int);
3027static size_t _large_page_size = 0;
3028
3029bool os::Solaris::ism_sanity_check(bool warn, size_t * page_size) {
3030  // x86 uses either 2M or 4M page, depending on whether PAE (Physical Address
3031  // Extensions) mode is enabled. AMD64/EM64T uses 2M page in 64bit mode. Sparc
3032  // can support multiple page sizes.
3033
3034  // Don't bother to probe page size because getpagesizes() comes with MPSS.
3035  // ISM is only recommended on old Solaris where there is no MPSS support.
3036  // Simply choose a conservative value as default.
3037  *page_size = LargePageSizeInBytes ? LargePageSizeInBytes :
3038               SPARC_ONLY(4 * M) IA32_ONLY(4 * M) AMD64_ONLY(2 * M);
3039
3040  // ISM is available on all supported Solaris versions
3041  return true;
3042}
3043
3044// Insertion sort for small arrays (descending order).
3045static void insertion_sort_descending(size_t* array, int len) {
3046  for (int i = 0; i < len; i++) {
3047    size_t val = array[i];
3048    for (size_t key = i; key > 0 && array[key - 1] < val; --key) {
3049      size_t tmp = array[key];
3050      array[key] = array[key - 1];
3051      array[key - 1] = tmp;
3052    }
3053  }
3054}
3055
3056bool os::Solaris::mpss_sanity_check(bool warn, size_t * page_size) {
3057  getpagesizes_func_type getpagesizes_func =
3058    CAST_TO_FN_PTR(getpagesizes_func_type, dlsym(RTLD_DEFAULT, "getpagesizes"));
3059  if (getpagesizes_func == NULL) {
3060    if (warn) {
3061      warning("MPSS is not supported by the operating system.");
3062    }
3063    return false;
3064  }
3065
3066  const unsigned int usable_count = VM_Version::page_size_count();
3067  if (usable_count == 1) {
3068    return false;
3069  }
3070
3071  // Fill the array of page sizes.
3072  int n = getpagesizes_func(_page_sizes, page_sizes_max);
3073  assert(n > 0, "Solaris bug?");
3074  if (n == page_sizes_max) {
3075    // Add a sentinel value (necessary only if the array was completely filled
3076    // since it is static (zeroed at initialization)).
3077    _page_sizes[--n] = 0;
3078    DEBUG_ONLY(warning("increase the size of the os::_page_sizes array.");)
3079  }
3080  assert(_page_sizes[n] == 0, "missing sentinel");
3081
3082  if (n == 1) return false;     // Only one page size available.
3083
3084  // Skip sizes larger than 4M (or LargePageSizeInBytes if it was set) and
3085  // select up to usable_count elements.  First sort the array, find the first
3086  // acceptable value, then copy the usable sizes to the top of the array and
3087  // trim the rest.  Make sure to include the default page size :-).
3088  //
3089  // A better policy could get rid of the 4M limit by taking the sizes of the
3090  // important VM memory regions (java heap and possibly the code cache) into
3091  // account.
3092  insertion_sort_descending(_page_sizes, n);
3093  const size_t size_limit =
3094    FLAG_IS_DEFAULT(LargePageSizeInBytes) ? 4 * M : LargePageSizeInBytes;
3095  int beg;
3096  for (beg = 0; beg < n && _page_sizes[beg] > size_limit; ++beg) /* empty */ ;
3097  const int end = MIN2((int)usable_count, n) - 1;
3098  for (int cur = 0; cur < end; ++cur, ++beg) {
3099    _page_sizes[cur] = _page_sizes[beg];
3100  }
3101  _page_sizes[end] = vm_page_size();
3102  _page_sizes[end + 1] = 0;
3103
3104  if (_page_sizes[end] > _page_sizes[end - 1]) {
3105    // Default page size is not the smallest; sort again.
3106    insertion_sort_descending(_page_sizes, end + 1);
3107  }
3108  *page_size = _page_sizes[0];
3109
3110  return true;
3111}
3112
3113bool os::large_page_init() {
3114  if (!UseLargePages) {
3115    UseISM = false;
3116    UseMPSS = false;
3117    return false;
3118  }
3119
3120  // print a warning if any large page related flag is specified on command line
3121  bool warn_on_failure = !FLAG_IS_DEFAULT(UseLargePages)        ||
3122                         !FLAG_IS_DEFAULT(UseISM)               ||
3123                         !FLAG_IS_DEFAULT(UseMPSS)              ||
3124                         !FLAG_IS_DEFAULT(LargePageSizeInBytes);
3125  UseISM = UseISM &&
3126           Solaris::ism_sanity_check(warn_on_failure, &_large_page_size);
3127  if (UseISM) {
3128    // ISM disables MPSS to be compatible with old JDK behavior
3129    UseMPSS = false;
3130    _page_sizes[0] = _large_page_size;
3131    _page_sizes[1] = vm_page_size();
3132  }
3133
3134  UseMPSS = UseMPSS &&
3135            Solaris::mpss_sanity_check(warn_on_failure, &_large_page_size);
3136
3137  UseLargePages = UseISM || UseMPSS;
3138  return UseLargePages;
3139}
3140
3141bool os::Solaris::set_mpss_range(caddr_t start, size_t bytes, size_t align) {
3142  // Signal to OS that we want large pages for addresses
3143  // from addr, addr + bytes
3144  struct memcntl_mha mpss_struct;
3145  mpss_struct.mha_cmd = MHA_MAPSIZE_VA;
3146  mpss_struct.mha_pagesize = align;
3147  mpss_struct.mha_flags = 0;
3148  if (memcntl(start, bytes, MC_HAT_ADVISE,
3149              (caddr_t) &mpss_struct, 0, 0) < 0) {
3150    debug_only(warning("Attempt to use MPSS failed."));
3151    return false;
3152  }
3153  return true;
3154}
3155
3156char* os::reserve_memory_special(size_t bytes) {
3157  assert(UseLargePages && UseISM, "only for ISM large pages");
3158
3159  size_t size = bytes;
3160  char* retAddr = NULL;
3161  int shmid;
3162  key_t ismKey;
3163
3164  bool warn_on_failure = UseISM &&
3165                        (!FLAG_IS_DEFAULT(UseLargePages)         ||
3166                         !FLAG_IS_DEFAULT(UseISM)                ||
3167                         !FLAG_IS_DEFAULT(LargePageSizeInBytes)
3168                        );
3169  char msg[128];
3170
3171  ismKey = IPC_PRIVATE;
3172
3173  // Create a large shared memory region to attach to based on size.
3174  // Currently, size is the total size of the heap
3175  shmid = shmget(ismKey, size, SHM_R | SHM_W | IPC_CREAT);
3176  if (shmid == -1){
3177     if (warn_on_failure) {
3178       jio_snprintf(msg, sizeof(msg), "Failed to reserve shared memory (errno = %d).", errno);
3179       warning(msg);
3180     }
3181     return NULL;
3182  }
3183
3184  // Attach to the region
3185  retAddr = (char *) shmat(shmid, 0, SHM_SHARE_MMU | SHM_R | SHM_W);
3186  int err = errno;
3187
3188  // Remove shmid. If shmat() is successful, the actual shared memory segment
3189  // will be deleted when it's detached by shmdt() or when the process
3190  // terminates. If shmat() is not successful this will remove the shared
3191  // segment immediately.
3192  shmctl(shmid, IPC_RMID, NULL);
3193
3194  if (retAddr == (char *) -1) {
3195    if (warn_on_failure) {
3196      jio_snprintf(msg, sizeof(msg), "Failed to attach shared memory (errno = %d).", err);
3197      warning(msg);
3198    }
3199    return NULL;
3200  }
3201
3202  return retAddr;
3203}
3204
3205bool os::release_memory_special(char* base, size_t bytes) {
3206  // detaching the SHM segment will also delete it, see reserve_memory_special()
3207  int rslt = shmdt(base);
3208  return rslt == 0;
3209}
3210
3211size_t os::large_page_size() {
3212  return _large_page_size;
3213}
3214
3215// MPSS allows application to commit large page memory on demand; with ISM
3216// the entire memory region must be allocated as shared memory.
3217bool os::can_commit_large_page_memory() {
3218  return UseISM ? false : true;
3219}
3220
3221bool os::can_execute_large_page_memory() {
3222  return UseISM ? false : true;
3223}
3224
3225static int os_sleep(jlong millis, bool interruptible) {
3226  const jlong limit = INT_MAX;
3227  jlong prevtime;
3228  int res;
3229
3230  while (millis > limit) {
3231    if ((res = os_sleep(limit, interruptible)) != OS_OK)
3232      return res;
3233    millis -= limit;
3234  }
3235
3236  // Restart interrupted polls with new parameters until the proper delay
3237  // has been completed.
3238
3239  prevtime = getTimeMillis();
3240
3241  while (millis > 0) {
3242    jlong newtime;
3243
3244    if (!interruptible) {
3245      // Following assert fails for os::yield_all:
3246      // assert(!thread->is_Java_thread(), "must not be java thread");
3247      res = poll(NULL, 0, millis);
3248    } else {
3249      JavaThread *jt = JavaThread::current();
3250
3251      INTERRUPTIBLE_NORESTART_VM_ALWAYS(poll(NULL, 0, millis), res, jt,
3252        os::Solaris::clear_interrupted);
3253    }
3254
3255    // INTERRUPTIBLE_NORESTART_VM_ALWAYS returns res == OS_INTRPT for
3256    // thread.Interrupt.
3257
3258    if((res == OS_ERR) && (errno == EINTR)) {
3259      newtime = getTimeMillis();
3260      assert(newtime >= prevtime, "time moving backwards");
3261    /* Doing prevtime and newtime in microseconds doesn't help precision,
3262       and trying to round up to avoid lost milliseconds can result in a
3263       too-short delay. */
3264      millis -= newtime - prevtime;
3265      if(millis <= 0)
3266        return OS_OK;
3267      prevtime = newtime;
3268    } else
3269      return res;
3270  }
3271
3272  return OS_OK;
3273}
3274
3275// Read calls from inside the vm need to perform state transitions
3276size_t os::read(int fd, void *buf, unsigned int nBytes) {
3277  INTERRUPTIBLE_RETURN_INT_VM(::read(fd, buf, nBytes), os::Solaris::clear_interrupted);
3278}
3279
3280int os::sleep(Thread* thread, jlong millis, bool interruptible) {
3281  assert(thread == Thread::current(),  "thread consistency check");
3282
3283  // TODO-FIXME: this should be removed.
3284  // On Solaris machines (especially 2.5.1) we found that sometimes the VM gets into a live lock
3285  // situation with a JavaThread being starved out of a lwp. The kernel doesn't seem to generate
3286  // a SIGWAITING signal which would enable the threads library to create a new lwp for the starving
3287  // thread. We suspect that because the Watcher thread keeps waking up at periodic intervals the kernel
3288  // is fooled into believing that the system is making progress. In the code below we block the
3289  // the watcher thread while safepoint is in progress so that it would not appear as though the
3290  // system is making progress.
3291  if (!Solaris::T2_libthread() &&
3292      thread->is_Watcher_thread() && SafepointSynchronize::is_synchronizing() && !Arguments::has_profile()) {
3293    // We now try to acquire the threads lock. Since this lock is held by the VM thread during
3294    // the entire safepoint, the watcher thread will  line up here during the safepoint.
3295    Threads_lock->lock_without_safepoint_check();
3296    Threads_lock->unlock();
3297  }
3298
3299  if (thread->is_Java_thread()) {
3300    // This is a JavaThread so we honor the _thread_blocked protocol
3301    // even for sleeps of 0 milliseconds. This was originally done
3302    // as a workaround for bug 4338139. However, now we also do it
3303    // to honor the suspend-equivalent protocol.
3304
3305    JavaThread *jt = (JavaThread *) thread;
3306    ThreadBlockInVM tbivm(jt);
3307
3308    jt->set_suspend_equivalent();
3309    // cleared by handle_special_suspend_equivalent_condition() or
3310    // java_suspend_self() via check_and_wait_while_suspended()
3311
3312    int ret_code;
3313    if (millis <= 0) {
3314      thr_yield();
3315      ret_code = 0;
3316    } else {
3317      // The original sleep() implementation did not create an
3318      // OSThreadWaitState helper for sleeps of 0 milliseconds.
3319      // I'm preserving that decision for now.
3320      OSThreadWaitState osts(jt->osthread(), false /* not Object.wait() */);
3321
3322      ret_code = os_sleep(millis, interruptible);
3323    }
3324
3325    // were we externally suspended while we were waiting?
3326    jt->check_and_wait_while_suspended();
3327
3328    return ret_code;
3329  }
3330
3331  // non-JavaThread from this point on:
3332
3333  if (millis <= 0) {
3334    thr_yield();
3335    return 0;
3336  }
3337
3338  OSThreadWaitState osts(thread->osthread(), false /* not Object.wait() */);
3339
3340  return os_sleep(millis, interruptible);
3341}
3342
3343int os::naked_sleep() {
3344  // %% make the sleep time an integer flag. for now use 1 millisec.
3345  return os_sleep(1, false);
3346}
3347
3348// Sleep forever; naked call to OS-specific sleep; use with CAUTION
3349void os::infinite_sleep() {
3350  while (true) {    // sleep forever ...
3351    ::sleep(100);   // ... 100 seconds at a time
3352  }
3353}
3354
3355// Used to convert frequent JVM_Yield() to nops
3356bool os::dont_yield() {
3357  if (DontYieldALot) {
3358    static hrtime_t last_time = 0;
3359    hrtime_t diff = getTimeNanos() - last_time;
3360
3361    if (diff < DontYieldALotInterval * 1000000)
3362      return true;
3363
3364    last_time += diff;
3365
3366    return false;
3367  }
3368  else {
3369    return false;
3370  }
3371}
3372
3373// Caveat: Solaris os::yield() causes a thread-state transition whereas
3374// the linux and win32 implementations do not.  This should be checked.
3375
3376void os::yield() {
3377  // Yields to all threads with same or greater priority
3378  os::sleep(Thread::current(), 0, false);
3379}
3380
3381// Note that yield semantics are defined by the scheduling class to which
3382// the thread currently belongs.  Typically, yield will _not yield to
3383// other equal or higher priority threads that reside on the dispatch queues
3384// of other CPUs.
3385
3386os::YieldResult os::NakedYield() { thr_yield(); return os::YIELD_UNKNOWN; }
3387
3388
3389// On Solaris we found that yield_all doesn't always yield to all other threads.
3390// There have been cases where there is a thread ready to execute but it doesn't
3391// get an lwp as the VM thread continues to spin with sleeps of 1 millisecond.
3392// The 1 millisecond wait doesn't seem long enough for the kernel to issue a
3393// SIGWAITING signal which will cause a new lwp to be created. So we count the
3394// number of times yield_all is called in the one loop and increase the sleep
3395// time after 8 attempts. If this fails too we increase the concurrency level
3396// so that the starving thread would get an lwp
3397
3398void os::yield_all(int attempts) {
3399  // Yields to all threads, including threads with lower priorities
3400  if (attempts == 0) {
3401    os::sleep(Thread::current(), 1, false);
3402  } else {
3403    int iterations = attempts % 30;
3404    if (iterations == 0 && !os::Solaris::T2_libthread()) {
3405      // thr_setconcurrency and _getconcurrency make sense only under T1.
3406      int noofLWPS = thr_getconcurrency();
3407      if (noofLWPS < (Threads::number_of_threads() + 2)) {
3408        thr_setconcurrency(thr_getconcurrency() + 1);
3409      }
3410    } else if (iterations < 25) {
3411      os::sleep(Thread::current(), 1, false);
3412    } else {
3413      os::sleep(Thread::current(), 10, false);
3414    }
3415  }
3416}
3417
3418// Called from the tight loops to possibly influence time-sharing heuristics
3419void os::loop_breaker(int attempts) {
3420  os::yield_all(attempts);
3421}
3422
3423
3424// Interface for setting lwp priorities.  If we are using T2 libthread,
3425// which forces the use of BoundThreads or we manually set UseBoundThreads,
3426// all of our threads will be assigned to real lwp's.  Using the thr_setprio
3427// function is meaningless in this mode so we must adjust the real lwp's priority
3428// The routines below implement the getting and setting of lwp priorities.
3429//
3430// Note: There are three priority scales used on Solaris.  Java priotities
3431//       which range from 1 to 10, libthread "thr_setprio" scale which range
3432//       from 0 to 127, and the current scheduling class of the process we
3433//       are running in.  This is typically from -60 to +60.
3434//       The setting of the lwp priorities in done after a call to thr_setprio
3435//       so Java priorities are mapped to libthread priorities and we map from
3436//       the latter to lwp priorities.  We don't keep priorities stored in
3437//       Java priorities since some of our worker threads want to set priorities
3438//       higher than all Java threads.
3439//
3440// For related information:
3441// (1)  man -s 2 priocntl
3442// (2)  man -s 4 priocntl
3443// (3)  man dispadmin
3444// =    librt.so
3445// =    libthread/common/rtsched.c - thrp_setlwpprio().
3446// =    ps -cL <pid> ... to validate priority.
3447// =    sched_get_priority_min and _max
3448//              pthread_create
3449//              sched_setparam
3450//              pthread_setschedparam
3451//
3452// Assumptions:
3453// +    We assume that all threads in the process belong to the same
3454//              scheduling class.   IE. an homogenous process.
3455// +    Must be root or in IA group to change change "interactive" attribute.
3456//              Priocntl() will fail silently.  The only indication of failure is when
3457//              we read-back the value and notice that it hasn't changed.
3458// +    Interactive threads enter the runq at the head, non-interactive at the tail.
3459// +    For RT, change timeslice as well.  Invariant:
3460//              constant "priority integral"
3461//              Konst == TimeSlice * (60-Priority)
3462//              Given a priority, compute appropriate timeslice.
3463// +    Higher numerical values have higher priority.
3464
3465// sched class attributes
3466typedef struct {
3467        int   schedPolicy;              // classID
3468        int   maxPrio;
3469        int   minPrio;
3470} SchedInfo;
3471
3472
3473static SchedInfo tsLimits, iaLimits, rtLimits;
3474
3475#ifdef ASSERT
3476static int  ReadBackValidate = 1;
3477#endif
3478static int  myClass     = 0;
3479static int  myMin       = 0;
3480static int  myMax       = 0;
3481static int  myCur       = 0;
3482static bool priocntl_enable = false;
3483
3484
3485// Call the version of priocntl suitable for all supported versions
3486// of Solaris. We need to call through this wrapper so that we can
3487// build on Solaris 9 and run on Solaris 8, 9 and 10.
3488//
3489// This code should be removed if we ever stop supporting Solaris 8
3490// and earlier releases.
3491
3492static long priocntl_stub(int pcver, idtype_t idtype, id_t id, int cmd, caddr_t arg);
3493typedef long (*priocntl_type)(int pcver, idtype_t idtype, id_t id, int cmd, caddr_t arg);
3494static priocntl_type priocntl_ptr = priocntl_stub;
3495
3496// Stub to set the value of the real pointer, and then call the real
3497// function.
3498
3499static long priocntl_stub(int pcver, idtype_t idtype, id_t id, int cmd, caddr_t arg) {
3500  // Try Solaris 8- name only.
3501  priocntl_type tmp = (priocntl_type)dlsym(RTLD_DEFAULT, "__priocntl");
3502  guarantee(tmp != NULL, "priocntl function not found.");
3503  priocntl_ptr = tmp;
3504  return (*priocntl_ptr)(PC_VERSION, idtype, id, cmd, arg);
3505}
3506
3507
3508// lwp_priocntl_init
3509//
3510// Try to determine the priority scale for our process.
3511//
3512// Return errno or 0 if OK.
3513//
3514static
3515int     lwp_priocntl_init ()
3516{
3517  int rslt;
3518  pcinfo_t ClassInfo;
3519  pcparms_t ParmInfo;
3520  int i;
3521
3522  if (!UseThreadPriorities) return 0;
3523
3524  // We are using Bound threads, we need to determine our priority ranges
3525  if (os::Solaris::T2_libthread() || UseBoundThreads) {
3526    // If ThreadPriorityPolicy is 1, switch tables
3527    if (ThreadPriorityPolicy == 1) {
3528      for (i = 0 ; i < MaxPriority+1; i++)
3529        os::java_to_os_priority[i] = prio_policy1[i];
3530    }
3531  }
3532  // Not using Bound Threads, set to ThreadPolicy 1
3533  else {
3534    for ( i = 0 ; i < MaxPriority+1; i++ ) {
3535      os::java_to_os_priority[i] = prio_policy1[i];
3536    }
3537    return 0;
3538  }
3539
3540
3541  // Get IDs for a set of well-known scheduling classes.
3542  // TODO-FIXME: GETCLINFO returns the current # of classes in the
3543  // the system.  We should have a loop that iterates over the
3544  // classID values, which are known to be "small" integers.
3545
3546  strcpy(ClassInfo.pc_clname, "TS");
3547  ClassInfo.pc_cid = -1;
3548  rslt = (*priocntl_ptr)(PC_VERSION, P_ALL, 0, PC_GETCID, (caddr_t)&ClassInfo);
3549  if (rslt < 0) return errno;
3550  assert(ClassInfo.pc_cid != -1, "cid for TS class is -1");
3551  tsLimits.schedPolicy = ClassInfo.pc_cid;
3552  tsLimits.maxPrio = ((tsinfo_t*)ClassInfo.pc_clinfo)->ts_maxupri;
3553  tsLimits.minPrio = -tsLimits.maxPrio;
3554
3555  strcpy(ClassInfo.pc_clname, "IA");
3556  ClassInfo.pc_cid = -1;
3557  rslt = (*priocntl_ptr)(PC_VERSION, P_ALL, 0, PC_GETCID, (caddr_t)&ClassInfo);
3558  if (rslt < 0) return errno;
3559  assert(ClassInfo.pc_cid != -1, "cid for IA class is -1");
3560  iaLimits.schedPolicy = ClassInfo.pc_cid;
3561  iaLimits.maxPrio = ((iainfo_t*)ClassInfo.pc_clinfo)->ia_maxupri;
3562  iaLimits.minPrio = -iaLimits.maxPrio;
3563
3564  strcpy(ClassInfo.pc_clname, "RT");
3565  ClassInfo.pc_cid = -1;
3566  rslt = (*priocntl_ptr)(PC_VERSION, P_ALL, 0, PC_GETCID, (caddr_t)&ClassInfo);
3567  if (rslt < 0) return errno;
3568  assert(ClassInfo.pc_cid != -1, "cid for RT class is -1");
3569  rtLimits.schedPolicy = ClassInfo.pc_cid;
3570  rtLimits.maxPrio = ((rtinfo_t*)ClassInfo.pc_clinfo)->rt_maxpri;
3571  rtLimits.minPrio = 0;
3572
3573
3574  // Query our "current" scheduling class.
3575  // This will normally be IA,TS or, rarely, RT.
3576  memset (&ParmInfo, 0, sizeof(ParmInfo));
3577  ParmInfo.pc_cid = PC_CLNULL;
3578  rslt = (*priocntl_ptr) (PC_VERSION, P_PID, P_MYID, PC_GETPARMS, (caddr_t)&ParmInfo );
3579  if ( rslt < 0 ) return errno;
3580  myClass = ParmInfo.pc_cid;
3581
3582  // We now know our scheduling classId, get specific information
3583  // the class.
3584  ClassInfo.pc_cid = myClass;
3585  ClassInfo.pc_clname[0] = 0;
3586  rslt = (*priocntl_ptr) (PC_VERSION, (idtype)0, 0, PC_GETCLINFO, (caddr_t)&ClassInfo );
3587  if ( rslt < 0 ) return errno;
3588
3589  if (ThreadPriorityVerbose)
3590    tty->print_cr ("lwp_priocntl_init: Class=%d(%s)...", myClass, ClassInfo.pc_clname);
3591
3592  memset(&ParmInfo, 0, sizeof(pcparms_t));
3593  ParmInfo.pc_cid = PC_CLNULL;
3594  rslt = (*priocntl_ptr)(PC_VERSION, P_PID, P_MYID, PC_GETPARMS, (caddr_t)&ParmInfo);
3595  if (rslt < 0) return errno;
3596
3597  if (ParmInfo.pc_cid == rtLimits.schedPolicy) {
3598    myMin = rtLimits.minPrio;
3599    myMax = rtLimits.maxPrio;
3600  } else if (ParmInfo.pc_cid == iaLimits.schedPolicy) {
3601    iaparms_t *iaInfo  = (iaparms_t*)ParmInfo.pc_clparms;
3602    myMin = iaLimits.minPrio;
3603    myMax = iaLimits.maxPrio;
3604    myMax = MIN2(myMax, (int)iaInfo->ia_uprilim);       // clamp - restrict
3605  } else if (ParmInfo.pc_cid == tsLimits.schedPolicy) {
3606    tsparms_t *tsInfo  = (tsparms_t*)ParmInfo.pc_clparms;
3607    myMin = tsLimits.minPrio;
3608    myMax = tsLimits.maxPrio;
3609    myMax = MIN2(myMax, (int)tsInfo->ts_uprilim);       // clamp - restrict
3610  } else {
3611    // No clue - punt
3612    if (ThreadPriorityVerbose)
3613      tty->print_cr ("Unknown scheduling class: %s ... \n", ClassInfo.pc_clname);
3614    return EINVAL;      // no clue, punt
3615  }
3616
3617  if (ThreadPriorityVerbose)
3618        tty->print_cr ("Thread priority Range: [%d..%d]\n", myMin, myMax);
3619
3620  priocntl_enable = true;  // Enable changing priorities
3621  return 0;
3622}
3623
3624#define IAPRI(x)        ((iaparms_t *)((x).pc_clparms))
3625#define RTPRI(x)        ((rtparms_t *)((x).pc_clparms))
3626#define TSPRI(x)        ((tsparms_t *)((x).pc_clparms))
3627
3628
3629// scale_to_lwp_priority
3630//
3631// Convert from the libthread "thr_setprio" scale to our current
3632// lwp scheduling class scale.
3633//
3634static
3635int     scale_to_lwp_priority (int rMin, int rMax, int x)
3636{
3637  int v;
3638
3639  if (x == 127) return rMax;            // avoid round-down
3640    v = (((x*(rMax-rMin)))/128)+rMin;
3641  return v;
3642}
3643
3644
3645// set_lwp_priority
3646//
3647// Set the priority of the lwp.  This call should only be made
3648// when using bound threads (T2 threads are bound by default).
3649//
3650int     set_lwp_priority (int ThreadID, int lwpid, int newPrio )
3651{
3652  int rslt;
3653  int Actual, Expected, prv;
3654  pcparms_t ParmInfo;                   // for GET-SET
3655#ifdef ASSERT
3656  pcparms_t ReadBack;                   // for readback
3657#endif
3658
3659  // Set priority via PC_GETPARMS, update, PC_SETPARMS
3660  // Query current values.
3661  // TODO: accelerate this by eliminating the PC_GETPARMS call.
3662  // Cache "pcparms_t" in global ParmCache.
3663  // TODO: elide set-to-same-value
3664
3665  // If something went wrong on init, don't change priorities.
3666  if ( !priocntl_enable ) {
3667    if (ThreadPriorityVerbose)
3668      tty->print_cr("Trying to set priority but init failed, ignoring");
3669    return EINVAL;
3670  }
3671
3672
3673  // If lwp hasn't started yet, just return
3674  // the _start routine will call us again.
3675  if ( lwpid <= 0 ) {
3676    if (ThreadPriorityVerbose) {
3677      tty->print_cr ("deferring the set_lwp_priority of thread " INTPTR_FORMAT " to %d, lwpid not set",
3678                     ThreadID, newPrio);
3679    }
3680    return 0;
3681  }
3682
3683  if (ThreadPriorityVerbose) {
3684    tty->print_cr ("set_lwp_priority(" INTPTR_FORMAT "@" INTPTR_FORMAT " %d) ",
3685                   ThreadID, lwpid, newPrio);
3686  }
3687
3688  memset(&ParmInfo, 0, sizeof(pcparms_t));
3689  ParmInfo.pc_cid = PC_CLNULL;
3690  rslt = (*priocntl_ptr)(PC_VERSION, P_LWPID, lwpid, PC_GETPARMS, (caddr_t)&ParmInfo);
3691  if (rslt < 0) return errno;
3692
3693  if (ParmInfo.pc_cid == rtLimits.schedPolicy) {
3694    rtparms_t *rtInfo  = (rtparms_t*)ParmInfo.pc_clparms;
3695    rtInfo->rt_pri     = scale_to_lwp_priority (rtLimits.minPrio, rtLimits.maxPrio, newPrio);
3696    rtInfo->rt_tqsecs  = RT_NOCHANGE;
3697    rtInfo->rt_tqnsecs = RT_NOCHANGE;
3698    if (ThreadPriorityVerbose) {
3699      tty->print_cr("RT: %d->%d\n", newPrio, rtInfo->rt_pri);
3700    }
3701  } else if (ParmInfo.pc_cid == iaLimits.schedPolicy) {
3702    iaparms_t *iaInfo  = (iaparms_t*)ParmInfo.pc_clparms;
3703    int maxClamped     = MIN2(iaLimits.maxPrio, (int)iaInfo->ia_uprilim);
3704    iaInfo->ia_upri    = scale_to_lwp_priority(iaLimits.minPrio, maxClamped, newPrio);
3705    iaInfo->ia_uprilim = IA_NOCHANGE;
3706    iaInfo->ia_nice    = IA_NOCHANGE;
3707    iaInfo->ia_mode    = IA_NOCHANGE;
3708    if (ThreadPriorityVerbose) {
3709      tty->print_cr ("IA: [%d...%d] %d->%d\n",
3710               iaLimits.minPrio, maxClamped, newPrio, iaInfo->ia_upri);
3711    }
3712  } else if (ParmInfo.pc_cid == tsLimits.schedPolicy) {
3713    tsparms_t *tsInfo  = (tsparms_t*)ParmInfo.pc_clparms;
3714    int maxClamped     = MIN2(tsLimits.maxPrio, (int)tsInfo->ts_uprilim);
3715    prv                = tsInfo->ts_upri;
3716    tsInfo->ts_upri    = scale_to_lwp_priority(tsLimits.minPrio, maxClamped, newPrio);
3717    tsInfo->ts_uprilim = IA_NOCHANGE;
3718    if (ThreadPriorityVerbose) {
3719      tty->print_cr ("TS: %d [%d...%d] %d->%d\n",
3720               prv, tsLimits.minPrio, maxClamped, newPrio, tsInfo->ts_upri);
3721    }
3722    if (prv == tsInfo->ts_upri) return 0;
3723  } else {
3724    if ( ThreadPriorityVerbose ) {
3725      tty->print_cr ("Unknown scheduling class\n");
3726    }
3727      return EINVAL;    // no clue, punt
3728  }
3729
3730  rslt = (*priocntl_ptr)(PC_VERSION, P_LWPID, lwpid, PC_SETPARMS, (caddr_t)&ParmInfo);
3731  if (ThreadPriorityVerbose && rslt) {
3732    tty->print_cr ("PC_SETPARMS ->%d %d\n", rslt, errno);
3733  }
3734  if (rslt < 0) return errno;
3735
3736#ifdef ASSERT
3737  // Sanity check: read back what we just attempted to set.
3738  // In theory it could have changed in the interim ...
3739  //
3740  // The priocntl system call is tricky.
3741  // Sometimes it'll validate the priority value argument and
3742  // return EINVAL if unhappy.  At other times it fails silently.
3743  // Readbacks are prudent.
3744
3745  if (!ReadBackValidate) return 0;
3746
3747  memset(&ReadBack, 0, sizeof(pcparms_t));
3748  ReadBack.pc_cid = PC_CLNULL;
3749  rslt = (*priocntl_ptr)(PC_VERSION, P_LWPID, lwpid, PC_GETPARMS, (caddr_t)&ReadBack);
3750  assert(rslt >= 0, "priocntl failed");
3751  Actual = Expected = 0xBAD;
3752  assert(ParmInfo.pc_cid == ReadBack.pc_cid, "cid's don't match");
3753  if (ParmInfo.pc_cid == rtLimits.schedPolicy) {
3754    Actual   = RTPRI(ReadBack)->rt_pri;
3755    Expected = RTPRI(ParmInfo)->rt_pri;
3756  } else if (ParmInfo.pc_cid == iaLimits.schedPolicy) {
3757    Actual   = IAPRI(ReadBack)->ia_upri;
3758    Expected = IAPRI(ParmInfo)->ia_upri;
3759  } else if (ParmInfo.pc_cid == tsLimits.schedPolicy) {
3760    Actual   = TSPRI(ReadBack)->ts_upri;
3761    Expected = TSPRI(ParmInfo)->ts_upri;
3762  } else {
3763    if ( ThreadPriorityVerbose ) {
3764      tty->print_cr("set_lwp_priority: unexpected class in readback: %d\n", ParmInfo.pc_cid);
3765    }
3766  }
3767
3768  if (Actual != Expected) {
3769    if ( ThreadPriorityVerbose ) {
3770      tty->print_cr ("set_lwp_priority(%d %d) Class=%d: actual=%d vs expected=%d\n",
3771             lwpid, newPrio, ReadBack.pc_cid, Actual, Expected);
3772    }
3773  }
3774#endif
3775
3776  return 0;
3777}
3778
3779
3780
3781// Solaris only gives access to 128 real priorities at a time,
3782// so we expand Java's ten to fill this range.  This would be better
3783// if we dynamically adjusted relative priorities.
3784//
3785// The ThreadPriorityPolicy option allows us to select 2 different
3786// priority scales.
3787//
3788// ThreadPriorityPolicy=0
3789// Since the Solaris' default priority is MaximumPriority, we do not
3790// set a priority lower than Max unless a priority lower than
3791// NormPriority is requested.
3792//
3793// ThreadPriorityPolicy=1
3794// This mode causes the priority table to get filled with
3795// linear values.  NormPriority get's mapped to 50% of the
3796// Maximum priority an so on.  This will cause VM threads
3797// to get unfair treatment against other Solaris processes
3798// which do not explicitly alter their thread priorities.
3799//
3800
3801
3802int os::java_to_os_priority[MaxPriority + 1] = {
3803  -99999,         // 0 Entry should never be used
3804
3805  0,              // 1 MinPriority
3806  32,             // 2
3807  64,             // 3
3808
3809  96,             // 4
3810  127,            // 5 NormPriority
3811  127,            // 6
3812
3813  127,            // 7
3814  127,            // 8
3815  127,            // 9 NearMaxPriority
3816
3817  127             // 10 MaxPriority
3818};
3819
3820
3821OSReturn os::set_native_priority(Thread* thread, int newpri) {
3822  assert(newpri >= MinimumPriority && newpri <= MaximumPriority, "bad priority mapping");
3823  if ( !UseThreadPriorities ) return OS_OK;
3824  int status = thr_setprio(thread->osthread()->thread_id(), newpri);
3825  if ( os::Solaris::T2_libthread() || (UseBoundThreads && thread->osthread()->is_vm_created()) )
3826    status |= (set_lwp_priority (thread->osthread()->thread_id(),
3827                    thread->osthread()->lwp_id(), newpri ));
3828  return (status == 0) ? OS_OK : OS_ERR;
3829}
3830
3831
3832OSReturn os::get_native_priority(const Thread* const thread, int *priority_ptr) {
3833  int p;
3834  if ( !UseThreadPriorities ) {
3835    *priority_ptr = NormalPriority;
3836    return OS_OK;
3837  }
3838  int status = thr_getprio(thread->osthread()->thread_id(), &p);
3839  if (status != 0) {
3840    return OS_ERR;
3841  }
3842  *priority_ptr = p;
3843  return OS_OK;
3844}
3845
3846
3847// Hint to the underlying OS that a task switch would not be good.
3848// Void return because it's a hint and can fail.
3849void os::hint_no_preempt() {
3850  schedctl_start(schedctl_init());
3851}
3852
3853void os::interrupt(Thread* thread) {
3854  assert(Thread::current() == thread || Threads_lock->owned_by_self(), "possibility of dangling Thread pointer");
3855
3856  OSThread* osthread = thread->osthread();
3857
3858  int isInterrupted = osthread->interrupted();
3859  if (!isInterrupted) {
3860      osthread->set_interrupted(true);
3861      OrderAccess::fence();
3862      // os::sleep() is implemented with either poll (NULL,0,timeout) or
3863      // by parking on _SleepEvent.  If the former, thr_kill will unwedge
3864      // the sleeper by SIGINTR, otherwise the unpark() will wake the sleeper.
3865      ParkEvent * const slp = thread->_SleepEvent ;
3866      if (slp != NULL) slp->unpark() ;
3867  }
3868
3869  // For JSR166:  unpark after setting status but before thr_kill -dl
3870  if (thread->is_Java_thread()) {
3871    ((JavaThread*)thread)->parker()->unpark();
3872  }
3873
3874  // Handle interruptible wait() ...
3875  ParkEvent * const ev = thread->_ParkEvent ;
3876  if (ev != NULL) ev->unpark() ;
3877
3878  // When events are used everywhere for os::sleep, then this thr_kill
3879  // will only be needed if UseVMInterruptibleIO is true.
3880
3881  if (!isInterrupted) {
3882    int status = thr_kill(osthread->thread_id(), os::Solaris::SIGinterrupt());
3883    assert_status(status == 0, status, "thr_kill");
3884
3885    // Bump thread interruption counter
3886    RuntimeService::record_thread_interrupt_signaled_count();
3887  }
3888}
3889
3890
3891bool os::is_interrupted(Thread* thread, bool clear_interrupted) {
3892  assert(Thread::current() == thread || Threads_lock->owned_by_self(), "possibility of dangling Thread pointer");
3893
3894  OSThread* osthread = thread->osthread();
3895
3896  bool res = osthread->interrupted();
3897
3898  // NOTE that since there is no "lock" around these two operations,
3899  // there is the possibility that the interrupted flag will be
3900  // "false" but that the interrupt event will be set. This is
3901  // intentional. The effect of this is that Object.wait() will appear
3902  // to have a spurious wakeup, which is not harmful, and the
3903  // possibility is so rare that it is not worth the added complexity
3904  // to add yet another lock. It has also been recommended not to put
3905  // the interrupted flag into the os::Solaris::Event structure,
3906  // because it hides the issue.
3907  if (res && clear_interrupted) {
3908    osthread->set_interrupted(false);
3909  }
3910  return res;
3911}
3912
3913
3914void os::print_statistics() {
3915}
3916
3917int os::message_box(const char* title, const char* message) {
3918  int i;
3919  fdStream err(defaultStream::error_fd());
3920  for (i = 0; i < 78; i++) err.print_raw("=");
3921  err.cr();
3922  err.print_raw_cr(title);
3923  for (i = 0; i < 78; i++) err.print_raw("-");
3924  err.cr();
3925  err.print_raw_cr(message);
3926  for (i = 0; i < 78; i++) err.print_raw("=");
3927  err.cr();
3928
3929  char buf[16];
3930  // Prevent process from exiting upon "read error" without consuming all CPU
3931  while (::read(0, buf, sizeof(buf)) <= 0) { ::sleep(100); }
3932
3933  return buf[0] == 'y' || buf[0] == 'Y';
3934}
3935
3936// A lightweight implementation that does not suspend the target thread and
3937// thus returns only a hint. Used for profiling only!
3938ExtendedPC os::get_thread_pc(Thread* thread) {
3939  // Make sure that it is called by the watcher and the Threads lock is owned.
3940  assert(Thread::current()->is_Watcher_thread(), "Must be watcher and own Threads_lock");
3941  // For now, is only used to profile the VM Thread
3942  assert(thread->is_VM_thread(), "Can only be called for VMThread");
3943  ExtendedPC epc;
3944
3945  GetThreadPC_Callback  cb(ProfileVM_lock);
3946  OSThread *osthread = thread->osthread();
3947  const int time_to_wait = 400; // 400ms wait for initial response
3948  int status = cb.interrupt(thread, time_to_wait);
3949
3950  if (cb.is_done() ) {
3951    epc = cb.addr();
3952  } else {
3953    DEBUG_ONLY(tty->print_cr("Failed to get pc for thread: %d got %d status",
3954                              osthread->thread_id(), status););
3955    // epc is already NULL
3956  }
3957  return epc;
3958}
3959
3960
3961// This does not do anything on Solaris. This is basically a hook for being
3962// able to use structured exception handling (thread-local exception filters) on, e.g., Win32.
3963void os::os_exception_wrapper(java_call_t f, JavaValue* value, methodHandle* method, JavaCallArguments* args, Thread* thread) {
3964  f(value, method, args, thread);
3965}
3966
3967// This routine may be used by user applications as a "hook" to catch signals.
3968// The user-defined signal handler must pass unrecognized signals to this
3969// routine, and if it returns true (non-zero), then the signal handler must
3970// return immediately.  If the flag "abort_if_unrecognized" is true, then this
3971// routine will never retun false (zero), but instead will execute a VM panic
3972// routine kill the process.
3973//
3974// If this routine returns false, it is OK to call it again.  This allows
3975// the user-defined signal handler to perform checks either before or after
3976// the VM performs its own checks.  Naturally, the user code would be making
3977// a serious error if it tried to handle an exception (such as a null check
3978// or breakpoint) that the VM was generating for its own correct operation.
3979//
3980// This routine may recognize any of the following kinds of signals:
3981// SIGBUS, SIGSEGV, SIGILL, SIGFPE, BREAK_SIGNAL, SIGPIPE, SIGXFSZ,
3982// os::Solaris::SIGasync
3983// It should be consulted by handlers for any of those signals.
3984// It explicitly does not recognize os::Solaris::SIGinterrupt
3985//
3986// The caller of this routine must pass in the three arguments supplied
3987// to the function referred to in the "sa_sigaction" (not the "sa_handler")
3988// field of the structure passed to sigaction().  This routine assumes that
3989// the sa_flags field passed to sigaction() includes SA_SIGINFO and SA_RESTART.
3990//
3991// Note that the VM will print warnings if it detects conflicting signal
3992// handlers, unless invoked with the option "-XX:+AllowUserSignalHandlers".
3993//
3994extern "C" int JVM_handle_solaris_signal(int signo, siginfo_t* siginfo, void* ucontext, int abort_if_unrecognized);
3995
3996
3997void signalHandler(int sig, siginfo_t* info, void* ucVoid) {
3998  JVM_handle_solaris_signal(sig, info, ucVoid, true);
3999}
4000
4001/* Do not delete - if guarantee is ever removed,  a signal handler (even empty)
4002   is needed to provoke threads blocked on IO to return an EINTR
4003   Note: this explicitly does NOT call JVM_handle_solaris_signal and
4004   does NOT participate in signal chaining due to requirement for
4005   NOT setting SA_RESTART to make EINTR work. */
4006extern "C" void sigINTRHandler(int sig, siginfo_t* info, void* ucVoid) {
4007   if (UseSignalChaining) {
4008      struct sigaction *actp = os::Solaris::get_chained_signal_action(sig);
4009      if (actp && actp->sa_handler) {
4010        vm_exit_during_initialization("Signal chaining detected for VM interrupt signal, try -XX:+UseAltSigs");
4011      }
4012   }
4013}
4014
4015// This boolean allows users to forward their own non-matching signals
4016// to JVM_handle_solaris_signal, harmlessly.
4017bool os::Solaris::signal_handlers_are_installed = false;
4018
4019// For signal-chaining
4020bool os::Solaris::libjsig_is_loaded = false;
4021typedef struct sigaction *(*get_signal_t)(int);
4022get_signal_t os::Solaris::get_signal_action = NULL;
4023
4024struct sigaction* os::Solaris::get_chained_signal_action(int sig) {
4025  struct sigaction *actp = NULL;
4026
4027  if ((libjsig_is_loaded)  && (sig <= Maxlibjsigsigs)) {
4028    // Retrieve the old signal handler from libjsig
4029    actp = (*get_signal_action)(sig);
4030  }
4031  if (actp == NULL) {
4032    // Retrieve the preinstalled signal handler from jvm
4033    actp = get_preinstalled_handler(sig);
4034  }
4035
4036  return actp;
4037}
4038
4039static bool call_chained_handler(struct sigaction *actp, int sig,
4040                                 siginfo_t *siginfo, void *context) {
4041  // Call the old signal handler
4042  if (actp->sa_handler == SIG_DFL) {
4043    // It's more reasonable to let jvm treat it as an unexpected exception
4044    // instead of taking the default action.
4045    return false;
4046  } else if (actp->sa_handler != SIG_IGN) {
4047    if ((actp->sa_flags & SA_NODEFER) == 0) {
4048      // automaticlly block the signal
4049      sigaddset(&(actp->sa_mask), sig);
4050    }
4051
4052    sa_handler_t hand;
4053    sa_sigaction_t sa;
4054    bool siginfo_flag_set = (actp->sa_flags & SA_SIGINFO) != 0;
4055    // retrieve the chained handler
4056    if (siginfo_flag_set) {
4057      sa = actp->sa_sigaction;
4058    } else {
4059      hand = actp->sa_handler;
4060    }
4061
4062    if ((actp->sa_flags & SA_RESETHAND) != 0) {
4063      actp->sa_handler = SIG_DFL;
4064    }
4065
4066    // try to honor the signal mask
4067    sigset_t oset;
4068    thr_sigsetmask(SIG_SETMASK, &(actp->sa_mask), &oset);
4069
4070    // call into the chained handler
4071    if (siginfo_flag_set) {
4072      (*sa)(sig, siginfo, context);
4073    } else {
4074      (*hand)(sig);
4075    }
4076
4077    // restore the signal mask
4078    thr_sigsetmask(SIG_SETMASK, &oset, 0);
4079  }
4080  // Tell jvm's signal handler the signal is taken care of.
4081  return true;
4082}
4083
4084bool os::Solaris::chained_handler(int sig, siginfo_t* siginfo, void* context) {
4085  bool chained = false;
4086  // signal-chaining
4087  if (UseSignalChaining) {
4088    struct sigaction *actp = get_chained_signal_action(sig);
4089    if (actp != NULL) {
4090      chained = call_chained_handler(actp, sig, siginfo, context);
4091    }
4092  }
4093  return chained;
4094}
4095
4096struct sigaction* os::Solaris::get_preinstalled_handler(int sig) {
4097  assert((chainedsigactions != (struct sigaction *)NULL) && (preinstalled_sigs != (int *)NULL) , "signals not yet initialized");
4098  if (preinstalled_sigs[sig] != 0) {
4099    return &chainedsigactions[sig];
4100  }
4101  return NULL;
4102}
4103
4104void os::Solaris::save_preinstalled_handler(int sig, struct sigaction& oldAct) {
4105
4106  assert(sig > 0 && sig <= Maxsignum, "vm signal out of expected range");
4107  assert((chainedsigactions != (struct sigaction *)NULL) && (preinstalled_sigs != (int *)NULL) , "signals not yet initialized");
4108  chainedsigactions[sig] = oldAct;
4109  preinstalled_sigs[sig] = 1;
4110}
4111
4112void os::Solaris::set_signal_handler(int sig, bool set_installed, bool oktochain) {
4113  // Check for overwrite.
4114  struct sigaction oldAct;
4115  sigaction(sig, (struct sigaction*)NULL, &oldAct);
4116  void* oldhand = oldAct.sa_sigaction ? CAST_FROM_FN_PTR(void*,  oldAct.sa_sigaction)
4117                                      : CAST_FROM_FN_PTR(void*,  oldAct.sa_handler);
4118  if (oldhand != CAST_FROM_FN_PTR(void*, SIG_DFL) &&
4119      oldhand != CAST_FROM_FN_PTR(void*, SIG_IGN) &&
4120      oldhand != CAST_FROM_FN_PTR(void*, signalHandler)) {
4121    if (AllowUserSignalHandlers || !set_installed) {
4122      // Do not overwrite; user takes responsibility to forward to us.
4123      return;
4124    } else if (UseSignalChaining) {
4125      if (oktochain) {
4126        // save the old handler in jvm
4127        save_preinstalled_handler(sig, oldAct);
4128      } else {
4129        vm_exit_during_initialization("Signal chaining not allowed for VM interrupt signal, try -XX:+UseAltSigs.");
4130      }
4131      // libjsig also interposes the sigaction() call below and saves the
4132      // old sigaction on it own.
4133    } else {
4134      fatal2("Encountered unexpected pre-existing sigaction handler %#lx for signal %d.", (long)oldhand, sig);
4135    }
4136  }
4137
4138  struct sigaction sigAct;
4139  sigfillset(&(sigAct.sa_mask));
4140  sigAct.sa_handler = SIG_DFL;
4141
4142  sigAct.sa_sigaction = signalHandler;
4143  // Handle SIGSEGV on alternate signal stack if
4144  // not using stack banging
4145  if (!UseStackBanging && sig == SIGSEGV) {
4146    sigAct.sa_flags = SA_SIGINFO | SA_RESTART | SA_ONSTACK;
4147  // Interruptible i/o requires SA_RESTART cleared so EINTR
4148  // is returned instead of restarting system calls
4149  } else if (sig == os::Solaris::SIGinterrupt()) {
4150    sigemptyset(&sigAct.sa_mask);
4151    sigAct.sa_handler = NULL;
4152    sigAct.sa_flags = SA_SIGINFO;
4153    sigAct.sa_sigaction = sigINTRHandler;
4154  } else {
4155    sigAct.sa_flags = SA_SIGINFO | SA_RESTART;
4156  }
4157  os::Solaris::set_our_sigflags(sig, sigAct.sa_flags);
4158
4159  sigaction(sig, &sigAct, &oldAct);
4160
4161  void* oldhand2 = oldAct.sa_sigaction ? CAST_FROM_FN_PTR(void*, oldAct.sa_sigaction)
4162                                       : CAST_FROM_FN_PTR(void*, oldAct.sa_handler);
4163  assert(oldhand2 == oldhand, "no concurrent signal handler installation");
4164}
4165
4166
4167#define DO_SIGNAL_CHECK(sig) \
4168  if (!sigismember(&check_signal_done, sig)) \
4169    os::Solaris::check_signal_handler(sig)
4170
4171// This method is a periodic task to check for misbehaving JNI applications
4172// under CheckJNI, we can add any periodic checks here
4173
4174void os::run_periodic_checks() {
4175  // A big source of grief is hijacking virt. addr 0x0 on Solaris,
4176  // thereby preventing a NULL checks.
4177  if(!check_addr0_done) check_addr0_done = check_addr0(tty);
4178
4179  if (check_signals == false) return;
4180
4181  // SEGV and BUS if overridden could potentially prevent
4182  // generation of hs*.log in the event of a crash, debugging
4183  // such a case can be very challenging, so we absolutely
4184  // check for the following for a good measure:
4185  DO_SIGNAL_CHECK(SIGSEGV);
4186  DO_SIGNAL_CHECK(SIGILL);
4187  DO_SIGNAL_CHECK(SIGFPE);
4188  DO_SIGNAL_CHECK(SIGBUS);
4189  DO_SIGNAL_CHECK(SIGPIPE);
4190  DO_SIGNAL_CHECK(SIGXFSZ);
4191
4192  // ReduceSignalUsage allows the user to override these handlers
4193  // see comments at the very top and jvm_solaris.h
4194  if (!ReduceSignalUsage) {
4195    DO_SIGNAL_CHECK(SHUTDOWN1_SIGNAL);
4196    DO_SIGNAL_CHECK(SHUTDOWN2_SIGNAL);
4197    DO_SIGNAL_CHECK(SHUTDOWN3_SIGNAL);
4198    DO_SIGNAL_CHECK(BREAK_SIGNAL);
4199  }
4200
4201  // See comments above for using JVM1/JVM2 and UseAltSigs
4202  DO_SIGNAL_CHECK(os::Solaris::SIGinterrupt());
4203  DO_SIGNAL_CHECK(os::Solaris::SIGasync());
4204
4205}
4206
4207typedef int (*os_sigaction_t)(int, const struct sigaction *, struct sigaction *);
4208
4209static os_sigaction_t os_sigaction = NULL;
4210
4211void os::Solaris::check_signal_handler(int sig) {
4212  char buf[O_BUFLEN];
4213  address jvmHandler = NULL;
4214
4215  struct sigaction act;
4216  if (os_sigaction == NULL) {
4217    // only trust the default sigaction, in case it has been interposed
4218    os_sigaction = (os_sigaction_t)dlsym(RTLD_DEFAULT, "sigaction");
4219    if (os_sigaction == NULL) return;
4220  }
4221
4222  os_sigaction(sig, (struct sigaction*)NULL, &act);
4223
4224  address thisHandler = (act.sa_flags & SA_SIGINFO)
4225    ? CAST_FROM_FN_PTR(address, act.sa_sigaction)
4226    : CAST_FROM_FN_PTR(address, act.sa_handler) ;
4227
4228
4229  switch(sig) {
4230    case SIGSEGV:
4231    case SIGBUS:
4232    case SIGFPE:
4233    case SIGPIPE:
4234    case SIGXFSZ:
4235    case SIGILL:
4236      jvmHandler = CAST_FROM_FN_PTR(address, signalHandler);
4237      break;
4238
4239    case SHUTDOWN1_SIGNAL:
4240    case SHUTDOWN2_SIGNAL:
4241    case SHUTDOWN3_SIGNAL:
4242    case BREAK_SIGNAL:
4243      jvmHandler = (address)user_handler();
4244      break;
4245
4246    default:
4247      int intrsig = os::Solaris::SIGinterrupt();
4248      int asynsig = os::Solaris::SIGasync();
4249
4250      if (sig == intrsig) {
4251        jvmHandler = CAST_FROM_FN_PTR(address, sigINTRHandler);
4252      } else if (sig == asynsig) {
4253        jvmHandler = CAST_FROM_FN_PTR(address, signalHandler);
4254      } else {
4255        return;
4256      }
4257      break;
4258  }
4259
4260
4261  if (thisHandler != jvmHandler) {
4262    tty->print("Warning: %s handler ", exception_name(sig, buf, O_BUFLEN));
4263    tty->print("expected:%s", get_signal_handler_name(jvmHandler, buf, O_BUFLEN));
4264    tty->print_cr("  found:%s", get_signal_handler_name(thisHandler, buf, O_BUFLEN));
4265    // No need to check this sig any longer
4266    sigaddset(&check_signal_done, sig);
4267  } else if(os::Solaris::get_our_sigflags(sig) != 0 && act.sa_flags != os::Solaris::get_our_sigflags(sig)) {
4268    tty->print("Warning: %s handler flags ", exception_name(sig, buf, O_BUFLEN));
4269    tty->print("expected:" PTR32_FORMAT, os::Solaris::get_our_sigflags(sig));
4270    tty->print_cr("  found:" PTR32_FORMAT, act.sa_flags);
4271    // No need to check this sig any longer
4272    sigaddset(&check_signal_done, sig);
4273  }
4274
4275  // Print all the signal handler state
4276  if (sigismember(&check_signal_done, sig)) {
4277    print_signal_handlers(tty, buf, O_BUFLEN);
4278  }
4279
4280}
4281
4282void os::Solaris::install_signal_handlers() {
4283  bool libjsigdone = false;
4284  signal_handlers_are_installed = true;
4285
4286  // signal-chaining
4287  typedef void (*signal_setting_t)();
4288  signal_setting_t begin_signal_setting = NULL;
4289  signal_setting_t end_signal_setting = NULL;
4290  begin_signal_setting = CAST_TO_FN_PTR(signal_setting_t,
4291                                        dlsym(RTLD_DEFAULT, "JVM_begin_signal_setting"));
4292  if (begin_signal_setting != NULL) {
4293    end_signal_setting = CAST_TO_FN_PTR(signal_setting_t,
4294                                        dlsym(RTLD_DEFAULT, "JVM_end_signal_setting"));
4295    get_signal_action = CAST_TO_FN_PTR(get_signal_t,
4296                                       dlsym(RTLD_DEFAULT, "JVM_get_signal_action"));
4297    get_libjsig_version = CAST_TO_FN_PTR(version_getting_t,
4298                                         dlsym(RTLD_DEFAULT, "JVM_get_libjsig_version"));
4299    libjsig_is_loaded = true;
4300    if (os::Solaris::get_libjsig_version != NULL) {
4301      libjsigversion =  (*os::Solaris::get_libjsig_version)();
4302    }
4303    assert(UseSignalChaining, "should enable signal-chaining");
4304  }
4305  if (libjsig_is_loaded) {
4306    // Tell libjsig jvm is setting signal handlers
4307    (*begin_signal_setting)();
4308  }
4309
4310  set_signal_handler(SIGSEGV, true, true);
4311  set_signal_handler(SIGPIPE, true, true);
4312  set_signal_handler(SIGXFSZ, true, true);
4313  set_signal_handler(SIGBUS, true, true);
4314  set_signal_handler(SIGILL, true, true);
4315  set_signal_handler(SIGFPE, true, true);
4316
4317
4318  if (os::Solaris::SIGinterrupt() > OLDMAXSIGNUM || os::Solaris::SIGasync() > OLDMAXSIGNUM) {
4319
4320    // Pre-1.4.1 Libjsig limited to signal chaining signals <= 32 so
4321    // can not register overridable signals which might be > 32
4322    if (libjsig_is_loaded && libjsigversion <= JSIG_VERSION_1_4_1) {
4323    // Tell libjsig jvm has finished setting signal handlers
4324      (*end_signal_setting)();
4325      libjsigdone = true;
4326    }
4327  }
4328
4329  // Never ok to chain our SIGinterrupt
4330  set_signal_handler(os::Solaris::SIGinterrupt(), true, false);
4331  set_signal_handler(os::Solaris::SIGasync(), true, true);
4332
4333  if (libjsig_is_loaded && !libjsigdone) {
4334    // Tell libjsig jvm finishes setting signal handlers
4335    (*end_signal_setting)();
4336  }
4337
4338  // We don't activate signal checker if libjsig is in place, we trust ourselves
4339  // and if UserSignalHandler is installed all bets are off
4340  if (CheckJNICalls) {
4341    if (libjsig_is_loaded) {
4342      tty->print_cr("Info: libjsig is activated, all active signal checking is disabled");
4343      check_signals = false;
4344    }
4345    if (AllowUserSignalHandlers) {
4346      tty->print_cr("Info: AllowUserSignalHandlers is activated, all active signal checking is disabled");
4347      check_signals = false;
4348    }
4349  }
4350}
4351
4352
4353void report_error(const char* file_name, int line_no, const char* title, const char* format, ...);
4354
4355const char * signames[] = {
4356  "SIG0",
4357  "SIGHUP", "SIGINT", "SIGQUIT", "SIGILL", "SIGTRAP",
4358  "SIGABRT", "SIGEMT", "SIGFPE", "SIGKILL", "SIGBUS",
4359  "SIGSEGV", "SIGSYS", "SIGPIPE", "SIGALRM", "SIGTERM",
4360  "SIGUSR1", "SIGUSR2", "SIGCLD", "SIGPWR", "SIGWINCH",
4361  "SIGURG", "SIGPOLL", "SIGSTOP", "SIGTSTP", "SIGCONT",
4362  "SIGTTIN", "SIGTTOU", "SIGVTALRM", "SIGPROF", "SIGXCPU",
4363  "SIGXFSZ", "SIGWAITING", "SIGLWP", "SIGFREEZE", "SIGTHAW",
4364  "SIGCANCEL", "SIGLOST"
4365};
4366
4367const char* os::exception_name(int exception_code, char* buf, size_t size) {
4368  if (0 < exception_code && exception_code <= SIGRTMAX) {
4369    // signal
4370    if (exception_code < sizeof(signames)/sizeof(const char*)) {
4371       jio_snprintf(buf, size, "%s", signames[exception_code]);
4372    } else {
4373       jio_snprintf(buf, size, "SIG%d", exception_code);
4374    }
4375    return buf;
4376  } else {
4377    return NULL;
4378  }
4379}
4380
4381// (Static) wrappers for the new libthread API
4382int_fnP_thread_t_iP_uP_stack_tP_gregset_t os::Solaris::_thr_getstate;
4383int_fnP_thread_t_i_gregset_t os::Solaris::_thr_setstate;
4384int_fnP_thread_t_i os::Solaris::_thr_setmutator;
4385int_fnP_thread_t os::Solaris::_thr_suspend_mutator;
4386int_fnP_thread_t os::Solaris::_thr_continue_mutator;
4387
4388// (Static) wrappers for the liblgrp API
4389os::Solaris::lgrp_home_func_t os::Solaris::_lgrp_home;
4390os::Solaris::lgrp_init_func_t os::Solaris::_lgrp_init;
4391os::Solaris::lgrp_fini_func_t os::Solaris::_lgrp_fini;
4392os::Solaris::lgrp_root_func_t os::Solaris::_lgrp_root;
4393os::Solaris::lgrp_children_func_t os::Solaris::_lgrp_children;
4394os::Solaris::lgrp_resources_func_t os::Solaris::_lgrp_resources;
4395os::Solaris::lgrp_nlgrps_func_t os::Solaris::_lgrp_nlgrps;
4396os::Solaris::lgrp_cookie_stale_func_t os::Solaris::_lgrp_cookie_stale;
4397os::Solaris::lgrp_cookie_t os::Solaris::_lgrp_cookie = 0;
4398
4399// (Static) wrapper for meminfo() call.
4400os::Solaris::meminfo_func_t os::Solaris::_meminfo = 0;
4401
4402static address resolve_symbol(const char *name) {
4403  address addr;
4404
4405  addr = (address) dlsym(RTLD_DEFAULT, name);
4406  if(addr == NULL) {
4407    // RTLD_DEFAULT was not defined on some early versions of 2.5.1
4408    addr = (address) dlsym(RTLD_NEXT, name);
4409    if(addr == NULL) {
4410      fatal(dlerror());
4411    }
4412  }
4413  return addr;
4414}
4415
4416
4417
4418// isT2_libthread()
4419//
4420// Routine to determine if we are currently using the new T2 libthread.
4421//
4422// We determine if we are using T2 by reading /proc/self/lstatus and
4423// looking for a thread with the ASLWP bit set.  If we find this status
4424// bit set, we must assume that we are NOT using T2.  The T2 team
4425// has approved this algorithm.
4426//
4427// We need to determine if we are running with the new T2 libthread
4428// since setting native thread priorities is handled differently
4429// when using this library.  All threads created using T2 are bound
4430// threads. Calling thr_setprio is meaningless in this case.
4431//
4432bool isT2_libthread() {
4433  static prheader_t * lwpArray = NULL;
4434  static int lwpSize = 0;
4435  static int lwpFile = -1;
4436  lwpstatus_t * that;
4437  char lwpName [128];
4438  bool isT2 = false;
4439
4440#define ADR(x)  ((uintptr_t)(x))
4441#define LWPINDEX(ary,ix)   ((lwpstatus_t *)(((ary)->pr_entsize * (ix)) + (ADR((ary) + 1))))
4442
4443  lwpFile = open("/proc/self/lstatus", O_RDONLY, 0);
4444  if (lwpFile < 0) {
4445      if (ThreadPriorityVerbose) warning ("Couldn't open /proc/self/lstatus\n");
4446      return false;
4447  }
4448  lwpSize = 16*1024;
4449  for (;;) {
4450    lseek (lwpFile, 0, SEEK_SET);
4451    lwpArray = (prheader_t *)NEW_C_HEAP_ARRAY(char, lwpSize);
4452    if (read(lwpFile, lwpArray, lwpSize) < 0) {
4453      if (ThreadPriorityVerbose) warning("Error reading /proc/self/lstatus\n");
4454      break;
4455    }
4456    if ((lwpArray->pr_nent * lwpArray->pr_entsize) <= lwpSize) {
4457       // We got a good snapshot - now iterate over the list.
4458      int aslwpcount = 0;
4459      for (int i = 0; i < lwpArray->pr_nent; i++ ) {
4460        that = LWPINDEX(lwpArray,i);
4461        if (that->pr_flags & PR_ASLWP) {
4462          aslwpcount++;
4463        }
4464      }
4465      if (aslwpcount == 0) isT2 = true;
4466      break;
4467    }
4468    lwpSize = lwpArray->pr_nent * lwpArray->pr_entsize;
4469    FREE_C_HEAP_ARRAY(char, lwpArray);  // retry.
4470  }
4471
4472  FREE_C_HEAP_ARRAY(char, lwpArray);
4473  close (lwpFile);
4474  if (ThreadPriorityVerbose) {
4475    if (isT2) tty->print_cr("We are running with a T2 libthread\n");
4476    else tty->print_cr("We are not running with a T2 libthread\n");
4477  }
4478  return isT2;
4479}
4480
4481
4482void os::Solaris::libthread_init() {
4483  address func = (address)dlsym(RTLD_DEFAULT, "_thr_suspend_allmutators");
4484
4485  // Determine if we are running with the new T2 libthread
4486  os::Solaris::set_T2_libthread(isT2_libthread());
4487
4488  lwp_priocntl_init();
4489
4490  // RTLD_DEFAULT was not defined on some early versions of 5.5.1
4491  if(func == NULL) {
4492    func = (address) dlsym(RTLD_NEXT, "_thr_suspend_allmutators");
4493    // Guarantee that this VM is running on an new enough OS (5.6 or
4494    // later) that it will have a new enough libthread.so.
4495    guarantee(func != NULL, "libthread.so is too old.");
4496  }
4497
4498  // Initialize the new libthread getstate API wrappers
4499  func = resolve_symbol("thr_getstate");
4500  os::Solaris::set_thr_getstate(CAST_TO_FN_PTR(int_fnP_thread_t_iP_uP_stack_tP_gregset_t, func));
4501
4502  func = resolve_symbol("thr_setstate");
4503  os::Solaris::set_thr_setstate(CAST_TO_FN_PTR(int_fnP_thread_t_i_gregset_t, func));
4504
4505  func = resolve_symbol("thr_setmutator");
4506  os::Solaris::set_thr_setmutator(CAST_TO_FN_PTR(int_fnP_thread_t_i, func));
4507
4508  func = resolve_symbol("thr_suspend_mutator");
4509  os::Solaris::set_thr_suspend_mutator(CAST_TO_FN_PTR(int_fnP_thread_t, func));
4510
4511  func = resolve_symbol("thr_continue_mutator");
4512  os::Solaris::set_thr_continue_mutator(CAST_TO_FN_PTR(int_fnP_thread_t, func));
4513
4514  int size;
4515  void (*handler_info_func)(address *, int *);
4516  handler_info_func = CAST_TO_FN_PTR(void (*)(address *, int *), resolve_symbol("thr_sighndlrinfo"));
4517  handler_info_func(&handler_start, &size);
4518  handler_end = handler_start + size;
4519}
4520
4521
4522int_fnP_mutex_tP os::Solaris::_mutex_lock;
4523int_fnP_mutex_tP os::Solaris::_mutex_trylock;
4524int_fnP_mutex_tP os::Solaris::_mutex_unlock;
4525int_fnP_mutex_tP_i_vP os::Solaris::_mutex_init;
4526int_fnP_mutex_tP os::Solaris::_mutex_destroy;
4527int os::Solaris::_mutex_scope = USYNC_THREAD;
4528
4529int_fnP_cond_tP_mutex_tP_timestruc_tP os::Solaris::_cond_timedwait;
4530int_fnP_cond_tP_mutex_tP os::Solaris::_cond_wait;
4531int_fnP_cond_tP os::Solaris::_cond_signal;
4532int_fnP_cond_tP os::Solaris::_cond_broadcast;
4533int_fnP_cond_tP_i_vP os::Solaris::_cond_init;
4534int_fnP_cond_tP os::Solaris::_cond_destroy;
4535int os::Solaris::_cond_scope = USYNC_THREAD;
4536
4537void os::Solaris::synchronization_init() {
4538  if(UseLWPSynchronization) {
4539    os::Solaris::set_mutex_lock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("_lwp_mutex_lock")));
4540    os::Solaris::set_mutex_trylock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("_lwp_mutex_trylock")));
4541    os::Solaris::set_mutex_unlock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("_lwp_mutex_unlock")));
4542    os::Solaris::set_mutex_init(lwp_mutex_init);
4543    os::Solaris::set_mutex_destroy(lwp_mutex_destroy);
4544    os::Solaris::set_mutex_scope(USYNC_THREAD);
4545
4546    os::Solaris::set_cond_timedwait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP_timestruc_tP, resolve_symbol("_lwp_cond_timedwait")));
4547    os::Solaris::set_cond_wait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP, resolve_symbol("_lwp_cond_wait")));
4548    os::Solaris::set_cond_signal(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("_lwp_cond_signal")));
4549    os::Solaris::set_cond_broadcast(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("_lwp_cond_broadcast")));
4550    os::Solaris::set_cond_init(lwp_cond_init);
4551    os::Solaris::set_cond_destroy(lwp_cond_destroy);
4552    os::Solaris::set_cond_scope(USYNC_THREAD);
4553  }
4554  else {
4555    os::Solaris::set_mutex_scope(USYNC_THREAD);
4556    os::Solaris::set_cond_scope(USYNC_THREAD);
4557
4558    if(UsePthreads) {
4559      os::Solaris::set_mutex_lock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_lock")));
4560      os::Solaris::set_mutex_trylock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_trylock")));
4561      os::Solaris::set_mutex_unlock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_unlock")));
4562      os::Solaris::set_mutex_init(pthread_mutex_default_init);
4563      os::Solaris::set_mutex_destroy(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_destroy")));
4564
4565      os::Solaris::set_cond_timedwait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP_timestruc_tP, resolve_symbol("pthread_cond_timedwait")));
4566      os::Solaris::set_cond_wait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP, resolve_symbol("pthread_cond_wait")));
4567      os::Solaris::set_cond_signal(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("pthread_cond_signal")));
4568      os::Solaris::set_cond_broadcast(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("pthread_cond_broadcast")));
4569      os::Solaris::set_cond_init(pthread_cond_default_init);
4570      os::Solaris::set_cond_destroy(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("pthread_cond_destroy")));
4571    }
4572    else {
4573      os::Solaris::set_mutex_lock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("mutex_lock")));
4574      os::Solaris::set_mutex_trylock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("mutex_trylock")));
4575      os::Solaris::set_mutex_unlock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("mutex_unlock")));
4576      os::Solaris::set_mutex_init(::mutex_init);
4577      os::Solaris::set_mutex_destroy(::mutex_destroy);
4578
4579      os::Solaris::set_cond_timedwait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP_timestruc_tP, resolve_symbol("cond_timedwait")));
4580      os::Solaris::set_cond_wait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP, resolve_symbol("cond_wait")));
4581      os::Solaris::set_cond_signal(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("cond_signal")));
4582      os::Solaris::set_cond_broadcast(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("cond_broadcast")));
4583      os::Solaris::set_cond_init(::cond_init);
4584      os::Solaris::set_cond_destroy(::cond_destroy);
4585    }
4586  }
4587}
4588
4589void os::Solaris::liblgrp_init() {
4590  void *handle = dlopen("liblgrp.so.1", RTLD_LAZY);
4591  if (handle != NULL) {
4592    os::Solaris::set_lgrp_home(CAST_TO_FN_PTR(lgrp_home_func_t, dlsym(handle, "lgrp_home")));
4593    os::Solaris::set_lgrp_init(CAST_TO_FN_PTR(lgrp_init_func_t, dlsym(handle, "lgrp_init")));
4594    os::Solaris::set_lgrp_fini(CAST_TO_FN_PTR(lgrp_fini_func_t, dlsym(handle, "lgrp_fini")));
4595    os::Solaris::set_lgrp_root(CAST_TO_FN_PTR(lgrp_root_func_t, dlsym(handle, "lgrp_root")));
4596    os::Solaris::set_lgrp_children(CAST_TO_FN_PTR(lgrp_children_func_t, dlsym(handle, "lgrp_children")));
4597    os::Solaris::set_lgrp_resources(CAST_TO_FN_PTR(lgrp_resources_func_t, dlsym(handle, "lgrp_resources")));
4598    os::Solaris::set_lgrp_nlgrps(CAST_TO_FN_PTR(lgrp_nlgrps_func_t, dlsym(handle, "lgrp_nlgrps")));
4599    os::Solaris::set_lgrp_cookie_stale(CAST_TO_FN_PTR(lgrp_cookie_stale_func_t,
4600                                       dlsym(handle, "lgrp_cookie_stale")));
4601
4602    lgrp_cookie_t c = lgrp_init(LGRP_VIEW_CALLER);
4603    set_lgrp_cookie(c);
4604  } else {
4605    warning("your OS does not support NUMA");
4606  }
4607}
4608
4609void os::Solaris::misc_sym_init() {
4610  address func = (address)dlsym(RTLD_DEFAULT, "meminfo");
4611  if(func == NULL) {
4612    func = (address) dlsym(RTLD_NEXT, "meminfo");
4613  }
4614  if (func != NULL) {
4615    os::Solaris::set_meminfo(CAST_TO_FN_PTR(meminfo_func_t, func));
4616  }
4617}
4618
4619// Symbol doesn't exist in Solaris 8 pset.h
4620#ifndef PS_MYID
4621#define PS_MYID -3
4622#endif
4623
4624// int pset_getloadavg(psetid_t pset, double loadavg[], int nelem);
4625typedef long (*pset_getloadavg_type)(psetid_t pset, double loadavg[], int nelem);
4626static pset_getloadavg_type pset_getloadavg_ptr = NULL;
4627
4628void init_pset_getloadavg_ptr(void) {
4629  pset_getloadavg_ptr =
4630    (pset_getloadavg_type)dlsym(RTLD_DEFAULT, "pset_getloadavg");
4631  if (PrintMiscellaneous && Verbose && pset_getloadavg_ptr == NULL) {
4632    warning("pset_getloadavg function not found");
4633  }
4634}
4635
4636int os::Solaris::_dev_zero_fd = -1;
4637
4638// this is called _before_ the global arguments have been parsed
4639void os::init(void) {
4640  _initial_pid = getpid();
4641
4642  max_hrtime = first_hrtime = gethrtime();
4643
4644  init_random(1234567);
4645
4646  page_size = sysconf(_SC_PAGESIZE);
4647  if (page_size == -1)
4648    fatal1("os_solaris.cpp: os::init: sysconf failed (%s)", strerror(errno));
4649  init_page_sizes((size_t) page_size);
4650
4651  Solaris::initialize_system_info();
4652
4653  int fd = open("/dev/zero", O_RDWR);
4654  if (fd < 0) {
4655    fatal1("os::init: cannot open /dev/zero (%s)", strerror(errno));
4656  } else {
4657    Solaris::set_dev_zero_fd(fd);
4658
4659    // Close on exec, child won't inherit.
4660    fcntl(fd, F_SETFD, FD_CLOEXEC);
4661  }
4662
4663  clock_tics_per_sec = CLK_TCK;
4664
4665  // check if dladdr1() exists; dladdr1 can provide more information than
4666  // dladdr for os::dll_address_to_function_name. It comes with SunOS 5.9
4667  // and is available on linker patches for 5.7 and 5.8.
4668  // libdl.so must have been loaded, this call is just an entry lookup
4669  void * hdl = dlopen("libdl.so", RTLD_NOW);
4670  if (hdl)
4671    dladdr1_func = CAST_TO_FN_PTR(dladdr1_func_type, dlsym(hdl, "dladdr1"));
4672
4673  // (Solaris only) this switches to calls that actually do locking.
4674  ThreadCritical::initialize();
4675
4676  main_thread = thr_self();
4677
4678  // Constant minimum stack size allowed. It must be at least
4679  // the minimum of what the OS supports (thr_min_stack()), and
4680  // enough to allow the thread to get to user bytecode execution.
4681  Solaris::min_stack_allowed = MAX2(thr_min_stack(), Solaris::min_stack_allowed);
4682  // If the pagesize of the VM is greater than 8K determine the appropriate
4683  // number of initial guard pages.  The user can change this with the
4684  // command line arguments, if needed.
4685  if (vm_page_size() > 8*K) {
4686    StackYellowPages = 1;
4687    StackRedPages = 1;
4688    StackShadowPages = round_to((StackShadowPages*8*K), vm_page_size()) / vm_page_size();
4689  }
4690}
4691
4692// To install functions for atexit system call
4693extern "C" {
4694  static void perfMemory_exit_helper() {
4695    perfMemory_exit();
4696  }
4697}
4698
4699// this is called _after_ the global arguments have been parsed
4700jint os::init_2(void) {
4701  // try to enable extended file IO ASAP, see 6431278
4702  os::Solaris::try_enable_extended_io();
4703
4704  // Allocate a single page and mark it as readable for safepoint polling.  Also
4705  // use this first mmap call to check support for MAP_ALIGN.
4706  address polling_page = (address)Solaris::mmap_chunk((char*)page_size,
4707                                                      page_size,
4708                                                      MAP_PRIVATE | MAP_ALIGN,
4709                                                      PROT_READ);
4710  if (polling_page == NULL) {
4711    has_map_align = false;
4712    polling_page = (address)Solaris::mmap_chunk(NULL, page_size, MAP_PRIVATE,
4713                                                PROT_READ);
4714  }
4715
4716  os::set_polling_page(polling_page);
4717
4718#ifndef PRODUCT
4719  if( Verbose && PrintMiscellaneous )
4720    tty->print("[SafePoint Polling address: " INTPTR_FORMAT "]\n", (intptr_t)polling_page);
4721#endif
4722
4723  if (!UseMembar) {
4724    address mem_serialize_page = (address)Solaris::mmap_chunk( NULL, page_size, MAP_PRIVATE, PROT_READ | PROT_WRITE );
4725    guarantee( mem_serialize_page != NULL, "mmap Failed for memory serialize page");
4726    os::set_memory_serialize_page( mem_serialize_page );
4727
4728#ifndef PRODUCT
4729    if(Verbose && PrintMiscellaneous)
4730      tty->print("[Memory Serialize  Page address: " INTPTR_FORMAT "]\n", (intptr_t)mem_serialize_page);
4731#endif
4732}
4733
4734  FLAG_SET_DEFAULT(UseLargePages, os::large_page_init());
4735
4736  // Check minimum allowable stack size for thread creation and to initialize
4737  // the java system classes, including StackOverflowError - depends on page
4738  // size.  Add a page for compiler2 recursion in main thread.
4739  // Add in BytesPerWord times page size to account for VM stack during
4740  // class initialization depending on 32 or 64 bit VM.
4741  guarantee((Solaris::min_stack_allowed >=
4742    (StackYellowPages+StackRedPages+StackShadowPages+BytesPerWord
4743     COMPILER2_PRESENT(+1)) * page_size),
4744    "need to increase Solaris::min_stack_allowed on this platform");
4745
4746  size_t threadStackSizeInBytes = ThreadStackSize * K;
4747  if (threadStackSizeInBytes != 0 &&
4748    threadStackSizeInBytes < Solaris::min_stack_allowed) {
4749    tty->print_cr("\nThe stack size specified is too small, Specify at least %dk",
4750                  Solaris::min_stack_allowed/K);
4751    return JNI_ERR;
4752  }
4753
4754  // For 64kbps there will be a 64kb page size, which makes
4755  // the usable default stack size quite a bit less.  Increase the
4756  // stack for 64kb (or any > than 8kb) pages, this increases
4757  // virtual memory fragmentation (since we're not creating the
4758  // stack on a power of 2 boundary.  The real fix for this
4759  // should be to fix the guard page mechanism.
4760
4761  if (vm_page_size() > 8*K) {
4762      threadStackSizeInBytes = (threadStackSizeInBytes != 0)
4763         ? threadStackSizeInBytes +
4764           ((StackYellowPages + StackRedPages) * vm_page_size())
4765         : 0;
4766      ThreadStackSize = threadStackSizeInBytes/K;
4767  }
4768
4769  // Make the stack size a multiple of the page size so that
4770  // the yellow/red zones can be guarded.
4771  JavaThread::set_stack_size_at_create(round_to(threadStackSizeInBytes,
4772        vm_page_size()));
4773
4774  Solaris::libthread_init();
4775  if (UseNUMA) {
4776    Solaris::liblgrp_init();
4777  }
4778  Solaris::misc_sym_init();
4779  Solaris::signal_sets_init();
4780  Solaris::init_signal_mem();
4781  Solaris::install_signal_handlers();
4782
4783  if (libjsigversion < JSIG_VERSION_1_4_1) {
4784    Maxlibjsigsigs = OLDMAXSIGNUM;
4785  }
4786
4787  // initialize synchronization primitives to use either thread or
4788  // lwp synchronization (controlled by UseLWPSynchronization)
4789  Solaris::synchronization_init();
4790
4791  if (MaxFDLimit) {
4792    // set the number of file descriptors to max. print out error
4793    // if getrlimit/setrlimit fails but continue regardless.
4794    struct rlimit nbr_files;
4795    int status = getrlimit(RLIMIT_NOFILE, &nbr_files);
4796    if (status != 0) {
4797      if (PrintMiscellaneous && (Verbose || WizardMode))
4798        perror("os::init_2 getrlimit failed");
4799    } else {
4800      nbr_files.rlim_cur = nbr_files.rlim_max;
4801      status = setrlimit(RLIMIT_NOFILE, &nbr_files);
4802      if (status != 0) {
4803        if (PrintMiscellaneous && (Verbose || WizardMode))
4804          perror("os::init_2 setrlimit failed");
4805      }
4806    }
4807  }
4808
4809  // Initialize HPI.
4810  jint hpi_result = hpi::initialize();
4811  if (hpi_result != JNI_OK) {
4812    tty->print_cr("There was an error trying to initialize the HPI library.");
4813    return hpi_result;
4814  }
4815
4816  // Calculate theoretical max. size of Threads to guard gainst
4817  // artifical out-of-memory situations, where all available address-
4818  // space has been reserved by thread stacks. Default stack size is 1Mb.
4819  size_t pre_thread_stack_size = (JavaThread::stack_size_at_create()) ?
4820    JavaThread::stack_size_at_create() : (1*K*K);
4821  assert(pre_thread_stack_size != 0, "Must have a stack");
4822  // Solaris has a maximum of 4Gb of user programs. Calculate the thread limit when
4823  // we should start doing Virtual Memory banging. Currently when the threads will
4824  // have used all but 200Mb of space.
4825  size_t max_address_space = ((unsigned int)4 * K * K * K) - (200 * K * K);
4826  Solaris::_os_thread_limit = max_address_space / pre_thread_stack_size;
4827
4828  // at-exit methods are called in the reverse order of their registration.
4829  // In Solaris 7 and earlier, atexit functions are called on return from
4830  // main or as a result of a call to exit(3C). There can be only 32 of
4831  // these functions registered and atexit() does not set errno. In Solaris
4832  // 8 and later, there is no limit to the number of functions registered
4833  // and atexit() sets errno. In addition, in Solaris 8 and later, atexit
4834  // functions are called upon dlclose(3DL) in addition to return from main
4835  // and exit(3C).
4836
4837  if (PerfAllowAtExitRegistration) {
4838    // only register atexit functions if PerfAllowAtExitRegistration is set.
4839    // atexit functions can be delayed until process exit time, which
4840    // can be problematic for embedded VM situations. Embedded VMs should
4841    // call DestroyJavaVM() to assure that VM resources are released.
4842
4843    // note: perfMemory_exit_helper atexit function may be removed in
4844    // the future if the appropriate cleanup code can be added to the
4845    // VM_Exit VMOperation's doit method.
4846    if (atexit(perfMemory_exit_helper) != 0) {
4847      warning("os::init2 atexit(perfMemory_exit_helper) failed");
4848    }
4849  }
4850
4851  // Init pset_loadavg function pointer
4852  init_pset_getloadavg_ptr();
4853
4854  return JNI_OK;
4855}
4856
4857
4858// Mark the polling page as unreadable
4859void os::make_polling_page_unreadable(void) {
4860  if( mprotect((char *)_polling_page, page_size, PROT_NONE) != 0 )
4861    fatal("Could not disable polling page");
4862};
4863
4864// Mark the polling page as readable
4865void os::make_polling_page_readable(void) {
4866  if( mprotect((char *)_polling_page, page_size, PROT_READ) != 0 )
4867    fatal("Could not enable polling page");
4868};
4869
4870// OS interface.
4871
4872int os::stat(const char *path, struct stat *sbuf) {
4873  char pathbuf[MAX_PATH];
4874  if (strlen(path) > MAX_PATH - 1) {
4875    errno = ENAMETOOLONG;
4876    return -1;
4877  }
4878  hpi::native_path(strcpy(pathbuf, path));
4879  return ::stat(pathbuf, sbuf);
4880}
4881
4882
4883bool os::check_heap(bool force) { return true; }
4884
4885typedef int (*vsnprintf_t)(char* buf, size_t count, const char* fmt, va_list argptr);
4886static vsnprintf_t sol_vsnprintf = NULL;
4887
4888int local_vsnprintf(char* buf, size_t count, const char* fmt, va_list argptr) {
4889  if (!sol_vsnprintf) {
4890    //search  for the named symbol in the objects that were loaded after libjvm
4891    void* where = RTLD_NEXT;
4892    if ((sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "__vsnprintf"))) == NULL)
4893        sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "vsnprintf"));
4894    if (!sol_vsnprintf){
4895      //search  for the named symbol in the objects that were loaded before libjvm
4896      where = RTLD_DEFAULT;
4897      if ((sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "__vsnprintf"))) == NULL)
4898        sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "vsnprintf"));
4899      assert(sol_vsnprintf != NULL, "vsnprintf not found");
4900    }
4901  }
4902  return (*sol_vsnprintf)(buf, count, fmt, argptr);
4903}
4904
4905
4906// Is a (classpath) directory empty?
4907bool os::dir_is_empty(const char* path) {
4908  DIR *dir = NULL;
4909  struct dirent *ptr;
4910
4911  dir = opendir(path);
4912  if (dir == NULL) return true;
4913
4914  /* Scan the directory */
4915  bool result = true;
4916  char buf[sizeof(struct dirent) + MAX_PATH];
4917  struct dirent *dbuf = (struct dirent *) buf;
4918  while (result && (ptr = readdir(dir, dbuf)) != NULL) {
4919    if (strcmp(ptr->d_name, ".") != 0 && strcmp(ptr->d_name, "..") != 0) {
4920      result = false;
4921    }
4922  }
4923  closedir(dir);
4924  return result;
4925}
4926
4927// create binary file, rewriting existing file if required
4928int os::create_binary_file(const char* path, bool rewrite_existing) {
4929  int oflags = O_WRONLY | O_CREAT;
4930  if (!rewrite_existing) {
4931    oflags |= O_EXCL;
4932  }
4933  return ::open64(path, oflags, S_IREAD | S_IWRITE);
4934}
4935
4936// return current position of file pointer
4937jlong os::current_file_offset(int fd) {
4938  return (jlong)::lseek64(fd, (off64_t)0, SEEK_CUR);
4939}
4940
4941// move file pointer to the specified offset
4942jlong os::seek_to_file_offset(int fd, jlong offset) {
4943  return (jlong)::lseek64(fd, (off64_t)offset, SEEK_SET);
4944}
4945
4946// Map a block of memory.
4947char* os::map_memory(int fd, const char* file_name, size_t file_offset,
4948                     char *addr, size_t bytes, bool read_only,
4949                     bool allow_exec) {
4950  int prot;
4951  int flags;
4952
4953  if (read_only) {
4954    prot = PROT_READ;
4955    flags = MAP_SHARED;
4956  } else {
4957    prot = PROT_READ | PROT_WRITE;
4958    flags = MAP_PRIVATE;
4959  }
4960
4961  if (allow_exec) {
4962    prot |= PROT_EXEC;
4963  }
4964
4965  if (addr != NULL) {
4966    flags |= MAP_FIXED;
4967  }
4968
4969  char* mapped_address = (char*)mmap(addr, (size_t)bytes, prot, flags,
4970                                     fd, file_offset);
4971  if (mapped_address == MAP_FAILED) {
4972    return NULL;
4973  }
4974  return mapped_address;
4975}
4976
4977
4978// Remap a block of memory.
4979char* os::remap_memory(int fd, const char* file_name, size_t file_offset,
4980                       char *addr, size_t bytes, bool read_only,
4981                       bool allow_exec) {
4982  // same as map_memory() on this OS
4983  return os::map_memory(fd, file_name, file_offset, addr, bytes, read_only,
4984                        allow_exec);
4985}
4986
4987
4988// Unmap a block of memory.
4989bool os::unmap_memory(char* addr, size_t bytes) {
4990  return munmap(addr, bytes) == 0;
4991}
4992
4993void os::pause() {
4994  char filename[MAX_PATH];
4995  if (PauseAtStartupFile && PauseAtStartupFile[0]) {
4996    jio_snprintf(filename, MAX_PATH, PauseAtStartupFile);
4997  } else {
4998    jio_snprintf(filename, MAX_PATH, "./vm.paused.%d", current_process_id());
4999  }
5000
5001  int fd = ::open(filename, O_WRONLY | O_CREAT | O_TRUNC, 0666);
5002  if (fd != -1) {
5003    struct stat buf;
5004    close(fd);
5005    while (::stat(filename, &buf) == 0) {
5006      (void)::poll(NULL, 0, 100);
5007    }
5008  } else {
5009    jio_fprintf(stderr,
5010      "Could not open pause file '%s', continuing immediately.\n", filename);
5011  }
5012}
5013
5014#ifndef PRODUCT
5015#ifdef INTERPOSE_ON_SYSTEM_SYNCH_FUNCTIONS
5016// Turn this on if you need to trace synch operations.
5017// Set RECORD_SYNCH_LIMIT to a large-enough value,
5018// and call record_synch_enable and record_synch_disable
5019// around the computation of interest.
5020
5021void record_synch(char* name, bool returning);  // defined below
5022
5023class RecordSynch {
5024  char* _name;
5025 public:
5026  RecordSynch(char* name) :_name(name)
5027                 { record_synch(_name, false); }
5028  ~RecordSynch() { record_synch(_name,   true);  }
5029};
5030
5031#define CHECK_SYNCH_OP(ret, name, params, args, inner)          \
5032extern "C" ret name params {                                    \
5033  typedef ret name##_t params;                                  \
5034  static name##_t* implem = NULL;                               \
5035  static int callcount = 0;                                     \
5036  if (implem == NULL) {                                         \
5037    implem = (name##_t*) dlsym(RTLD_NEXT, #name);               \
5038    if (implem == NULL)  fatal(dlerror());                      \
5039  }                                                             \
5040  ++callcount;                                                  \
5041  RecordSynch _rs(#name);                                       \
5042  inner;                                                        \
5043  return implem args;                                           \
5044}
5045// in dbx, examine callcounts this way:
5046// for n in $(eval whereis callcount | awk '{print $2}'); do print $n; done
5047
5048#define CHECK_POINTER_OK(p) \
5049  (Universe::perm_gen() == NULL || !Universe::is_reserved_heap((oop)(p)))
5050#define CHECK_MU \
5051  if (!CHECK_POINTER_OK(mu)) fatal("Mutex must be in C heap only.");
5052#define CHECK_CV \
5053  if (!CHECK_POINTER_OK(cv)) fatal("Condvar must be in C heap only.");
5054#define CHECK_P(p) \
5055  if (!CHECK_POINTER_OK(p))  fatal(false,  "Pointer must be in C heap only.");
5056
5057#define CHECK_MUTEX(mutex_op) \
5058CHECK_SYNCH_OP(int, mutex_op, (mutex_t *mu), (mu), CHECK_MU);
5059
5060CHECK_MUTEX(   mutex_lock)
5061CHECK_MUTEX(  _mutex_lock)
5062CHECK_MUTEX( mutex_unlock)
5063CHECK_MUTEX(_mutex_unlock)
5064CHECK_MUTEX( mutex_trylock)
5065CHECK_MUTEX(_mutex_trylock)
5066
5067#define CHECK_COND(cond_op) \
5068CHECK_SYNCH_OP(int, cond_op, (cond_t *cv, mutex_t *mu), (cv, mu), CHECK_MU;CHECK_CV);
5069
5070CHECK_COND( cond_wait);
5071CHECK_COND(_cond_wait);
5072CHECK_COND(_cond_wait_cancel);
5073
5074#define CHECK_COND2(cond_op) \
5075CHECK_SYNCH_OP(int, cond_op, (cond_t *cv, mutex_t *mu, timestruc_t* ts), (cv, mu, ts), CHECK_MU;CHECK_CV);
5076
5077CHECK_COND2( cond_timedwait);
5078CHECK_COND2(_cond_timedwait);
5079CHECK_COND2(_cond_timedwait_cancel);
5080
5081// do the _lwp_* versions too
5082#define mutex_t lwp_mutex_t
5083#define cond_t  lwp_cond_t
5084CHECK_MUTEX(  _lwp_mutex_lock)
5085CHECK_MUTEX(  _lwp_mutex_unlock)
5086CHECK_MUTEX(  _lwp_mutex_trylock)
5087CHECK_MUTEX( __lwp_mutex_lock)
5088CHECK_MUTEX( __lwp_mutex_unlock)
5089CHECK_MUTEX( __lwp_mutex_trylock)
5090CHECK_MUTEX(___lwp_mutex_lock)
5091CHECK_MUTEX(___lwp_mutex_unlock)
5092
5093CHECK_COND(  _lwp_cond_wait);
5094CHECK_COND( __lwp_cond_wait);
5095CHECK_COND(___lwp_cond_wait);
5096
5097CHECK_COND2(  _lwp_cond_timedwait);
5098CHECK_COND2( __lwp_cond_timedwait);
5099#undef mutex_t
5100#undef cond_t
5101
5102CHECK_SYNCH_OP(int, _lwp_suspend2,       (int lwp, int *n), (lwp, n), 0);
5103CHECK_SYNCH_OP(int,__lwp_suspend2,       (int lwp, int *n), (lwp, n), 0);
5104CHECK_SYNCH_OP(int, _lwp_kill,           (int lwp, int n),  (lwp, n), 0);
5105CHECK_SYNCH_OP(int,__lwp_kill,           (int lwp, int n),  (lwp, n), 0);
5106CHECK_SYNCH_OP(int, _lwp_sema_wait,      (lwp_sema_t* p),   (p),  CHECK_P(p));
5107CHECK_SYNCH_OP(int,__lwp_sema_wait,      (lwp_sema_t* p),   (p),  CHECK_P(p));
5108CHECK_SYNCH_OP(int, _lwp_cond_broadcast, (lwp_cond_t* cv),  (cv), CHECK_CV);
5109CHECK_SYNCH_OP(int,__lwp_cond_broadcast, (lwp_cond_t* cv),  (cv), CHECK_CV);
5110
5111
5112// recording machinery:
5113
5114enum { RECORD_SYNCH_LIMIT = 200 };
5115char* record_synch_name[RECORD_SYNCH_LIMIT];
5116void* record_synch_arg0ptr[RECORD_SYNCH_LIMIT];
5117bool record_synch_returning[RECORD_SYNCH_LIMIT];
5118thread_t record_synch_thread[RECORD_SYNCH_LIMIT];
5119int record_synch_count = 0;
5120bool record_synch_enabled = false;
5121
5122// in dbx, examine recorded data this way:
5123// for n in name arg0ptr returning thread; do print record_synch_$n[0..record_synch_count-1]; done
5124
5125void record_synch(char* name, bool returning) {
5126  if (record_synch_enabled) {
5127    if (record_synch_count < RECORD_SYNCH_LIMIT) {
5128      record_synch_name[record_synch_count] = name;
5129      record_synch_returning[record_synch_count] = returning;
5130      record_synch_thread[record_synch_count] = thr_self();
5131      record_synch_arg0ptr[record_synch_count] = &name;
5132      record_synch_count++;
5133    }
5134    // put more checking code here:
5135    // ...
5136  }
5137}
5138
5139void record_synch_enable() {
5140  // start collecting trace data, if not already doing so
5141  if (!record_synch_enabled)  record_synch_count = 0;
5142  record_synch_enabled = true;
5143}
5144
5145void record_synch_disable() {
5146  // stop collecting trace data
5147  record_synch_enabled = false;
5148}
5149
5150#endif // INTERPOSE_ON_SYSTEM_SYNCH_FUNCTIONS
5151#endif // PRODUCT
5152
5153const intptr_t thr_time_off  = (intptr_t)(&((prusage_t *)(NULL))->pr_utime);
5154const intptr_t thr_time_size = (intptr_t)(&((prusage_t *)(NULL))->pr_ttime) -
5155                               (intptr_t)(&((prusage_t *)(NULL))->pr_utime);
5156
5157
5158// JVMTI & JVM monitoring and management support
5159// The thread_cpu_time() and current_thread_cpu_time() are only
5160// supported if is_thread_cpu_time_supported() returns true.
5161// They are not supported on Solaris T1.
5162
5163// current_thread_cpu_time(bool) and thread_cpu_time(Thread*, bool)
5164// are used by JVM M&M and JVMTI to get user+sys or user CPU time
5165// of a thread.
5166//
5167// current_thread_cpu_time() and thread_cpu_time(Thread *)
5168// returns the fast estimate available on the platform.
5169
5170// hrtime_t gethrvtime() return value includes
5171// user time but does not include system time
5172jlong os::current_thread_cpu_time() {
5173  return (jlong) gethrvtime();
5174}
5175
5176jlong os::thread_cpu_time(Thread *thread) {
5177  // return user level CPU time only to be consistent with
5178  // what current_thread_cpu_time returns.
5179  // thread_cpu_time_info() must be changed if this changes
5180  return os::thread_cpu_time(thread, false /* user time only */);
5181}
5182
5183jlong os::current_thread_cpu_time(bool user_sys_cpu_time) {
5184  if (user_sys_cpu_time) {
5185    return os::thread_cpu_time(Thread::current(), user_sys_cpu_time);
5186  } else {
5187    return os::current_thread_cpu_time();
5188  }
5189}
5190
5191jlong os::thread_cpu_time(Thread *thread, bool user_sys_cpu_time) {
5192  char proc_name[64];
5193  int count;
5194  prusage_t prusage;
5195  jlong lwp_time;
5196  int fd;
5197
5198  sprintf(proc_name, "/proc/%d/lwp/%d/lwpusage",
5199                     getpid(),
5200                     thread->osthread()->lwp_id());
5201  fd = open(proc_name, O_RDONLY);
5202  if ( fd == -1 ) return -1;
5203
5204  do {
5205    count = pread(fd,
5206                  (void *)&prusage.pr_utime,
5207                  thr_time_size,
5208                  thr_time_off);
5209  } while (count < 0 && errno == EINTR);
5210  close(fd);
5211  if ( count < 0 ) return -1;
5212
5213  if (user_sys_cpu_time) {
5214    // user + system CPU time
5215    lwp_time = (((jlong)prusage.pr_stime.tv_sec +
5216                 (jlong)prusage.pr_utime.tv_sec) * (jlong)1000000000) +
5217                 (jlong)prusage.pr_stime.tv_nsec +
5218                 (jlong)prusage.pr_utime.tv_nsec;
5219  } else {
5220    // user level CPU time only
5221    lwp_time = ((jlong)prusage.pr_utime.tv_sec * (jlong)1000000000) +
5222                (jlong)prusage.pr_utime.tv_nsec;
5223  }
5224
5225  return(lwp_time);
5226}
5227
5228void os::current_thread_cpu_time_info(jvmtiTimerInfo *info_ptr) {
5229  info_ptr->max_value = ALL_64_BITS;      // will not wrap in less than 64 bits
5230  info_ptr->may_skip_backward = false;    // elapsed time not wall time
5231  info_ptr->may_skip_forward = false;     // elapsed time not wall time
5232  info_ptr->kind = JVMTI_TIMER_USER_CPU;  // only user time is returned
5233}
5234
5235void os::thread_cpu_time_info(jvmtiTimerInfo *info_ptr) {
5236  info_ptr->max_value = ALL_64_BITS;      // will not wrap in less than 64 bits
5237  info_ptr->may_skip_backward = false;    // elapsed time not wall time
5238  info_ptr->may_skip_forward = false;     // elapsed time not wall time
5239  info_ptr->kind = JVMTI_TIMER_USER_CPU;  // only user time is returned
5240}
5241
5242bool os::is_thread_cpu_time_supported() {
5243  if ( os::Solaris::T2_libthread() || UseBoundThreads ) {
5244    return true;
5245  } else {
5246    return false;
5247  }
5248}
5249
5250// System loadavg support.  Returns -1 if load average cannot be obtained.
5251// Return the load average for our processor set if the primitive exists
5252// (Solaris 9 and later).  Otherwise just return system wide loadavg.
5253int os::loadavg(double loadavg[], int nelem) {
5254  if (pset_getloadavg_ptr != NULL) {
5255    return (*pset_getloadavg_ptr)(PS_MYID, loadavg, nelem);
5256  } else {
5257    return ::getloadavg(loadavg, nelem);
5258  }
5259}
5260
5261//---------------------------------------------------------------------------------
5262#ifndef PRODUCT
5263
5264static address same_page(address x, address y) {
5265  intptr_t page_bits = -os::vm_page_size();
5266  if ((intptr_t(x) & page_bits) == (intptr_t(y) & page_bits))
5267    return x;
5268  else if (x > y)
5269    return (address)(intptr_t(y) | ~page_bits) + 1;
5270  else
5271    return (address)(intptr_t(y) & page_bits);
5272}
5273
5274bool os::find(address addr) {
5275  Dl_info dlinfo;
5276  memset(&dlinfo, 0, sizeof(dlinfo));
5277  if (dladdr(addr, &dlinfo)) {
5278#ifdef _LP64
5279    tty->print("0x%016lx: ", addr);
5280#else
5281    tty->print("0x%08x: ", addr);
5282#endif
5283    if (dlinfo.dli_sname != NULL)
5284      tty->print("%s+%#lx", dlinfo.dli_sname, addr-(intptr_t)dlinfo.dli_saddr);
5285    else if (dlinfo.dli_fname)
5286      tty->print("<offset %#lx>", addr-(intptr_t)dlinfo.dli_fbase);
5287    else
5288      tty->print("<absolute address>");
5289    if (dlinfo.dli_fname)  tty->print(" in %s", dlinfo.dli_fname);
5290#ifdef _LP64
5291    if (dlinfo.dli_fbase)  tty->print(" at 0x%016lx", dlinfo.dli_fbase);
5292#else
5293    if (dlinfo.dli_fbase)  tty->print(" at 0x%08x", dlinfo.dli_fbase);
5294#endif
5295    tty->cr();
5296
5297    if (Verbose) {
5298      // decode some bytes around the PC
5299      address begin = same_page(addr-40, addr);
5300      address end   = same_page(addr+40, addr);
5301      address       lowest = (address) dlinfo.dli_sname;
5302      if (!lowest)  lowest = (address) dlinfo.dli_fbase;
5303      if (begin < lowest)  begin = lowest;
5304      Dl_info dlinfo2;
5305      if (dladdr(end, &dlinfo2) && dlinfo2.dli_saddr != dlinfo.dli_saddr
5306          && end > dlinfo2.dli_saddr && dlinfo2.dli_saddr > begin)
5307        end = (address) dlinfo2.dli_saddr;
5308      Disassembler::decode(begin, end);
5309    }
5310    return true;
5311  }
5312  return false;
5313}
5314
5315#endif
5316
5317
5318// Following function has been added to support HotSparc's libjvm.so running
5319// under Solaris production JDK 1.2.2 / 1.3.0.  These came from
5320// src/solaris/hpi/native_threads in the EVM codebase.
5321//
5322// NOTE: This is no longer needed in the 1.3.1 and 1.4 production release
5323// libraries and should thus be removed. We will leave it behind for a while
5324// until we no longer want to able to run on top of 1.3.0 Solaris production
5325// JDK. See 4341971.
5326
5327#define STACK_SLACK 0x800
5328
5329extern "C" {
5330  intptr_t sysThreadAvailableStackWithSlack() {
5331    stack_t st;
5332    intptr_t retval, stack_top;
5333    retval = thr_stksegment(&st);
5334    assert(retval == 0, "incorrect return value from thr_stksegment");
5335    assert((address)&st < (address)st.ss_sp, "Invalid stack base returned");
5336    assert((address)&st > (address)st.ss_sp-st.ss_size, "Invalid stack size returned");
5337    stack_top=(intptr_t)st.ss_sp-st.ss_size;
5338    return ((intptr_t)&stack_top - stack_top - STACK_SLACK);
5339  }
5340}
5341
5342// Just to get the Kernel build to link on solaris for testing.
5343
5344extern "C" {
5345class ASGCT_CallTrace;
5346void AsyncGetCallTrace(ASGCT_CallTrace *trace, jint depth, void* ucontext)
5347  KERNEL_RETURN;
5348}
5349
5350
5351// ObjectMonitor park-unpark infrastructure ...
5352//
5353// We implement Solaris and Linux PlatformEvents with the
5354// obvious condvar-mutex-flag triple.
5355// Another alternative that works quite well is pipes:
5356// Each PlatformEvent consists of a pipe-pair.
5357// The thread associated with the PlatformEvent
5358// calls park(), which reads from the input end of the pipe.
5359// Unpark() writes into the other end of the pipe.
5360// The write-side of the pipe must be set NDELAY.
5361// Unfortunately pipes consume a large # of handles.
5362// Native solaris lwp_park() and lwp_unpark() work nicely, too.
5363// Using pipes for the 1st few threads might be workable, however.
5364//
5365// park() is permitted to return spuriously.
5366// Callers of park() should wrap the call to park() in
5367// an appropriate loop.  A litmus test for the correct
5368// usage of park is the following: if park() were modified
5369// to immediately return 0 your code should still work,
5370// albeit degenerating to a spin loop.
5371//
5372// An interesting optimization for park() is to use a trylock()
5373// to attempt to acquire the mutex.  If the trylock() fails
5374// then we know that a concurrent unpark() operation is in-progress.
5375// in that case the park() code could simply set _count to 0
5376// and return immediately.  The subsequent park() operation *might*
5377// return immediately.  That's harmless as the caller of park() is
5378// expected to loop.  By using trylock() we will have avoided a
5379// avoided a context switch caused by contention on the per-thread mutex.
5380//
5381// TODO-FIXME:
5382// 1.  Reconcile Doug's JSR166 j.u.c park-unpark with the
5383//     objectmonitor implementation.
5384// 2.  Collapse the JSR166 parker event, and the
5385//     objectmonitor ParkEvent into a single "Event" construct.
5386// 3.  In park() and unpark() add:
5387//     assert (Thread::current() == AssociatedWith).
5388// 4.  add spurious wakeup injection on a -XX:EarlyParkReturn=N switch.
5389//     1-out-of-N park() operations will return immediately.
5390//
5391// _Event transitions in park()
5392//   -1 => -1 : illegal
5393//    1 =>  0 : pass - return immediately
5394//    0 => -1 : block
5395//
5396// _Event serves as a restricted-range semaphore.
5397//
5398// Another possible encoding of _Event would be with
5399// explicit "PARKED" == 01b and "SIGNALED" == 10b bits.
5400//
5401// TODO-FIXME: add DTRACE probes for:
5402// 1.   Tx parks
5403// 2.   Ty unparks Tx
5404// 3.   Tx resumes from park
5405
5406
5407// value determined through experimentation
5408#define ROUNDINGFIX 11
5409
5410// utility to compute the abstime argument to timedwait.
5411// TODO-FIXME: switch from compute_abstime() to unpackTime().
5412
5413static timestruc_t* compute_abstime(timestruc_t* abstime, jlong millis) {
5414  // millis is the relative timeout time
5415  // abstime will be the absolute timeout time
5416  if (millis < 0)  millis = 0;
5417  struct timeval now;
5418  int status = gettimeofday(&now, NULL);
5419  assert(status == 0, "gettimeofday");
5420  jlong seconds = millis / 1000;
5421  jlong max_wait_period;
5422
5423  if (UseLWPSynchronization) {
5424    // forward port of fix for 4275818 (not sleeping long enough)
5425    // There was a bug in Solaris 6, 7 and pre-patch 5 of 8 where
5426    // _lwp_cond_timedwait() used a round_down algorithm rather
5427    // than a round_up. For millis less than our roundfactor
5428    // it rounded down to 0 which doesn't meet the spec.
5429    // For millis > roundfactor we may return a bit sooner, but
5430    // since we can not accurately identify the patch level and
5431    // this has already been fixed in Solaris 9 and 8 we will
5432    // leave it alone rather than always rounding down.
5433
5434    if (millis > 0 && millis < ROUNDINGFIX) millis = ROUNDINGFIX;
5435       // It appears that when we go directly through Solaris _lwp_cond_timedwait()
5436           // the acceptable max time threshold is smaller than for libthread on 2.5.1 and 2.6
5437           max_wait_period = 21000000;
5438  } else {
5439    max_wait_period = 50000000;
5440  }
5441  millis %= 1000;
5442  if (seconds > max_wait_period) {      // see man cond_timedwait(3T)
5443     seconds = max_wait_period;
5444  }
5445  abstime->tv_sec = now.tv_sec  + seconds;
5446  long       usec = now.tv_usec + millis * 1000;
5447  if (usec >= 1000000) {
5448    abstime->tv_sec += 1;
5449    usec -= 1000000;
5450  }
5451  abstime->tv_nsec = usec * 1000;
5452  return abstime;
5453}
5454
5455// Test-and-clear _Event, always leaves _Event set to 0, returns immediately.
5456// Conceptually TryPark() should be equivalent to park(0).
5457
5458int os::PlatformEvent::TryPark() {
5459  for (;;) {
5460    const int v = _Event ;
5461    guarantee ((v == 0) || (v == 1), "invariant") ;
5462    if (Atomic::cmpxchg (0, &_Event, v) == v) return v  ;
5463  }
5464}
5465
5466void os::PlatformEvent::park() {           // AKA: down()
5467  // Invariant: Only the thread associated with the Event/PlatformEvent
5468  // may call park().
5469  int v ;
5470  for (;;) {
5471      v = _Event ;
5472      if (Atomic::cmpxchg (v-1, &_Event, v) == v) break ;
5473  }
5474  guarantee (v >= 0, "invariant") ;
5475  if (v == 0) {
5476     // Do this the hard way by blocking ...
5477     // See http://monaco.sfbay/detail.jsf?cr=5094058.
5478     // TODO-FIXME: for Solaris SPARC set fprs.FEF=0 prior to parking.
5479     // Only for SPARC >= V8PlusA
5480#if defined(__sparc) && defined(COMPILER2)
5481     if (ClearFPUAtPark) { _mark_fpu_nosave() ; }
5482#endif
5483     int status = os::Solaris::mutex_lock(_mutex);
5484     assert_status(status == 0, status,  "mutex_lock");
5485     guarantee (_nParked == 0, "invariant") ;
5486     ++ _nParked ;
5487     while (_Event < 0) {
5488        // for some reason, under 2.7 lwp_cond_wait() may return ETIME ...
5489        // Treat this the same as if the wait was interrupted
5490        // With usr/lib/lwp going to kernel, always handle ETIME
5491        status = os::Solaris::cond_wait(_cond, _mutex);
5492        if (status == ETIME) status = EINTR ;
5493        assert_status(status == 0 || status == EINTR, status, "cond_wait");
5494     }
5495     -- _nParked ;
5496     _Event = 0 ;
5497     status = os::Solaris::mutex_unlock(_mutex);
5498     assert_status(status == 0, status, "mutex_unlock");
5499  }
5500}
5501
5502int os::PlatformEvent::park(jlong millis) {
5503  guarantee (_nParked == 0, "invariant") ;
5504  int v ;
5505  for (;;) {
5506      v = _Event ;
5507      if (Atomic::cmpxchg (v-1, &_Event, v) == v) break ;
5508  }
5509  guarantee (v >= 0, "invariant") ;
5510  if (v != 0) return OS_OK ;
5511
5512  int ret = OS_TIMEOUT;
5513  timestruc_t abst;
5514  compute_abstime (&abst, millis);
5515
5516  // See http://monaco.sfbay/detail.jsf?cr=5094058.
5517  // For Solaris SPARC set fprs.FEF=0 prior to parking.
5518  // Only for SPARC >= V8PlusA
5519#if defined(__sparc) && defined(COMPILER2)
5520 if (ClearFPUAtPark) { _mark_fpu_nosave() ; }
5521#endif
5522  int status = os::Solaris::mutex_lock(_mutex);
5523  assert_status(status == 0, status, "mutex_lock");
5524  guarantee (_nParked == 0, "invariant") ;
5525  ++ _nParked ;
5526  while (_Event < 0) {
5527     int status = os::Solaris::cond_timedwait(_cond, _mutex, &abst);
5528     assert_status(status == 0 || status == EINTR ||
5529                   status == ETIME || status == ETIMEDOUT,
5530                   status, "cond_timedwait");
5531     if (!FilterSpuriousWakeups) break ;                // previous semantics
5532     if (status == ETIME || status == ETIMEDOUT) break ;
5533     // We consume and ignore EINTR and spurious wakeups.
5534  }
5535  -- _nParked ;
5536  if (_Event >= 0) ret = OS_OK ;
5537  _Event = 0 ;
5538  status = os::Solaris::mutex_unlock(_mutex);
5539  assert_status(status == 0, status, "mutex_unlock");
5540  return ret;
5541}
5542
5543void os::PlatformEvent::unpark() {
5544  int v, AnyWaiters;
5545
5546  // Increment _Event.
5547  // Another acceptable implementation would be to simply swap 1
5548  // into _Event:
5549  //   if (Swap (&_Event, 1) < 0) {
5550  //      mutex_lock (_mutex) ; AnyWaiters = nParked; mutex_unlock (_mutex) ;
5551  //      if (AnyWaiters) cond_signal (_cond) ;
5552  //   }
5553
5554  for (;;) {
5555    v = _Event ;
5556    if (v > 0) {
5557       // The LD of _Event could have reordered or be satisfied
5558       // by a read-aside from this processor's write buffer.
5559       // To avoid problems execute a barrier and then
5560       // ratify the value.  A degenerate CAS() would also work.
5561       // Viz., CAS (v+0, &_Event, v) == v).
5562       OrderAccess::fence() ;
5563       if (_Event == v) return ;
5564       continue ;
5565    }
5566    if (Atomic::cmpxchg (v+1, &_Event, v) == v) break ;
5567  }
5568
5569  // If the thread associated with the event was parked, wake it.
5570  if (v < 0) {
5571     int status ;
5572     // Wait for the thread assoc with the PlatformEvent to vacate.
5573     status = os::Solaris::mutex_lock(_mutex);
5574     assert_status(status == 0, status, "mutex_lock");
5575     AnyWaiters = _nParked ;
5576     status = os::Solaris::mutex_unlock(_mutex);
5577     assert_status(status == 0, status, "mutex_unlock");
5578     guarantee (AnyWaiters == 0 || AnyWaiters == 1, "invariant") ;
5579     if (AnyWaiters != 0) {
5580       // We intentional signal *after* dropping the lock
5581       // to avoid a common class of futile wakeups.
5582       status = os::Solaris::cond_signal(_cond);
5583       assert_status(status == 0, status, "cond_signal");
5584     }
5585  }
5586}
5587
5588// JSR166
5589// -------------------------------------------------------
5590
5591/*
5592 * The solaris and linux implementations of park/unpark are fairly
5593 * conservative for now, but can be improved. They currently use a
5594 * mutex/condvar pair, plus _counter.
5595 * Park decrements _counter if > 0, else does a condvar wait.  Unpark
5596 * sets count to 1 and signals condvar.  Only one thread ever waits
5597 * on the condvar. Contention seen when trying to park implies that someone
5598 * is unparking you, so don't wait. And spurious returns are fine, so there
5599 * is no need to track notifications.
5600 */
5601
5602#define NANOSECS_PER_SEC 1000000000
5603#define NANOSECS_PER_MILLISEC 1000000
5604#define MAX_SECS 100000000
5605
5606/*
5607 * This code is common to linux and solaris and will be moved to a
5608 * common place in dolphin.
5609 *
5610 * The passed in time value is either a relative time in nanoseconds
5611 * or an absolute time in milliseconds. Either way it has to be unpacked
5612 * into suitable seconds and nanoseconds components and stored in the
5613 * given timespec structure.
5614 * Given time is a 64-bit value and the time_t used in the timespec is only
5615 * a signed-32-bit value (except on 64-bit Linux) we have to watch for
5616 * overflow if times way in the future are given. Further on Solaris versions
5617 * prior to 10 there is a restriction (see cond_timedwait) that the specified
5618 * number of seconds, in abstime, is less than current_time  + 100,000,000.
5619 * As it will be 28 years before "now + 100000000" will overflow we can
5620 * ignore overflow and just impose a hard-limit on seconds using the value
5621 * of "now + 100,000,000". This places a limit on the timeout of about 3.17
5622 * years from "now".
5623 */
5624static void unpackTime(timespec* absTime, bool isAbsolute, jlong time) {
5625  assert (time > 0, "convertTime");
5626
5627  struct timeval now;
5628  int status = gettimeofday(&now, NULL);
5629  assert(status == 0, "gettimeofday");
5630
5631  time_t max_secs = now.tv_sec + MAX_SECS;
5632
5633  if (isAbsolute) {
5634    jlong secs = time / 1000;
5635    if (secs > max_secs) {
5636      absTime->tv_sec = max_secs;
5637    }
5638    else {
5639      absTime->tv_sec = secs;
5640    }
5641    absTime->tv_nsec = (time % 1000) * NANOSECS_PER_MILLISEC;
5642  }
5643  else {
5644    jlong secs = time / NANOSECS_PER_SEC;
5645    if (secs >= MAX_SECS) {
5646      absTime->tv_sec = max_secs;
5647      absTime->tv_nsec = 0;
5648    }
5649    else {
5650      absTime->tv_sec = now.tv_sec + secs;
5651      absTime->tv_nsec = (time % NANOSECS_PER_SEC) + now.tv_usec*1000;
5652      if (absTime->tv_nsec >= NANOSECS_PER_SEC) {
5653        absTime->tv_nsec -= NANOSECS_PER_SEC;
5654        ++absTime->tv_sec; // note: this must be <= max_secs
5655      }
5656    }
5657  }
5658  assert(absTime->tv_sec >= 0, "tv_sec < 0");
5659  assert(absTime->tv_sec <= max_secs, "tv_sec > max_secs");
5660  assert(absTime->tv_nsec >= 0, "tv_nsec < 0");
5661  assert(absTime->tv_nsec < NANOSECS_PER_SEC, "tv_nsec >= nanos_per_sec");
5662}
5663
5664void Parker::park(bool isAbsolute, jlong time) {
5665
5666  // Optional fast-path check:
5667  // Return immediately if a permit is available.
5668  if (_counter > 0) {
5669      _counter = 0 ;
5670      return ;
5671  }
5672
5673  // Optional fast-exit: Check interrupt before trying to wait
5674  Thread* thread = Thread::current();
5675  assert(thread->is_Java_thread(), "Must be JavaThread");
5676  JavaThread *jt = (JavaThread *)thread;
5677  if (Thread::is_interrupted(thread, false)) {
5678    return;
5679  }
5680
5681  // First, demultiplex/decode time arguments
5682  timespec absTime;
5683  if (time < 0) { // don't wait at all
5684    return;
5685  }
5686  if (time > 0) {
5687    // Warning: this code might be exposed to the old Solaris time
5688    // round-down bugs.  Grep "roundingFix" for details.
5689    unpackTime(&absTime, isAbsolute, time);
5690  }
5691
5692  // Enter safepoint region
5693  // Beware of deadlocks such as 6317397.
5694  // The per-thread Parker:: _mutex is a classic leaf-lock.
5695  // In particular a thread must never block on the Threads_lock while
5696  // holding the Parker:: mutex.  If safepoints are pending both the
5697  // the ThreadBlockInVM() CTOR and DTOR may grab Threads_lock.
5698  ThreadBlockInVM tbivm(jt);
5699
5700  // Don't wait if cannot get lock since interference arises from
5701  // unblocking.  Also. check interrupt before trying wait
5702  if (Thread::is_interrupted(thread, false) ||
5703      os::Solaris::mutex_trylock(_mutex) != 0) {
5704    return;
5705  }
5706
5707  int status ;
5708
5709  if (_counter > 0)  { // no wait needed
5710    _counter = 0;
5711    status = os::Solaris::mutex_unlock(_mutex);
5712    assert (status == 0, "invariant") ;
5713    return;
5714  }
5715
5716#ifdef ASSERT
5717  // Don't catch signals while blocked; let the running threads have the signals.
5718  // (This allows a debugger to break into the running thread.)
5719  sigset_t oldsigs;
5720  sigset_t* allowdebug_blocked = os::Solaris::allowdebug_blocked_signals();
5721  thr_sigsetmask(SIG_BLOCK, allowdebug_blocked, &oldsigs);
5722#endif
5723
5724  OSThreadWaitState osts(thread->osthread(), false /* not Object.wait() */);
5725  jt->set_suspend_equivalent();
5726  // cleared by handle_special_suspend_equivalent_condition() or java_suspend_self()
5727
5728  // Do this the hard way by blocking ...
5729  // See http://monaco.sfbay/detail.jsf?cr=5094058.
5730  // TODO-FIXME: for Solaris SPARC set fprs.FEF=0 prior to parking.
5731  // Only for SPARC >= V8PlusA
5732#if defined(__sparc) && defined(COMPILER2)
5733  if (ClearFPUAtPark) { _mark_fpu_nosave() ; }
5734#endif
5735
5736  if (time == 0) {
5737    status = os::Solaris::cond_wait (_cond, _mutex) ;
5738  } else {
5739    status = os::Solaris::cond_timedwait (_cond, _mutex, &absTime);
5740  }
5741  // Note that an untimed cond_wait() can sometimes return ETIME on older
5742  // versions of the Solaris.
5743  assert_status(status == 0 || status == EINTR ||
5744                status == ETIME || status == ETIMEDOUT,
5745                status, "cond_timedwait");
5746
5747#ifdef ASSERT
5748  thr_sigsetmask(SIG_SETMASK, &oldsigs, NULL);
5749#endif
5750  _counter = 0 ;
5751  status = os::Solaris::mutex_unlock(_mutex);
5752  assert_status(status == 0, status, "mutex_unlock") ;
5753
5754  // If externally suspended while waiting, re-suspend
5755  if (jt->handle_special_suspend_equivalent_condition()) {
5756    jt->java_suspend_self();
5757  }
5758
5759}
5760
5761void Parker::unpark() {
5762  int s, status ;
5763  status = os::Solaris::mutex_lock (_mutex) ;
5764  assert (status == 0, "invariant") ;
5765  s = _counter;
5766  _counter = 1;
5767  status = os::Solaris::mutex_unlock (_mutex) ;
5768  assert (status == 0, "invariant") ;
5769
5770  if (s < 1) {
5771    status = os::Solaris::cond_signal (_cond) ;
5772    assert (status == 0, "invariant") ;
5773  }
5774}
5775
5776extern char** environ;
5777
5778// Run the specified command in a separate process. Return its exit value,
5779// or -1 on failure (e.g. can't fork a new process).
5780// Unlike system(), this function can be called from signal handler. It
5781// doesn't block SIGINT et al.
5782int os::fork_and_exec(char* cmd) {
5783  char * argv[4];
5784  argv[0] = (char *)"sh";
5785  argv[1] = (char *)"-c";
5786  argv[2] = cmd;
5787  argv[3] = NULL;
5788
5789  // fork is async-safe, fork1 is not so can't use in signal handler
5790  pid_t pid;
5791  Thread* t = ThreadLocalStorage::get_thread_slow();
5792  if (t != NULL && t->is_inside_signal_handler()) {
5793    pid = fork();
5794  } else {
5795    pid = fork1();
5796  }
5797
5798  if (pid < 0) {
5799    // fork failed
5800    warning("fork failed: %s", strerror(errno));
5801    return -1;
5802
5803  } else if (pid == 0) {
5804    // child process
5805
5806    // try to be consistent with system(), which uses "/usr/bin/sh" on Solaris
5807    execve("/usr/bin/sh", argv, environ);
5808
5809    // execve failed
5810    _exit(-1);
5811
5812  } else  {
5813    // copied from J2SE ..._waitForProcessExit() in UNIXProcess_md.c; we don't
5814    // care about the actual exit code, for now.
5815
5816    int status;
5817
5818    // Wait for the child process to exit.  This returns immediately if
5819    // the child has already exited. */
5820    while (waitpid(pid, &status, 0) < 0) {
5821        switch (errno) {
5822        case ECHILD: return 0;
5823        case EINTR: break;
5824        default: return -1;
5825        }
5826    }
5827
5828    if (WIFEXITED(status)) {
5829       // The child exited normally; get its exit code.
5830       return WEXITSTATUS(status);
5831    } else if (WIFSIGNALED(status)) {
5832       // The child exited because of a signal
5833       // The best value to return is 0x80 + signal number,
5834       // because that is what all Unix shells do, and because
5835       // it allows callers to distinguish between process exit and
5836       // process death by signal.
5837       return 0x80 + WTERMSIG(status);
5838    } else {
5839       // Unknown exit code; pass it through
5840       return status;
5841    }
5842  }
5843}
5844