os_solaris.cpp revision 579:0fbdb4381b99
1/*
2 * Copyright 1997-2009 Sun Microsystems, Inc.  All Rights Reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation.
8 *
9 * This code is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
12 * version 2 for more details (a copy is included in the LICENSE file that
13 * accompanied this code).
14 *
15 * You should have received a copy of the GNU General Public License version
16 * 2 along with this work; if not, write to the Free Software Foundation,
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18 *
19 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
20 * CA 95054 USA or visit www.sun.com if you need additional information or
21 * have any questions.
22 *
23 */
24
25// do not include  precompiled  header file
26# include "incls/_os_solaris.cpp.incl"
27
28// put OS-includes here
29# include <dlfcn.h>
30# include <errno.h>
31# include <link.h>
32# include <poll.h>
33# include <pthread.h>
34# include <pwd.h>
35# include <schedctl.h>
36# include <setjmp.h>
37# include <signal.h>
38# include <stdio.h>
39# include <alloca.h>
40# include <sys/filio.h>
41# include <sys/ipc.h>
42# include <sys/lwp.h>
43# include <sys/machelf.h>     // for elf Sym structure used by dladdr1
44# include <sys/mman.h>
45# include <sys/processor.h>
46# include <sys/procset.h>
47# include <sys/pset.h>
48# include <sys/resource.h>
49# include <sys/shm.h>
50# include <sys/socket.h>
51# include <sys/stat.h>
52# include <sys/systeminfo.h>
53# include <sys/time.h>
54# include <sys/times.h>
55# include <sys/types.h>
56# include <sys/wait.h>
57# include <sys/utsname.h>
58# include <thread.h>
59# include <unistd.h>
60# include <sys/priocntl.h>
61# include <sys/rtpriocntl.h>
62# include <sys/tspriocntl.h>
63# include <sys/iapriocntl.h>
64# include <sys/loadavg.h>
65# include <string.h>
66
67# define _STRUCTURED_PROC 1  //  this gets us the new structured proc interfaces of 5.6 & later
68# include <sys/procfs.h>     //  see comment in <sys/procfs.h>
69
70#define MAX_PATH (2 * K)
71
72// for timer info max values which include all bits
73#define ALL_64_BITS CONST64(0xFFFFFFFFFFFFFFFF)
74
75#ifdef _GNU_SOURCE
76// See bug #6514594
77extern "C" int madvise(caddr_t, size_t, int);
78extern "C"  int memcntl(caddr_t addr, size_t len, int cmd, caddr_t  arg,
79     int attr, int mask);
80#endif //_GNU_SOURCE
81
82/*
83  MPSS Changes Start.
84  The JVM binary needs to be built and run on pre-Solaris 9
85  systems, but the constants needed by MPSS are only in Solaris 9
86  header files.  They are textually replicated here to allow
87  building on earlier systems.  Once building on Solaris 8 is
88  no longer a requirement, these #defines can be replaced by ordinary
89  system .h inclusion.
90
91  In earlier versions of the  JDK and Solaris, we used ISM for large pages.
92  But ISM requires shared memory to achieve this and thus has many caveats.
93  MPSS is a fully transparent and is a cleaner way to get large pages.
94  Although we still require keeping ISM for backward compatiblitiy as well as
95  giving the opportunity to use large pages on older systems it is
96  recommended that MPSS be used for Solaris 9 and above.
97
98*/
99
100#ifndef MC_HAT_ADVISE
101
102struct memcntl_mha {
103  uint_t          mha_cmd;        /* command(s) */
104  uint_t          mha_flags;
105  size_t          mha_pagesize;
106};
107#define MC_HAT_ADVISE   7       /* advise hat map size */
108#define MHA_MAPSIZE_VA  0x1     /* set preferred page size */
109#define MAP_ALIGN       0x200   /* addr specifies alignment */
110
111#endif
112// MPSS Changes End.
113
114
115// Here are some liblgrp types from sys/lgrp_user.h to be able to
116// compile on older systems without this header file.
117
118#ifndef MADV_ACCESS_LWP
119# define  MADV_ACCESS_LWP         7       /* next LWP to access heavily */
120#endif
121#ifndef MADV_ACCESS_MANY
122# define  MADV_ACCESS_MANY        8       /* many processes to access heavily */
123#endif
124
125#ifndef LGRP_RSRC_CPU
126# define LGRP_RSRC_CPU           0       /* CPU resources */
127#endif
128#ifndef LGRP_RSRC_MEM
129# define LGRP_RSRC_MEM           1       /* memory resources */
130#endif
131
132// Some more macros from sys/mman.h that are not present in Solaris 8.
133
134#ifndef MAX_MEMINFO_CNT
135/*
136 * info_req request type definitions for meminfo
137 * request types starting with MEMINFO_V are used for Virtual addresses
138 * and should not be mixed with MEMINFO_PLGRP which is targeted for Physical
139 * addresses
140 */
141# define MEMINFO_SHIFT           16
142# define MEMINFO_MASK            (0xFF << MEMINFO_SHIFT)
143# define MEMINFO_VPHYSICAL       (0x01 << MEMINFO_SHIFT) /* get physical addr */
144# define MEMINFO_VLGRP           (0x02 << MEMINFO_SHIFT) /* get lgroup */
145# define MEMINFO_VPAGESIZE       (0x03 << MEMINFO_SHIFT) /* size of phys page */
146# define MEMINFO_VREPLCNT        (0x04 << MEMINFO_SHIFT) /* no. of replica */
147# define MEMINFO_VREPL           (0x05 << MEMINFO_SHIFT) /* physical replica */
148# define MEMINFO_VREPL_LGRP      (0x06 << MEMINFO_SHIFT) /* lgrp of replica */
149# define MEMINFO_PLGRP           (0x07 << MEMINFO_SHIFT) /* lgroup for paddr */
150
151/* maximum number of addresses meminfo() can process at a time */
152# define MAX_MEMINFO_CNT 256
153
154/* maximum number of request types */
155# define MAX_MEMINFO_REQ 31
156#endif
157
158// see thr_setprio(3T) for the basis of these numbers
159#define MinimumPriority 0
160#define NormalPriority  64
161#define MaximumPriority 127
162
163// Values for ThreadPriorityPolicy == 1
164int prio_policy1[MaxPriority+1] = { -99999, 0, 16, 32, 48, 64,
165                                        80, 96, 112, 124, 127 };
166
167// System parameters used internally
168static clock_t clock_tics_per_sec = 100;
169
170// For diagnostics to print a message once. see run_periodic_checks
171static bool check_addr0_done = false;
172static sigset_t check_signal_done;
173static bool check_signals = true;
174
175address os::Solaris::handler_start;  // start pc of thr_sighndlrinfo
176address os::Solaris::handler_end;    // end pc of thr_sighndlrinfo
177
178address os::Solaris::_main_stack_base = NULL;  // 4352906 workaround
179
180
181// "default" initializers for missing libc APIs
182extern "C" {
183  static int lwp_mutex_init(mutex_t *mx, int scope, void *arg) { memset(mx, 0, sizeof(mutex_t)); return 0; }
184  static int lwp_mutex_destroy(mutex_t *mx)                 { return 0; }
185
186  static int lwp_cond_init(cond_t *cv, int scope, void *arg){ memset(cv, 0, sizeof(cond_t)); return 0; }
187  static int lwp_cond_destroy(cond_t *cv)                   { return 0; }
188}
189
190// "default" initializers for pthread-based synchronization
191extern "C" {
192  static int pthread_mutex_default_init(mutex_t *mx, int scope, void *arg) { memset(mx, 0, sizeof(mutex_t)); return 0; }
193  static int pthread_cond_default_init(cond_t *cv, int scope, void *arg){ memset(cv, 0, sizeof(cond_t)); return 0; }
194}
195
196// Thread Local Storage
197// This is common to all Solaris platforms so it is defined here,
198// in this common file.
199// The declarations are in the os_cpu threadLS*.hpp files.
200//
201// Static member initialization for TLS
202Thread* ThreadLocalStorage::_get_thread_cache[ThreadLocalStorage::_pd_cache_size] = {NULL};
203
204#ifndef PRODUCT
205#define _PCT(n,d)       ((100.0*(double)(n))/(double)(d))
206
207int ThreadLocalStorage::_tcacheHit = 0;
208int ThreadLocalStorage::_tcacheMiss = 0;
209
210void ThreadLocalStorage::print_statistics() {
211  int total = _tcacheMiss+_tcacheHit;
212  tty->print_cr("Thread cache hits %d misses %d total %d percent %f\n",
213                _tcacheHit, _tcacheMiss, total, _PCT(_tcacheHit, total));
214}
215#undef _PCT
216#endif // PRODUCT
217
218Thread* ThreadLocalStorage::get_thread_via_cache_slowly(uintptr_t raw_id,
219                                                        int index) {
220  Thread *thread = get_thread_slow();
221  if (thread != NULL) {
222    address sp = os::current_stack_pointer();
223    guarantee(thread->_stack_base == NULL ||
224              (sp <= thread->_stack_base &&
225                 sp >= thread->_stack_base - thread->_stack_size) ||
226               is_error_reported(),
227              "sp must be inside of selected thread stack");
228
229    thread->_self_raw_id = raw_id;  // mark for quick retrieval
230    _get_thread_cache[ index ] = thread;
231  }
232  return thread;
233}
234
235
236static const double all_zero[ sizeof(Thread) / sizeof(double) + 1 ] = {0};
237#define NO_CACHED_THREAD ((Thread*)all_zero)
238
239void ThreadLocalStorage::pd_set_thread(Thread* thread) {
240
241  // Store the new value before updating the cache to prevent a race
242  // between get_thread_via_cache_slowly() and this store operation.
243  os::thread_local_storage_at_put(ThreadLocalStorage::thread_index(), thread);
244
245  // Update thread cache with new thread if setting on thread create,
246  // or NO_CACHED_THREAD (zeroed) thread if resetting thread on exit.
247  uintptr_t raw = pd_raw_thread_id();
248  int ix = pd_cache_index(raw);
249  _get_thread_cache[ix] = thread == NULL ? NO_CACHED_THREAD : thread;
250}
251
252void ThreadLocalStorage::pd_init() {
253  for (int i = 0; i < _pd_cache_size; i++) {
254    _get_thread_cache[i] = NO_CACHED_THREAD;
255  }
256}
257
258// Invalidate all the caches (happens to be the same as pd_init).
259void ThreadLocalStorage::pd_invalidate_all() { pd_init(); }
260
261#undef NO_CACHED_THREAD
262
263// END Thread Local Storage
264
265static inline size_t adjust_stack_size(address base, size_t size) {
266  if ((ssize_t)size < 0) {
267    // 4759953: Compensate for ridiculous stack size.
268    size = max_intx;
269  }
270  if (size > (size_t)base) {
271    // 4812466: Make sure size doesn't allow the stack to wrap the address space.
272    size = (size_t)base;
273  }
274  return size;
275}
276
277static inline stack_t get_stack_info() {
278  stack_t st;
279  int retval = thr_stksegment(&st);
280  st.ss_size = adjust_stack_size((address)st.ss_sp, st.ss_size);
281  assert(retval == 0, "incorrect return value from thr_stksegment");
282  assert((address)&st < (address)st.ss_sp, "Invalid stack base returned");
283  assert((address)&st > (address)st.ss_sp-st.ss_size, "Invalid stack size returned");
284  return st;
285}
286
287address os::current_stack_base() {
288  int r = thr_main() ;
289  guarantee (r == 0 || r == 1, "CR6501650 or CR6493689") ;
290  bool is_primordial_thread = r;
291
292  // Workaround 4352906, avoid calls to thr_stksegment by
293  // thr_main after the first one (it looks like we trash
294  // some data, causing the value for ss_sp to be incorrect).
295  if (!is_primordial_thread || os::Solaris::_main_stack_base == NULL) {
296    stack_t st = get_stack_info();
297    if (is_primordial_thread) {
298      // cache initial value of stack base
299      os::Solaris::_main_stack_base = (address)st.ss_sp;
300    }
301    return (address)st.ss_sp;
302  } else {
303    guarantee(os::Solaris::_main_stack_base != NULL, "Attempt to use null cached stack base");
304    return os::Solaris::_main_stack_base;
305  }
306}
307
308size_t os::current_stack_size() {
309  size_t size;
310
311  int r = thr_main() ;
312  guarantee (r == 0 || r == 1, "CR6501650 or CR6493689") ;
313  if(!r) {
314    size = get_stack_info().ss_size;
315  } else {
316    struct rlimit limits;
317    getrlimit(RLIMIT_STACK, &limits);
318    size = adjust_stack_size(os::Solaris::_main_stack_base, (size_t)limits.rlim_cur);
319  }
320  // base may not be page aligned
321  address base = current_stack_base();
322  address bottom = (address)align_size_up((intptr_t)(base - size), os::vm_page_size());;
323  return (size_t)(base - bottom);
324}
325
326struct tm* os::localtime_pd(const time_t* clock, struct tm*  res) {
327  return localtime_r(clock, res);
328}
329
330// interruptible infrastructure
331
332// setup_interruptible saves the thread state before going into an
333// interruptible system call.
334// The saved state is used to restore the thread to
335// its former state whether or not an interrupt is received.
336// Used by classloader os::read
337// hpi calls skip this layer and stay in _thread_in_native
338
339void os::Solaris::setup_interruptible(JavaThread* thread) {
340
341  JavaThreadState thread_state = thread->thread_state();
342
343  assert(thread_state != _thread_blocked, "Coming from the wrong thread");
344  assert(thread_state != _thread_in_native, "Native threads skip setup_interruptible");
345  OSThread* osthread = thread->osthread();
346  osthread->set_saved_interrupt_thread_state(thread_state);
347  thread->frame_anchor()->make_walkable(thread);
348  ThreadStateTransition::transition(thread, thread_state, _thread_blocked);
349}
350
351// Version of setup_interruptible() for threads that are already in
352// _thread_blocked. Used by os_sleep().
353void os::Solaris::setup_interruptible_already_blocked(JavaThread* thread) {
354  thread->frame_anchor()->make_walkable(thread);
355}
356
357JavaThread* os::Solaris::setup_interruptible() {
358  JavaThread* thread = (JavaThread*)ThreadLocalStorage::thread();
359  setup_interruptible(thread);
360  return thread;
361}
362
363void os::Solaris::try_enable_extended_io() {
364  typedef int (*enable_extended_FILE_stdio_t)(int, int);
365
366  if (!UseExtendedFileIO) {
367    return;
368  }
369
370  enable_extended_FILE_stdio_t enabler =
371    (enable_extended_FILE_stdio_t) dlsym(RTLD_DEFAULT,
372                                         "enable_extended_FILE_stdio");
373  if (enabler) {
374    enabler(-1, -1);
375  }
376}
377
378
379#ifdef ASSERT
380
381JavaThread* os::Solaris::setup_interruptible_native() {
382  JavaThread* thread = (JavaThread*)ThreadLocalStorage::thread();
383  JavaThreadState thread_state = thread->thread_state();
384  assert(thread_state == _thread_in_native, "Assumed thread_in_native");
385  return thread;
386}
387
388void os::Solaris::cleanup_interruptible_native(JavaThread* thread) {
389  JavaThreadState thread_state = thread->thread_state();
390  assert(thread_state == _thread_in_native, "Assumed thread_in_native");
391}
392#endif
393
394// cleanup_interruptible reverses the effects of setup_interruptible
395// setup_interruptible_already_blocked() does not need any cleanup.
396
397void os::Solaris::cleanup_interruptible(JavaThread* thread) {
398  OSThread* osthread = thread->osthread();
399
400  ThreadStateTransition::transition(thread, _thread_blocked, osthread->saved_interrupt_thread_state());
401}
402
403// I/O interruption related counters called in _INTERRUPTIBLE
404
405void os::Solaris::bump_interrupted_before_count() {
406  RuntimeService::record_interrupted_before_count();
407}
408
409void os::Solaris::bump_interrupted_during_count() {
410  RuntimeService::record_interrupted_during_count();
411}
412
413static int _processors_online = 0;
414
415         jint os::Solaris::_os_thread_limit = 0;
416volatile jint os::Solaris::_os_thread_count = 0;
417
418julong os::available_memory() {
419  return Solaris::available_memory();
420}
421
422julong os::Solaris::available_memory() {
423  return (julong)sysconf(_SC_AVPHYS_PAGES) * os::vm_page_size();
424}
425
426julong os::Solaris::_physical_memory = 0;
427
428julong os::physical_memory() {
429   return Solaris::physical_memory();
430}
431
432julong os::allocatable_physical_memory(julong size) {
433#ifdef _LP64
434   return size;
435#else
436   julong result = MIN2(size, (julong)3835*M);
437   if (!is_allocatable(result)) {
438     // Memory allocations will be aligned but the alignment
439     // is not known at this point.  Alignments will
440     // be at most to LargePageSizeInBytes.  Protect
441     // allocations from alignments up to illegal
442     // values. If at this point 2G is illegal.
443     julong reasonable_size = (julong)2*G - 2 * LargePageSizeInBytes;
444     result =  MIN2(size, reasonable_size);
445   }
446   return result;
447#endif
448}
449
450static hrtime_t first_hrtime = 0;
451static const hrtime_t hrtime_hz = 1000*1000*1000;
452const int LOCK_BUSY = 1;
453const int LOCK_FREE = 0;
454const int LOCK_INVALID = -1;
455static volatile hrtime_t max_hrtime = 0;
456static volatile int max_hrtime_lock = LOCK_FREE;     // Update counter with LSB as lock-in-progress
457
458
459void os::Solaris::initialize_system_info() {
460  _processor_count = sysconf(_SC_NPROCESSORS_CONF);
461  _processors_online = sysconf (_SC_NPROCESSORS_ONLN);
462  _physical_memory = (julong)sysconf(_SC_PHYS_PAGES) * (julong)sysconf(_SC_PAGESIZE);
463}
464
465int os::active_processor_count() {
466  int online_cpus = sysconf(_SC_NPROCESSORS_ONLN);
467  pid_t pid = getpid();
468  psetid_t pset = PS_NONE;
469  // Are we running in a processor set or is there any processor set around?
470  if (pset_bind(PS_QUERY, P_PID, pid, &pset) == 0) {
471    uint_t pset_cpus;
472    // Query the number of cpus available to us.
473    if (pset_info(pset, NULL, &pset_cpus, NULL) == 0) {
474      assert(pset_cpus > 0 && pset_cpus <= online_cpus, "sanity check");
475      _processors_online = pset_cpus;
476      return pset_cpus;
477    }
478  }
479  // Otherwise return number of online cpus
480  return online_cpus;
481}
482
483static bool find_processors_in_pset(psetid_t        pset,
484                                    processorid_t** id_array,
485                                    uint_t*         id_length) {
486  bool result = false;
487  // Find the number of processors in the processor set.
488  if (pset_info(pset, NULL, id_length, NULL) == 0) {
489    // Make up an array to hold their ids.
490    *id_array = NEW_C_HEAP_ARRAY(processorid_t, *id_length);
491    // Fill in the array with their processor ids.
492    if (pset_info(pset, NULL, id_length, *id_array) == 0) {
493      result = true;
494    }
495  }
496  return result;
497}
498
499// Callers of find_processors_online() must tolerate imprecise results --
500// the system configuration can change asynchronously because of DR
501// or explicit psradm operations.
502//
503// We also need to take care that the loop (below) terminates as the
504// number of processors online can change between the _SC_NPROCESSORS_ONLN
505// request and the loop that builds the list of processor ids.   Unfortunately
506// there's no reliable way to determine the maximum valid processor id,
507// so we use a manifest constant, MAX_PROCESSOR_ID, instead.  See p_online
508// man pages, which claim the processor id set is "sparse, but
509// not too sparse".  MAX_PROCESSOR_ID is used to ensure that we eventually
510// exit the loop.
511//
512// In the future we'll be able to use sysconf(_SC_CPUID_MAX), but that's
513// not available on S8.0.
514
515static bool find_processors_online(processorid_t** id_array,
516                                   uint*           id_length) {
517  const processorid_t MAX_PROCESSOR_ID = 100000 ;
518  // Find the number of processors online.
519  *id_length = sysconf(_SC_NPROCESSORS_ONLN);
520  // Make up an array to hold their ids.
521  *id_array = NEW_C_HEAP_ARRAY(processorid_t, *id_length);
522  // Processors need not be numbered consecutively.
523  long found = 0;
524  processorid_t next = 0;
525  while (found < *id_length && next < MAX_PROCESSOR_ID) {
526    processor_info_t info;
527    if (processor_info(next, &info) == 0) {
528      // NB, PI_NOINTR processors are effectively online ...
529      if (info.pi_state == P_ONLINE || info.pi_state == P_NOINTR) {
530        (*id_array)[found] = next;
531        found += 1;
532      }
533    }
534    next += 1;
535  }
536  if (found < *id_length) {
537      // The loop above didn't identify the expected number of processors.
538      // We could always retry the operation, calling sysconf(_SC_NPROCESSORS_ONLN)
539      // and re-running the loop, above, but there's no guarantee of progress
540      // if the system configuration is in flux.  Instead, we just return what
541      // we've got.  Note that in the worst case find_processors_online() could
542      // return an empty set.  (As a fall-back in the case of the empty set we
543      // could just return the ID of the current processor).
544      *id_length = found ;
545  }
546
547  return true;
548}
549
550static bool assign_distribution(processorid_t* id_array,
551                                uint           id_length,
552                                uint*          distribution,
553                                uint           distribution_length) {
554  // We assume we can assign processorid_t's to uint's.
555  assert(sizeof(processorid_t) == sizeof(uint),
556         "can't convert processorid_t to uint");
557  // Quick check to see if we won't succeed.
558  if (id_length < distribution_length) {
559    return false;
560  }
561  // Assign processor ids to the distribution.
562  // Try to shuffle processors to distribute work across boards,
563  // assuming 4 processors per board.
564  const uint processors_per_board = ProcessDistributionStride;
565  // Find the maximum processor id.
566  processorid_t max_id = 0;
567  for (uint m = 0; m < id_length; m += 1) {
568    max_id = MAX2(max_id, id_array[m]);
569  }
570  // The next id, to limit loops.
571  const processorid_t limit_id = max_id + 1;
572  // Make up markers for available processors.
573  bool* available_id = NEW_C_HEAP_ARRAY(bool, limit_id);
574  for (uint c = 0; c < limit_id; c += 1) {
575    available_id[c] = false;
576  }
577  for (uint a = 0; a < id_length; a += 1) {
578    available_id[id_array[a]] = true;
579  }
580  // Step by "boards", then by "slot", copying to "assigned".
581  // NEEDS_CLEANUP: The assignment of processors should be stateful,
582  //                remembering which processors have been assigned by
583  //                previous calls, etc., so as to distribute several
584  //                independent calls of this method.  What we'd like is
585  //                It would be nice to have an API that let us ask
586  //                how many processes are bound to a processor,
587  //                but we don't have that, either.
588  //                In the short term, "board" is static so that
589  //                subsequent distributions don't all start at board 0.
590  static uint board = 0;
591  uint assigned = 0;
592  // Until we've found enough processors ....
593  while (assigned < distribution_length) {
594    // ... find the next available processor in the board.
595    for (uint slot = 0; slot < processors_per_board; slot += 1) {
596      uint try_id = board * processors_per_board + slot;
597      if ((try_id < limit_id) && (available_id[try_id] == true)) {
598        distribution[assigned] = try_id;
599        available_id[try_id] = false;
600        assigned += 1;
601        break;
602      }
603    }
604    board += 1;
605    if (board * processors_per_board + 0 >= limit_id) {
606      board = 0;
607    }
608  }
609  if (available_id != NULL) {
610    FREE_C_HEAP_ARRAY(bool, available_id);
611  }
612  return true;
613}
614
615bool os::distribute_processes(uint length, uint* distribution) {
616  bool result = false;
617  // Find the processor id's of all the available CPUs.
618  processorid_t* id_array  = NULL;
619  uint           id_length = 0;
620  // There are some races between querying information and using it,
621  // since processor sets can change dynamically.
622  psetid_t pset = PS_NONE;
623  // Are we running in a processor set?
624  if ((pset_bind(PS_QUERY, P_PID, P_MYID, &pset) == 0) && pset != PS_NONE) {
625    result = find_processors_in_pset(pset, &id_array, &id_length);
626  } else {
627    result = find_processors_online(&id_array, &id_length);
628  }
629  if (result == true) {
630    if (id_length >= length) {
631      result = assign_distribution(id_array, id_length, distribution, length);
632    } else {
633      result = false;
634    }
635  }
636  if (id_array != NULL) {
637    FREE_C_HEAP_ARRAY(processorid_t, id_array);
638  }
639  return result;
640}
641
642bool os::bind_to_processor(uint processor_id) {
643  // We assume that a processorid_t can be stored in a uint.
644  assert(sizeof(uint) == sizeof(processorid_t),
645         "can't convert uint to processorid_t");
646  int bind_result =
647    processor_bind(P_LWPID,                       // bind LWP.
648                   P_MYID,                        // bind current LWP.
649                   (processorid_t) processor_id,  // id.
650                   NULL);                         // don't return old binding.
651  return (bind_result == 0);
652}
653
654bool os::getenv(const char* name, char* buffer, int len) {
655  char* val = ::getenv( name );
656  if ( val == NULL
657  ||   strlen(val) + 1  >  len ) {
658    if (len > 0)  buffer[0] = 0; // return a null string
659    return false;
660  }
661  strcpy( buffer, val );
662  return true;
663}
664
665
666// Return true if user is running as root.
667
668bool os::have_special_privileges() {
669  static bool init = false;
670  static bool privileges = false;
671  if (!init) {
672    privileges = (getuid() != geteuid()) || (getgid() != getegid());
673    init = true;
674  }
675  return privileges;
676}
677
678
679static char* get_property(char* name, char* buffer, int buffer_size) {
680  if (os::getenv(name, buffer, buffer_size)) {
681    return buffer;
682  }
683  static char empty[] = "";
684  return empty;
685}
686
687
688void os::init_system_properties_values() {
689  char arch[12];
690  sysinfo(SI_ARCHITECTURE, arch, sizeof(arch));
691
692  // The next steps are taken in the product version:
693  //
694  // Obtain the JAVA_HOME value from the location of libjvm[_g].so.
695  // This library should be located at:
696  // <JAVA_HOME>/jre/lib/<arch>/{client|server}/libjvm[_g].so.
697  //
698  // If "/jre/lib/" appears at the right place in the path, then we
699  // assume libjvm[_g].so is installed in a JDK and we use this path.
700  //
701  // Otherwise exit with message: "Could not create the Java virtual machine."
702  //
703  // The following extra steps are taken in the debugging version:
704  //
705  // If "/jre/lib/" does NOT appear at the right place in the path
706  // instead of exit check for $JAVA_HOME environment variable.
707  //
708  // If it is defined and we are able to locate $JAVA_HOME/jre/lib/<arch>,
709  // then we append a fake suffix "hotspot/libjvm[_g].so" to this path so
710  // it looks like libjvm[_g].so is installed there
711  // <JAVA_HOME>/jre/lib/<arch>/hotspot/libjvm[_g].so.
712  //
713  // Otherwise exit.
714  //
715  // Important note: if the location of libjvm.so changes this
716  // code needs to be changed accordingly.
717
718  // The next few definitions allow the code to be verbatim:
719#define malloc(n) (char*)NEW_C_HEAP_ARRAY(char, (n))
720#define free(p) FREE_C_HEAP_ARRAY(char, p)
721#define getenv(n) ::getenv(n)
722
723#define EXTENSIONS_DIR  "/lib/ext"
724#define ENDORSED_DIR    "/lib/endorsed"
725#define COMMON_DIR      "/usr/jdk/packages"
726
727  {
728    /* sysclasspath, java_home, dll_dir */
729    {
730        char *home_path;
731        char *dll_path;
732        char *pslash;
733        char buf[MAXPATHLEN];
734        os::jvm_path(buf, sizeof(buf));
735
736        // Found the full path to libjvm.so.
737        // Now cut the path to <java_home>/jre if we can.
738        *(strrchr(buf, '/')) = '\0';  /* get rid of /libjvm.so */
739        pslash = strrchr(buf, '/');
740        if (pslash != NULL)
741            *pslash = '\0';           /* get rid of /{client|server|hotspot} */
742        dll_path = malloc(strlen(buf) + 1);
743        if (dll_path == NULL)
744            return;
745        strcpy(dll_path, buf);
746        Arguments::set_dll_dir(dll_path);
747
748        if (pslash != NULL) {
749            pslash = strrchr(buf, '/');
750            if (pslash != NULL) {
751                *pslash = '\0';       /* get rid of /<arch> */
752                pslash = strrchr(buf, '/');
753                if (pslash != NULL)
754                    *pslash = '\0';   /* get rid of /lib */
755            }
756        }
757
758        home_path = malloc(strlen(buf) + 1);
759        if (home_path == NULL)
760            return;
761        strcpy(home_path, buf);
762        Arguments::set_java_home(home_path);
763
764        if (!set_boot_path('/', ':'))
765            return;
766    }
767
768    /*
769     * Where to look for native libraries
770     */
771    {
772      // Use dlinfo() to determine the correct java.library.path.
773      //
774      // If we're launched by the Java launcher, and the user
775      // does not set java.library.path explicitly on the commandline,
776      // the Java launcher sets LD_LIBRARY_PATH for us and unsets
777      // LD_LIBRARY_PATH_32 and LD_LIBRARY_PATH_64.  In this case
778      // dlinfo returns LD_LIBRARY_PATH + crle settings (including
779      // /usr/lib), which is exactly what we want.
780      //
781      // If the user does set java.library.path, it completely
782      // overwrites this setting, and always has.
783      //
784      // If we're not launched by the Java launcher, we may
785      // get here with any/all of the LD_LIBRARY_PATH[_32|64]
786      // settings.  Again, dlinfo does exactly what we want.
787
788      Dl_serinfo     _info, *info = &_info;
789      Dl_serpath     *path;
790      char*          library_path;
791      char           *common_path;
792      int            i;
793
794      // determine search path count and required buffer size
795      if (dlinfo(RTLD_SELF, RTLD_DI_SERINFOSIZE, (void *)info) == -1) {
796        vm_exit_during_initialization("dlinfo SERINFOSIZE request", dlerror());
797      }
798
799      // allocate new buffer and initialize
800      info = (Dl_serinfo*)malloc(_info.dls_size);
801      if (info == NULL) {
802        vm_exit_out_of_memory(_info.dls_size,
803                              "init_system_properties_values info");
804      }
805      info->dls_size = _info.dls_size;
806      info->dls_cnt = _info.dls_cnt;
807
808      // obtain search path information
809      if (dlinfo(RTLD_SELF, RTLD_DI_SERINFO, (void *)info) == -1) {
810        free(info);
811        vm_exit_during_initialization("dlinfo SERINFO request", dlerror());
812      }
813
814      path = &info->dls_serpath[0];
815
816      // Note: Due to a legacy implementation, most of the library path
817      // is set in the launcher.  This was to accomodate linking restrictions
818      // on legacy Solaris implementations (which are no longer supported).
819      // Eventually, all the library path setting will be done here.
820      //
821      // However, to prevent the proliferation of improperly built native
822      // libraries, the new path component /usr/jdk/packages is added here.
823
824      // Determine the actual CPU architecture.
825      char cpu_arch[12];
826      sysinfo(SI_ARCHITECTURE, cpu_arch, sizeof(cpu_arch));
827#ifdef _LP64
828      // If we are a 64-bit vm, perform the following translations:
829      //   sparc   -> sparcv9
830      //   i386    -> amd64
831      if (strcmp(cpu_arch, "sparc") == 0)
832        strcat(cpu_arch, "v9");
833      else if (strcmp(cpu_arch, "i386") == 0)
834        strcpy(cpu_arch, "amd64");
835#endif
836
837      // Construct the invariant part of ld_library_path. Note that the
838      // space for the colon and the trailing null are provided by the
839      // nulls included by the sizeof operator.
840      size_t bufsize = sizeof(COMMON_DIR) + sizeof("/lib/") + strlen(cpu_arch);
841      common_path = malloc(bufsize);
842      if (common_path == NULL) {
843        free(info);
844        vm_exit_out_of_memory(bufsize,
845                              "init_system_properties_values common_path");
846      }
847      sprintf(common_path, COMMON_DIR "/lib/%s", cpu_arch);
848
849      // struct size is more than sufficient for the path components obtained
850      // through the dlinfo() call, so only add additional space for the path
851      // components explicitly added here.
852      bufsize = info->dls_size + strlen(common_path);
853      library_path = malloc(bufsize);
854      if (library_path == NULL) {
855        free(info);
856        free(common_path);
857        vm_exit_out_of_memory(bufsize,
858                              "init_system_properties_values library_path");
859      }
860      library_path[0] = '\0';
861
862      // Construct the desired Java library path from the linker's library
863      // search path.
864      //
865      // For compatibility, it is optimal that we insert the additional path
866      // components specific to the Java VM after those components specified
867      // in LD_LIBRARY_PATH (if any) but before those added by the ld.so
868      // infrastructure.
869      if (info->dls_cnt == 0) { // Not sure this can happen, but allow for it
870        strcpy(library_path, common_path);
871      } else {
872        int inserted = 0;
873        for (i = 0; i < info->dls_cnt; i++, path++) {
874          uint_t flags = path->dls_flags & LA_SER_MASK;
875          if (((flags & LA_SER_LIBPATH) == 0) && !inserted) {
876            strcat(library_path, common_path);
877            strcat(library_path, os::path_separator());
878            inserted = 1;
879          }
880          strcat(library_path, path->dls_name);
881          strcat(library_path, os::path_separator());
882        }
883        // eliminate trailing path separator
884        library_path[strlen(library_path)-1] = '\0';
885      }
886
887      // happens before argument parsing - can't use a trace flag
888      // tty->print_raw("init_system_properties_values: native lib path: ");
889      // tty->print_raw_cr(library_path);
890
891      // callee copies into its own buffer
892      Arguments::set_library_path(library_path);
893
894      free(common_path);
895      free(library_path);
896      free(info);
897    }
898
899    /*
900     * Extensions directories.
901     *
902     * Note that the space for the colon and the trailing null are provided
903     * by the nulls included by the sizeof operator (so actually one byte more
904     * than necessary is allocated).
905     */
906    {
907        char *buf = (char *) malloc(strlen(Arguments::get_java_home()) +
908            sizeof(EXTENSIONS_DIR) + sizeof(COMMON_DIR) +
909            sizeof(EXTENSIONS_DIR));
910        sprintf(buf, "%s" EXTENSIONS_DIR ":" COMMON_DIR EXTENSIONS_DIR,
911            Arguments::get_java_home());
912        Arguments::set_ext_dirs(buf);
913    }
914
915    /* Endorsed standards default directory. */
916    {
917        char * buf = malloc(strlen(Arguments::get_java_home()) + sizeof(ENDORSED_DIR));
918        sprintf(buf, "%s" ENDORSED_DIR, Arguments::get_java_home());
919        Arguments::set_endorsed_dirs(buf);
920    }
921  }
922
923#undef malloc
924#undef free
925#undef getenv
926#undef EXTENSIONS_DIR
927#undef ENDORSED_DIR
928#undef COMMON_DIR
929
930}
931
932void os::breakpoint() {
933  BREAKPOINT;
934}
935
936bool os::obsolete_option(const JavaVMOption *option)
937{
938  if (!strncmp(option->optionString, "-Xt", 3)) {
939    return true;
940  } else if (!strncmp(option->optionString, "-Xtm", 4)) {
941    return true;
942  } else if (!strncmp(option->optionString, "-Xverifyheap", 12)) {
943    return true;
944  } else if (!strncmp(option->optionString, "-Xmaxjitcodesize", 16)) {
945    return true;
946  }
947  return false;
948}
949
950bool os::Solaris::valid_stack_address(Thread* thread, address sp) {
951  address  stackStart  = (address)thread->stack_base();
952  address  stackEnd    = (address)(stackStart - (address)thread->stack_size());
953  if (sp < stackStart && sp >= stackEnd ) return true;
954  return false;
955}
956
957extern "C" void breakpoint() {
958  // use debugger to set breakpoint here
959}
960
961// Returns an estimate of the current stack pointer. Result must be guaranteed to
962// point into the calling threads stack, and be no lower than the current stack
963// pointer.
964address os::current_stack_pointer() {
965  volatile int dummy;
966  address sp = (address)&dummy + 8;     // %%%% need to confirm if this is right
967  return sp;
968}
969
970static thread_t main_thread;
971
972// Thread start routine for all new Java threads
973extern "C" void* java_start(void* thread_addr) {
974  // Try to randomize the cache line index of hot stack frames.
975  // This helps when threads of the same stack traces evict each other's
976  // cache lines. The threads can be either from the same JVM instance, or
977  // from different JVM instances. The benefit is especially true for
978  // processors with hyperthreading technology.
979  static int counter = 0;
980  int pid = os::current_process_id();
981  alloca(((pid ^ counter++) & 7) * 128);
982
983  int prio;
984  Thread* thread = (Thread*)thread_addr;
985  OSThread* osthr = thread->osthread();
986
987  osthr->set_lwp_id( _lwp_self() );  // Store lwp in case we are bound
988  thread->_schedctl = (void *) schedctl_init () ;
989
990  if (UseNUMA) {
991    int lgrp_id = os::numa_get_group_id();
992    if (lgrp_id != -1) {
993      thread->set_lgrp_id(lgrp_id);
994    }
995  }
996
997  // If the creator called set priority before we started,
998  // we need to call set priority now that we have an lwp.
999  // Get the priority from libthread and set the priority
1000  // for the new Solaris lwp.
1001  if ( osthr->thread_id() != -1 ) {
1002    if ( UseThreadPriorities ) {
1003      thr_getprio(osthr->thread_id(), &prio);
1004      if (ThreadPriorityVerbose) {
1005        tty->print_cr("Starting Thread " INTPTR_FORMAT ", LWP is " INTPTR_FORMAT ", setting priority: %d\n",
1006                      osthr->thread_id(), osthr->lwp_id(), prio );
1007      }
1008      os::set_native_priority(thread, prio);
1009    }
1010  } else if (ThreadPriorityVerbose) {
1011    warning("Can't set priority in _start routine, thread id hasn't been set\n");
1012  }
1013
1014  assert(osthr->get_state() == RUNNABLE, "invalid os thread state");
1015
1016  // initialize signal mask for this thread
1017  os::Solaris::hotspot_sigmask(thread);
1018
1019  thread->run();
1020
1021  // One less thread is executing
1022  // When the VMThread gets here, the main thread may have already exited
1023  // which frees the CodeHeap containing the Atomic::dec code
1024  if (thread != VMThread::vm_thread() && VMThread::vm_thread() != NULL) {
1025    Atomic::dec(&os::Solaris::_os_thread_count);
1026  }
1027
1028  if (UseDetachedThreads) {
1029    thr_exit(NULL);
1030    ShouldNotReachHere();
1031  }
1032  return NULL;
1033}
1034
1035static OSThread* create_os_thread(Thread* thread, thread_t thread_id) {
1036  // Allocate the OSThread object
1037  OSThread* osthread = new OSThread(NULL, NULL);
1038  if (osthread == NULL) return NULL;
1039
1040  // Store info on the Solaris thread into the OSThread
1041  osthread->set_thread_id(thread_id);
1042  osthread->set_lwp_id(_lwp_self());
1043  thread->_schedctl = (void *) schedctl_init () ;
1044
1045  if (UseNUMA) {
1046    int lgrp_id = os::numa_get_group_id();
1047    if (lgrp_id != -1) {
1048      thread->set_lgrp_id(lgrp_id);
1049    }
1050  }
1051
1052  if ( ThreadPriorityVerbose ) {
1053    tty->print_cr("In create_os_thread, Thread " INTPTR_FORMAT ", LWP is " INTPTR_FORMAT "\n",
1054                  osthread->thread_id(), osthread->lwp_id() );
1055  }
1056
1057  // Initial thread state is INITIALIZED, not SUSPENDED
1058  osthread->set_state(INITIALIZED);
1059
1060  return osthread;
1061}
1062
1063void os::Solaris::hotspot_sigmask(Thread* thread) {
1064
1065  //Save caller's signal mask
1066  sigset_t sigmask;
1067  thr_sigsetmask(SIG_SETMASK, NULL, &sigmask);
1068  OSThread *osthread = thread->osthread();
1069  osthread->set_caller_sigmask(sigmask);
1070
1071  thr_sigsetmask(SIG_UNBLOCK, os::Solaris::unblocked_signals(), NULL);
1072  if (!ReduceSignalUsage) {
1073    if (thread->is_VM_thread()) {
1074      // Only the VM thread handles BREAK_SIGNAL ...
1075      thr_sigsetmask(SIG_UNBLOCK, vm_signals(), NULL);
1076    } else {
1077      // ... all other threads block BREAK_SIGNAL
1078      assert(!sigismember(vm_signals(), SIGINT), "SIGINT should not be blocked");
1079      thr_sigsetmask(SIG_BLOCK, vm_signals(), NULL);
1080    }
1081  }
1082}
1083
1084bool os::create_attached_thread(JavaThread* thread) {
1085#ifdef ASSERT
1086  thread->verify_not_published();
1087#endif
1088  OSThread* osthread = create_os_thread(thread, thr_self());
1089  if (osthread == NULL) {
1090     return false;
1091  }
1092
1093  // Initial thread state is RUNNABLE
1094  osthread->set_state(RUNNABLE);
1095  thread->set_osthread(osthread);
1096
1097  // initialize signal mask for this thread
1098  // and save the caller's signal mask
1099  os::Solaris::hotspot_sigmask(thread);
1100
1101  return true;
1102}
1103
1104bool os::create_main_thread(JavaThread* thread) {
1105#ifdef ASSERT
1106  thread->verify_not_published();
1107#endif
1108  if (_starting_thread == NULL) {
1109    _starting_thread = create_os_thread(thread, main_thread);
1110     if (_starting_thread == NULL) {
1111        return false;
1112     }
1113  }
1114
1115  // The primodial thread is runnable from the start
1116  _starting_thread->set_state(RUNNABLE);
1117
1118  thread->set_osthread(_starting_thread);
1119
1120  // initialize signal mask for this thread
1121  // and save the caller's signal mask
1122  os::Solaris::hotspot_sigmask(thread);
1123
1124  return true;
1125}
1126
1127// _T2_libthread is true if we believe we are running with the newer
1128// SunSoft lwp/libthread.so (2.8 patch, 2.9 default)
1129bool os::Solaris::_T2_libthread = false;
1130
1131bool os::create_thread(Thread* thread, ThreadType thr_type, size_t stack_size) {
1132  // Allocate the OSThread object
1133  OSThread* osthread = new OSThread(NULL, NULL);
1134  if (osthread == NULL) {
1135    return false;
1136  }
1137
1138  if ( ThreadPriorityVerbose ) {
1139    char *thrtyp;
1140    switch ( thr_type ) {
1141      case vm_thread:
1142        thrtyp = (char *)"vm";
1143        break;
1144      case cgc_thread:
1145        thrtyp = (char *)"cgc";
1146        break;
1147      case pgc_thread:
1148        thrtyp = (char *)"pgc";
1149        break;
1150      case java_thread:
1151        thrtyp = (char *)"java";
1152        break;
1153      case compiler_thread:
1154        thrtyp = (char *)"compiler";
1155        break;
1156      case watcher_thread:
1157        thrtyp = (char *)"watcher";
1158        break;
1159      default:
1160        thrtyp = (char *)"unknown";
1161        break;
1162    }
1163    tty->print_cr("In create_thread, creating a %s thread\n", thrtyp);
1164  }
1165
1166  // Calculate stack size if it's not specified by caller.
1167  if (stack_size == 0) {
1168    // The default stack size 1M (2M for LP64).
1169    stack_size = (BytesPerWord >> 2) * K * K;
1170
1171    switch (thr_type) {
1172    case os::java_thread:
1173      // Java threads use ThreadStackSize which default value can be changed with the flag -Xss
1174      if (JavaThread::stack_size_at_create() > 0) stack_size = JavaThread::stack_size_at_create();
1175      break;
1176    case os::compiler_thread:
1177      if (CompilerThreadStackSize > 0) {
1178        stack_size = (size_t)(CompilerThreadStackSize * K);
1179        break;
1180      } // else fall through:
1181        // use VMThreadStackSize if CompilerThreadStackSize is not defined
1182    case os::vm_thread:
1183    case os::pgc_thread:
1184    case os::cgc_thread:
1185    case os::watcher_thread:
1186      if (VMThreadStackSize > 0) stack_size = (size_t)(VMThreadStackSize * K);
1187      break;
1188    }
1189  }
1190  stack_size = MAX2(stack_size, os::Solaris::min_stack_allowed);
1191
1192  // Initial state is ALLOCATED but not INITIALIZED
1193  osthread->set_state(ALLOCATED);
1194
1195  if (os::Solaris::_os_thread_count > os::Solaris::_os_thread_limit) {
1196    // We got lots of threads. Check if we still have some address space left.
1197    // Need to be at least 5Mb of unreserved address space. We do check by
1198    // trying to reserve some.
1199    const size_t VirtualMemoryBangSize = 20*K*K;
1200    char* mem = os::reserve_memory(VirtualMemoryBangSize);
1201    if (mem == NULL) {
1202      delete osthread;
1203      return false;
1204    } else {
1205      // Release the memory again
1206      os::release_memory(mem, VirtualMemoryBangSize);
1207    }
1208  }
1209
1210  // Setup osthread because the child thread may need it.
1211  thread->set_osthread(osthread);
1212
1213  // Create the Solaris thread
1214  // explicit THR_BOUND for T2_libthread case in case
1215  // that assumption is not accurate, but our alternate signal stack
1216  // handling is based on it which must have bound threads
1217  thread_t tid = 0;
1218  long     flags = (UseDetachedThreads ? THR_DETACHED : 0) | THR_SUSPENDED
1219                   | ((UseBoundThreads || os::Solaris::T2_libthread() ||
1220                       (thr_type == vm_thread) ||
1221                       (thr_type == cgc_thread) ||
1222                       (thr_type == pgc_thread) ||
1223                       (thr_type == compiler_thread && BackgroundCompilation)) ?
1224                      THR_BOUND : 0);
1225  int      status;
1226
1227  // 4376845 -- libthread/kernel don't provide enough LWPs to utilize all CPUs.
1228  //
1229  // On multiprocessors systems, libthread sometimes under-provisions our
1230  // process with LWPs.  On a 30-way systems, for instance, we could have
1231  // 50 user-level threads in ready state and only 2 or 3 LWPs assigned
1232  // to our process.  This can result in under utilization of PEs.
1233  // I suspect the problem is related to libthread's LWP
1234  // pool management and to the kernel's SIGBLOCKING "last LWP parked"
1235  // upcall policy.
1236  //
1237  // The following code is palliative -- it attempts to ensure that our
1238  // process has sufficient LWPs to take advantage of multiple PEs.
1239  // Proper long-term cures include using user-level threads bound to LWPs
1240  // (THR_BOUND) or using LWP-based synchronization.  Note that there is a
1241  // slight timing window with respect to sampling _os_thread_count, but
1242  // the race is benign.  Also, we should periodically recompute
1243  // _processors_online as the min of SC_NPROCESSORS_ONLN and the
1244  // the number of PEs in our partition.  You might be tempted to use
1245  // THR_NEW_LWP here, but I'd recommend against it as that could
1246  // result in undesirable growth of the libthread's LWP pool.
1247  // The fix below isn't sufficient; for instance, it doesn't take into count
1248  // LWPs parked on IO.  It does, however, help certain CPU-bound benchmarks.
1249  //
1250  // Some pathologies this scheme doesn't handle:
1251  // *  Threads can block, releasing the LWPs.  The LWPs can age out.
1252  //    When a large number of threads become ready again there aren't
1253  //    enough LWPs available to service them.  This can occur when the
1254  //    number of ready threads oscillates.
1255  // *  LWPs/Threads park on IO, thus taking the LWP out of circulation.
1256  //
1257  // Finally, we should call thr_setconcurrency() periodically to refresh
1258  // the LWP pool and thwart the LWP age-out mechanism.
1259  // The "+3" term provides a little slop -- we want to slightly overprovision.
1260
1261  if (AdjustConcurrency && os::Solaris::_os_thread_count < (_processors_online+3)) {
1262    if (!(flags & THR_BOUND)) {
1263      thr_setconcurrency (os::Solaris::_os_thread_count);       // avoid starvation
1264    }
1265  }
1266  // Although this doesn't hurt, we should warn of undefined behavior
1267  // when using unbound T1 threads with schedctl().  This should never
1268  // happen, as the compiler and VM threads are always created bound
1269  DEBUG_ONLY(
1270      if ((VMThreadHintNoPreempt || CompilerThreadHintNoPreempt) &&
1271          (!os::Solaris::T2_libthread() && (!(flags & THR_BOUND))) &&
1272          ((thr_type == vm_thread) || (thr_type == cgc_thread) ||
1273           (thr_type == pgc_thread) || (thr_type == compiler_thread && BackgroundCompilation))) {
1274         warning("schedctl behavior undefined when Compiler/VM/GC Threads are Unbound");
1275      }
1276  );
1277
1278
1279  // Mark that we don't have an lwp or thread id yet.
1280  // In case we attempt to set the priority before the thread starts.
1281  osthread->set_lwp_id(-1);
1282  osthread->set_thread_id(-1);
1283
1284  status = thr_create(NULL, stack_size, java_start, thread, flags, &tid);
1285  if (status != 0) {
1286    if (PrintMiscellaneous && (Verbose || WizardMode)) {
1287      perror("os::create_thread");
1288    }
1289    thread->set_osthread(NULL);
1290    // Need to clean up stuff we've allocated so far
1291    delete osthread;
1292    return false;
1293  }
1294
1295  Atomic::inc(&os::Solaris::_os_thread_count);
1296
1297  // Store info on the Solaris thread into the OSThread
1298  osthread->set_thread_id(tid);
1299
1300  // Remember that we created this thread so we can set priority on it
1301  osthread->set_vm_created();
1302
1303  // Set the default thread priority otherwise use NormalPriority
1304
1305  if ( UseThreadPriorities ) {
1306     thr_setprio(tid, (DefaultThreadPriority == -1) ?
1307                        java_to_os_priority[NormPriority] :
1308                        DefaultThreadPriority);
1309  }
1310
1311  // Initial thread state is INITIALIZED, not SUSPENDED
1312  osthread->set_state(INITIALIZED);
1313
1314  // The thread is returned suspended (in state INITIALIZED), and is started higher up in the call chain
1315  return true;
1316}
1317
1318/* defined for >= Solaris 10. This allows builds on earlier versions
1319 *  of Solaris to take advantage of the newly reserved Solaris JVM signals
1320 *  With SIGJVM1, SIGJVM2, INTERRUPT_SIGNAL is SIGJVM1, ASYNC_SIGNAL is SIGJVM2
1321 *  and -XX:+UseAltSigs does nothing since these should have no conflict
1322 */
1323#if !defined(SIGJVM1)
1324#define SIGJVM1 39
1325#define SIGJVM2 40
1326#endif
1327
1328debug_only(static bool signal_sets_initialized = false);
1329static sigset_t unblocked_sigs, vm_sigs, allowdebug_blocked_sigs;
1330int os::Solaris::_SIGinterrupt = INTERRUPT_SIGNAL;
1331int os::Solaris::_SIGasync = ASYNC_SIGNAL;
1332
1333bool os::Solaris::is_sig_ignored(int sig) {
1334      struct sigaction oact;
1335      sigaction(sig, (struct sigaction*)NULL, &oact);
1336      void* ohlr = oact.sa_sigaction ? CAST_FROM_FN_PTR(void*,  oact.sa_sigaction)
1337                                     : CAST_FROM_FN_PTR(void*,  oact.sa_handler);
1338      if (ohlr == CAST_FROM_FN_PTR(void*, SIG_IGN))
1339           return true;
1340      else
1341           return false;
1342}
1343
1344// Note: SIGRTMIN is a macro that calls sysconf() so it will
1345// dynamically detect SIGRTMIN value for the system at runtime, not buildtime
1346static bool isJVM1available() {
1347  return SIGJVM1 < SIGRTMIN;
1348}
1349
1350void os::Solaris::signal_sets_init() {
1351  // Should also have an assertion stating we are still single-threaded.
1352  assert(!signal_sets_initialized, "Already initialized");
1353  // Fill in signals that are necessarily unblocked for all threads in
1354  // the VM. Currently, we unblock the following signals:
1355  // SHUTDOWN{1,2,3}_SIGNAL: for shutdown hooks support (unless over-ridden
1356  //                         by -Xrs (=ReduceSignalUsage));
1357  // BREAK_SIGNAL which is unblocked only by the VM thread and blocked by all
1358  // other threads. The "ReduceSignalUsage" boolean tells us not to alter
1359  // the dispositions or masks wrt these signals.
1360  // Programs embedding the VM that want to use the above signals for their
1361  // own purposes must, at this time, use the "-Xrs" option to prevent
1362  // interference with shutdown hooks and BREAK_SIGNAL thread dumping.
1363  // (See bug 4345157, and other related bugs).
1364  // In reality, though, unblocking these signals is really a nop, since
1365  // these signals are not blocked by default.
1366  sigemptyset(&unblocked_sigs);
1367  sigemptyset(&allowdebug_blocked_sigs);
1368  sigaddset(&unblocked_sigs, SIGILL);
1369  sigaddset(&unblocked_sigs, SIGSEGV);
1370  sigaddset(&unblocked_sigs, SIGBUS);
1371  sigaddset(&unblocked_sigs, SIGFPE);
1372
1373  if (isJVM1available) {
1374    os::Solaris::set_SIGinterrupt(SIGJVM1);
1375    os::Solaris::set_SIGasync(SIGJVM2);
1376  } else if (UseAltSigs) {
1377    os::Solaris::set_SIGinterrupt(ALT_INTERRUPT_SIGNAL);
1378    os::Solaris::set_SIGasync(ALT_ASYNC_SIGNAL);
1379  } else {
1380    os::Solaris::set_SIGinterrupt(INTERRUPT_SIGNAL);
1381    os::Solaris::set_SIGasync(ASYNC_SIGNAL);
1382  }
1383
1384  sigaddset(&unblocked_sigs, os::Solaris::SIGinterrupt());
1385  sigaddset(&unblocked_sigs, os::Solaris::SIGasync());
1386
1387  if (!ReduceSignalUsage) {
1388   if (!os::Solaris::is_sig_ignored(SHUTDOWN1_SIGNAL)) {
1389      sigaddset(&unblocked_sigs, SHUTDOWN1_SIGNAL);
1390      sigaddset(&allowdebug_blocked_sigs, SHUTDOWN1_SIGNAL);
1391   }
1392   if (!os::Solaris::is_sig_ignored(SHUTDOWN2_SIGNAL)) {
1393      sigaddset(&unblocked_sigs, SHUTDOWN2_SIGNAL);
1394      sigaddset(&allowdebug_blocked_sigs, SHUTDOWN2_SIGNAL);
1395   }
1396   if (!os::Solaris::is_sig_ignored(SHUTDOWN3_SIGNAL)) {
1397      sigaddset(&unblocked_sigs, SHUTDOWN3_SIGNAL);
1398      sigaddset(&allowdebug_blocked_sigs, SHUTDOWN3_SIGNAL);
1399   }
1400  }
1401  // Fill in signals that are blocked by all but the VM thread.
1402  sigemptyset(&vm_sigs);
1403  if (!ReduceSignalUsage)
1404    sigaddset(&vm_sigs, BREAK_SIGNAL);
1405  debug_only(signal_sets_initialized = true);
1406
1407  // For diagnostics only used in run_periodic_checks
1408  sigemptyset(&check_signal_done);
1409}
1410
1411// These are signals that are unblocked while a thread is running Java.
1412// (For some reason, they get blocked by default.)
1413sigset_t* os::Solaris::unblocked_signals() {
1414  assert(signal_sets_initialized, "Not initialized");
1415  return &unblocked_sigs;
1416}
1417
1418// These are the signals that are blocked while a (non-VM) thread is
1419// running Java. Only the VM thread handles these signals.
1420sigset_t* os::Solaris::vm_signals() {
1421  assert(signal_sets_initialized, "Not initialized");
1422  return &vm_sigs;
1423}
1424
1425// These are signals that are blocked during cond_wait to allow debugger in
1426sigset_t* os::Solaris::allowdebug_blocked_signals() {
1427  assert(signal_sets_initialized, "Not initialized");
1428  return &allowdebug_blocked_sigs;
1429}
1430
1431// First crack at OS-specific initialization, from inside the new thread.
1432void os::initialize_thread() {
1433  int r = thr_main() ;
1434  guarantee (r == 0 || r == 1, "CR6501650 or CR6493689") ;
1435  if (r) {
1436    JavaThread* jt = (JavaThread *)Thread::current();
1437    assert(jt != NULL,"Sanity check");
1438    size_t stack_size;
1439    address base = jt->stack_base();
1440    if (Arguments::created_by_java_launcher()) {
1441      // Use 2MB to allow for Solaris 7 64 bit mode.
1442      stack_size = JavaThread::stack_size_at_create() == 0
1443        ? 2048*K : JavaThread::stack_size_at_create();
1444
1445      // There are rare cases when we may have already used more than
1446      // the basic stack size allotment before this method is invoked.
1447      // Attempt to allow for a normally sized java_stack.
1448      size_t current_stack_offset = (size_t)(base - (address)&stack_size);
1449      stack_size += ReservedSpace::page_align_size_down(current_stack_offset);
1450    } else {
1451      // 6269555: If we were not created by a Java launcher, i.e. if we are
1452      // running embedded in a native application, treat the primordial thread
1453      // as much like a native attached thread as possible.  This means using
1454      // the current stack size from thr_stksegment(), unless it is too large
1455      // to reliably setup guard pages.  A reasonable max size is 8MB.
1456      size_t current_size = current_stack_size();
1457      // This should never happen, but just in case....
1458      if (current_size == 0) current_size = 2 * K * K;
1459      stack_size = current_size > (8 * K * K) ? (8 * K * K) : current_size;
1460    }
1461    address bottom = (address)align_size_up((intptr_t)(base - stack_size), os::vm_page_size());;
1462    stack_size = (size_t)(base - bottom);
1463
1464    assert(stack_size > 0, "Stack size calculation problem");
1465
1466    if (stack_size > jt->stack_size()) {
1467      NOT_PRODUCT(
1468        struct rlimit limits;
1469        getrlimit(RLIMIT_STACK, &limits);
1470        size_t size = adjust_stack_size(base, (size_t)limits.rlim_cur);
1471        assert(size >= jt->stack_size(), "Stack size problem in main thread");
1472      )
1473      tty->print_cr(
1474        "Stack size of %d Kb exceeds current limit of %d Kb.\n"
1475        "(Stack sizes are rounded up to a multiple of the system page size.)\n"
1476        "See limit(1) to increase the stack size limit.",
1477        stack_size / K, jt->stack_size() / K);
1478      vm_exit(1);
1479    }
1480    assert(jt->stack_size() >= stack_size,
1481          "Attempt to map more stack than was allocated");
1482    jt->set_stack_size(stack_size);
1483  }
1484
1485   // 5/22/01: Right now alternate signal stacks do not handle
1486   // throwing stack overflow exceptions, see bug 4463178
1487   // Until a fix is found for this, T2 will NOT imply alternate signal
1488   // stacks.
1489   // If using T2 libthread threads, install an alternate signal stack.
1490   // Because alternate stacks associate with LWPs on Solaris,
1491   // see sigaltstack(2), if using UNBOUND threads, or if UseBoundThreads
1492   // we prefer to explicitly stack bang.
1493   // If not using T2 libthread, but using UseBoundThreads any threads
1494   // (primordial thread, jni_attachCurrentThread) we do not create,
1495   // probably are not bound, therefore they can not have an alternate
1496   // signal stack. Since our stack banging code is generated and
1497   // is shared across threads, all threads must be bound to allow
1498   // using alternate signal stacks.  The alternative is to interpose
1499   // on _lwp_create to associate an alt sig stack with each LWP,
1500   // and this could be a problem when the JVM is embedded.
1501   // We would prefer to use alternate signal stacks with T2
1502   // Since there is currently no accurate way to detect T2
1503   // we do not. Assuming T2 when running T1 causes sig 11s or assertions
1504   // on installing alternate signal stacks
1505
1506
1507   // 05/09/03: removed alternate signal stack support for Solaris
1508   // The alternate signal stack mechanism is no longer needed to
1509   // handle stack overflow. This is now handled by allocating
1510   // guard pages (red zone) and stackbanging.
1511   // Initially the alternate signal stack mechanism was removed because
1512   // it did not work with T1 llibthread. Alternate
1513   // signal stacks MUST have all threads bound to lwps. Applications
1514   // can create their own threads and attach them without their being
1515   // bound under T1. This is frequently the case for the primordial thread.
1516   // If we were ever to reenable this mechanism we would need to
1517   // use the dynamic check for T2 libthread.
1518
1519  os::Solaris::init_thread_fpu_state();
1520}
1521
1522
1523
1524// Free Solaris resources related to the OSThread
1525void os::free_thread(OSThread* osthread) {
1526  assert(osthread != NULL, "os::free_thread but osthread not set");
1527
1528
1529  // We are told to free resources of the argument thread,
1530  // but we can only really operate on the current thread.
1531  // The main thread must take the VMThread down synchronously
1532  // before the main thread exits and frees up CodeHeap
1533  guarantee((Thread::current()->osthread() == osthread
1534     || (osthread == VMThread::vm_thread()->osthread())), "os::free_thread but not current thread");
1535  if (Thread::current()->osthread() == osthread) {
1536    // Restore caller's signal mask
1537    sigset_t sigmask = osthread->caller_sigmask();
1538    thr_sigsetmask(SIG_SETMASK, &sigmask, NULL);
1539  }
1540  delete osthread;
1541}
1542
1543void os::pd_start_thread(Thread* thread) {
1544  int status = thr_continue(thread->osthread()->thread_id());
1545  assert_status(status == 0, status, "thr_continue failed");
1546}
1547
1548
1549intx os::current_thread_id() {
1550  return (intx)thr_self();
1551}
1552
1553static pid_t _initial_pid = 0;
1554
1555int os::current_process_id() {
1556  return (int)(_initial_pid ? _initial_pid : getpid());
1557}
1558
1559int os::allocate_thread_local_storage() {
1560  // %%%       in Win32 this allocates a memory segment pointed to by a
1561  //           register.  Dan Stein can implement a similar feature in
1562  //           Solaris.  Alternatively, the VM can do the same thing
1563  //           explicitly: malloc some storage and keep the pointer in a
1564  //           register (which is part of the thread's context) (or keep it
1565  //           in TLS).
1566  // %%%       In current versions of Solaris, thr_self and TSD can
1567  //           be accessed via short sequences of displaced indirections.
1568  //           The value of thr_self is available as %g7(36).
1569  //           The value of thr_getspecific(k) is stored in %g7(12)(4)(k*4-4),
1570  //           assuming that the current thread already has a value bound to k.
1571  //           It may be worth experimenting with such access patterns,
1572  //           and later having the parameters formally exported from a Solaris
1573  //           interface.  I think, however, that it will be faster to
1574  //           maintain the invariant that %g2 always contains the
1575  //           JavaThread in Java code, and have stubs simply
1576  //           treat %g2 as a caller-save register, preserving it in a %lN.
1577  thread_key_t tk;
1578  if (thr_keycreate( &tk, NULL ) )
1579    fatal1("os::allocate_thread_local_storage: thr_keycreate failed (%s)", strerror(errno));
1580  return int(tk);
1581}
1582
1583void os::free_thread_local_storage(int index) {
1584  // %%% don't think we need anything here
1585  // if ( pthread_key_delete((pthread_key_t) tk) )
1586  //   fatal("os::free_thread_local_storage: pthread_key_delete failed");
1587}
1588
1589#define SMALLINT 32   // libthread allocate for tsd_common is a version specific
1590                      // small number - point is NO swap space available
1591void os::thread_local_storage_at_put(int index, void* value) {
1592  // %%% this is used only in threadLocalStorage.cpp
1593  if (thr_setspecific((thread_key_t)index, value)) {
1594    if (errno == ENOMEM) {
1595       vm_exit_out_of_memory(SMALLINT, "thr_setspecific: out of swap space");
1596    } else {
1597      fatal1("os::thread_local_storage_at_put: thr_setspecific failed (%s)", strerror(errno));
1598    }
1599  } else {
1600      ThreadLocalStorage::set_thread_in_slot ((Thread *) value) ;
1601  }
1602}
1603
1604// This function could be called before TLS is initialized, for example, when
1605// VM receives an async signal or when VM causes a fatal error during
1606// initialization. Return NULL if thr_getspecific() fails.
1607void* os::thread_local_storage_at(int index) {
1608  // %%% this is used only in threadLocalStorage.cpp
1609  void* r = NULL;
1610  return thr_getspecific((thread_key_t)index, &r) != 0 ? NULL : r;
1611}
1612
1613
1614const int NANOSECS_PER_MILLISECS = 1000000;
1615// gethrtime can move backwards if read from one cpu and then a different cpu
1616// getTimeNanos is guaranteed to not move backward on Solaris
1617// local spinloop created as faster for a CAS on an int than
1618// a CAS on a 64bit jlong. Also Atomic::cmpxchg for jlong is not
1619// supported on sparc v8 or pre supports_cx8 intel boxes.
1620// oldgetTimeNanos for systems which do not support CAS on 64bit jlong
1621// i.e. sparc v8 and pre supports_cx8 (i486) intel boxes
1622inline hrtime_t oldgetTimeNanos() {
1623  int gotlock = LOCK_INVALID;
1624  hrtime_t newtime = gethrtime();
1625
1626  for (;;) {
1627// grab lock for max_hrtime
1628    int curlock = max_hrtime_lock;
1629    if (curlock & LOCK_BUSY)  continue;
1630    if (gotlock = Atomic::cmpxchg(LOCK_BUSY, &max_hrtime_lock, LOCK_FREE) != LOCK_FREE) continue;
1631    if (newtime > max_hrtime) {
1632      max_hrtime = newtime;
1633    } else {
1634      newtime = max_hrtime;
1635    }
1636    // release lock
1637    max_hrtime_lock = LOCK_FREE;
1638    return newtime;
1639  }
1640}
1641// gethrtime can move backwards if read from one cpu and then a different cpu
1642// getTimeNanos is guaranteed to not move backward on Solaris
1643inline hrtime_t getTimeNanos() {
1644  if (VM_Version::supports_cx8()) {
1645    const hrtime_t now = gethrtime();
1646    const hrtime_t prev = max_hrtime;
1647    if (now <= prev)  return prev;   // same or retrograde time;
1648    const hrtime_t obsv = Atomic::cmpxchg(now, (volatile jlong*)&max_hrtime, prev);
1649    assert(obsv >= prev, "invariant");   // Monotonicity
1650    // If the CAS succeeded then we're done and return "now".
1651    // If the CAS failed and the observed value "obs" is >= now then
1652    // we should return "obs".  If the CAS failed and now > obs > prv then
1653    // some other thread raced this thread and installed a new value, in which case
1654    // we could either (a) retry the entire operation, (b) retry trying to install now
1655    // or (c) just return obs.  We use (c).   No loop is required although in some cases
1656    // we might discard a higher "now" value in deference to a slightly lower but freshly
1657    // installed obs value.   That's entirely benign -- it admits no new orderings compared
1658    // to (a) or (b) -- and greatly reduces coherence traffic.
1659    // We might also condition (c) on the magnitude of the delta between obs and now.
1660    // Avoiding excessive CAS operations to hot RW locations is critical.
1661    // See http://blogs.sun.com/dave/entry/cas_and_cache_trivia_invalidate
1662    return (prev == obsv) ? now : obsv ;
1663  } else {
1664    return oldgetTimeNanos();
1665  }
1666}
1667
1668// Time since start-up in seconds to a fine granularity.
1669// Used by VMSelfDestructTimer and the MemProfiler.
1670double os::elapsedTime() {
1671  return (double)(getTimeNanos() - first_hrtime) / (double)hrtime_hz;
1672}
1673
1674jlong os::elapsed_counter() {
1675  return (jlong)(getTimeNanos() - first_hrtime);
1676}
1677
1678jlong os::elapsed_frequency() {
1679   return hrtime_hz;
1680}
1681
1682// Return the real, user, and system times in seconds from an
1683// arbitrary fixed point in the past.
1684bool os::getTimesSecs(double* process_real_time,
1685                  double* process_user_time,
1686                  double* process_system_time) {
1687  struct tms ticks;
1688  clock_t real_ticks = times(&ticks);
1689
1690  if (real_ticks == (clock_t) (-1)) {
1691    return false;
1692  } else {
1693    double ticks_per_second = (double) clock_tics_per_sec;
1694    *process_user_time = ((double) ticks.tms_utime) / ticks_per_second;
1695    *process_system_time = ((double) ticks.tms_stime) / ticks_per_second;
1696    // For consistency return the real time from getTimeNanos()
1697    // converted to seconds.
1698    *process_real_time = ((double) getTimeNanos()) / ((double) NANOUNITS);
1699
1700    return true;
1701  }
1702}
1703
1704bool os::supports_vtime() { return true; }
1705
1706bool os::enable_vtime() {
1707  int fd = open("/proc/self/ctl", O_WRONLY);
1708  if (fd == -1)
1709    return false;
1710
1711  long cmd[] = { PCSET, PR_MSACCT };
1712  int res = write(fd, cmd, sizeof(long) * 2);
1713  close(fd);
1714  if (res != sizeof(long) * 2)
1715    return false;
1716
1717  return true;
1718}
1719
1720bool os::vtime_enabled() {
1721  int fd = open("/proc/self/status", O_RDONLY);
1722  if (fd == -1)
1723    return false;
1724
1725  pstatus_t status;
1726  int res = read(fd, (void*) &status, sizeof(pstatus_t));
1727  close(fd);
1728  if (res != sizeof(pstatus_t))
1729    return false;
1730
1731  return status.pr_flags & PR_MSACCT;
1732}
1733
1734double os::elapsedVTime() {
1735  return (double)gethrvtime() / (double)hrtime_hz;
1736}
1737
1738// Used internally for comparisons only
1739// getTimeMillis guaranteed to not move backwards on Solaris
1740jlong getTimeMillis() {
1741  jlong nanotime = getTimeNanos();
1742  return (jlong)(nanotime / NANOSECS_PER_MILLISECS);
1743}
1744
1745// Must return millis since Jan 1 1970 for JVM_CurrentTimeMillis
1746jlong os::javaTimeMillis() {
1747  timeval t;
1748  if (gettimeofday( &t, NULL) == -1)
1749    fatal1("os::javaTimeMillis: gettimeofday (%s)", strerror(errno));
1750  return jlong(t.tv_sec) * 1000  +  jlong(t.tv_usec) / 1000;
1751}
1752
1753jlong os::javaTimeNanos() {
1754  return (jlong)getTimeNanos();
1755}
1756
1757void os::javaTimeNanos_info(jvmtiTimerInfo *info_ptr) {
1758  info_ptr->max_value = ALL_64_BITS;      // gethrtime() uses all 64 bits
1759  info_ptr->may_skip_backward = false;    // not subject to resetting or drifting
1760  info_ptr->may_skip_forward = false;     // not subject to resetting or drifting
1761  info_ptr->kind = JVMTI_TIMER_ELAPSED;   // elapsed not CPU time
1762}
1763
1764char * os::local_time_string(char *buf, size_t buflen) {
1765  struct tm t;
1766  time_t long_time;
1767  time(&long_time);
1768  localtime_r(&long_time, &t);
1769  jio_snprintf(buf, buflen, "%d-%02d-%02d %02d:%02d:%02d",
1770               t.tm_year + 1900, t.tm_mon + 1, t.tm_mday,
1771               t.tm_hour, t.tm_min, t.tm_sec);
1772  return buf;
1773}
1774
1775// Note: os::shutdown() might be called very early during initialization, or
1776// called from signal handler. Before adding something to os::shutdown(), make
1777// sure it is async-safe and can handle partially initialized VM.
1778void os::shutdown() {
1779
1780  // allow PerfMemory to attempt cleanup of any persistent resources
1781  perfMemory_exit();
1782
1783  // needs to remove object in file system
1784  AttachListener::abort();
1785
1786  // flush buffered output, finish log files
1787  ostream_abort();
1788
1789  // Check for abort hook
1790  abort_hook_t abort_hook = Arguments::abort_hook();
1791  if (abort_hook != NULL) {
1792    abort_hook();
1793  }
1794}
1795
1796// Note: os::abort() might be called very early during initialization, or
1797// called from signal handler. Before adding something to os::abort(), make
1798// sure it is async-safe and can handle partially initialized VM.
1799void os::abort(bool dump_core) {
1800  os::shutdown();
1801  if (dump_core) {
1802#ifndef PRODUCT
1803    fdStream out(defaultStream::output_fd());
1804    out.print_raw("Current thread is ");
1805    char buf[16];
1806    jio_snprintf(buf, sizeof(buf), UINTX_FORMAT, os::current_thread_id());
1807    out.print_raw_cr(buf);
1808    out.print_raw_cr("Dumping core ...");
1809#endif
1810    ::abort(); // dump core (for debugging)
1811  }
1812
1813  ::exit(1);
1814}
1815
1816// Die immediately, no exit hook, no abort hook, no cleanup.
1817void os::die() {
1818  _exit(-1);
1819}
1820
1821// unused
1822void os::set_error_file(const char *logfile) {}
1823
1824// DLL functions
1825
1826const char* os::dll_file_extension() { return ".so"; }
1827
1828const char* os::get_temp_directory() { return "/tmp/"; }
1829
1830void os::dll_build_name(
1831    char* buffer, size_t buflen, const char* pname, const char* fname) {
1832  // copied from libhpi
1833  const size_t pnamelen = pname ? strlen(pname) : 0;
1834
1835  /* Quietly truncate on buffer overflow.  Should be an error. */
1836  if (pnamelen + strlen(fname) + 10 > (size_t) buflen) {
1837      *buffer = '\0';
1838      return;
1839  }
1840
1841  if (pnamelen == 0) {
1842      sprintf(buffer, "lib%s.so", fname);
1843  } else {
1844      sprintf(buffer, "%s/lib%s.so", pname, fname);
1845  }
1846}
1847
1848const char* os::get_current_directory(char *buf, int buflen) {
1849  return getcwd(buf, buflen);
1850}
1851
1852// check if addr is inside libjvm[_g].so
1853bool os::address_is_in_vm(address addr) {
1854  static address libjvm_base_addr;
1855  Dl_info dlinfo;
1856
1857  if (libjvm_base_addr == NULL) {
1858    dladdr(CAST_FROM_FN_PTR(void *, os::address_is_in_vm), &dlinfo);
1859    libjvm_base_addr = (address)dlinfo.dli_fbase;
1860    assert(libjvm_base_addr !=NULL, "Cannot obtain base address for libjvm");
1861  }
1862
1863  if (dladdr((void *)addr, &dlinfo)) {
1864    if (libjvm_base_addr == (address)dlinfo.dli_fbase) return true;
1865  }
1866
1867  return false;
1868}
1869
1870typedef int (*dladdr1_func_type) (void *, Dl_info *, void **, int);
1871static dladdr1_func_type dladdr1_func = NULL;
1872
1873bool os::dll_address_to_function_name(address addr, char *buf,
1874                                      int buflen, int * offset) {
1875  Dl_info dlinfo;
1876
1877  // dladdr1_func was initialized in os::init()
1878  if (dladdr1_func){
1879      // yes, we have dladdr1
1880
1881      // Support for dladdr1 is checked at runtime; it may be
1882      // available even if the vm is built on a machine that does
1883      // not have dladdr1 support.  Make sure there is a value for
1884      // RTLD_DL_SYMENT.
1885      #ifndef RTLD_DL_SYMENT
1886      #define RTLD_DL_SYMENT 1
1887      #endif
1888      Sym * info;
1889      if (dladdr1_func((void *)addr, &dlinfo, (void **)&info,
1890                       RTLD_DL_SYMENT)) {
1891          if (buf) jio_snprintf(buf, buflen, "%s", dlinfo.dli_sname);
1892          if (offset) *offset = addr - (address)dlinfo.dli_saddr;
1893
1894          // check if the returned symbol really covers addr
1895          return ((char *)dlinfo.dli_saddr + info->st_size > (char *)addr);
1896      } else {
1897          if (buf) buf[0] = '\0';
1898          if (offset) *offset  = -1;
1899          return false;
1900      }
1901  } else {
1902      // no, only dladdr is available
1903      if(dladdr((void *)addr, &dlinfo)) {
1904          if (buf) jio_snprintf(buf, buflen, dlinfo.dli_sname);
1905          if (offset) *offset = addr - (address)dlinfo.dli_saddr;
1906          return true;
1907      } else {
1908          if (buf) buf[0] = '\0';
1909          if (offset) *offset  = -1;
1910          return false;
1911      }
1912  }
1913}
1914
1915bool os::dll_address_to_library_name(address addr, char* buf,
1916                                     int buflen, int* offset) {
1917  Dl_info dlinfo;
1918
1919  if (dladdr((void*)addr, &dlinfo)){
1920     if (buf) jio_snprintf(buf, buflen, "%s", dlinfo.dli_fname);
1921     if (offset) *offset = addr - (address)dlinfo.dli_fbase;
1922     return true;
1923  } else {
1924     if (buf) buf[0] = '\0';
1925     if (offset) *offset = -1;
1926     return false;
1927  }
1928}
1929
1930// Prints the names and full paths of all opened dynamic libraries
1931// for current process
1932void os::print_dll_info(outputStream * st) {
1933    Dl_info dli;
1934    void *handle;
1935    Link_map *map;
1936    Link_map *p;
1937
1938    st->print_cr("Dynamic libraries:"); st->flush();
1939
1940    if (!dladdr(CAST_FROM_FN_PTR(void *, os::print_dll_info), &dli)) {
1941        st->print_cr("Error: Cannot print dynamic libraries.");
1942        return;
1943    }
1944    handle = dlopen(dli.dli_fname, RTLD_LAZY);
1945    if (handle == NULL) {
1946        st->print_cr("Error: Cannot print dynamic libraries.");
1947        return;
1948    }
1949    dlinfo(handle, RTLD_DI_LINKMAP, &map);
1950    if (map == NULL) {
1951        st->print_cr("Error: Cannot print dynamic libraries.");
1952        return;
1953    }
1954
1955    while (map->l_prev != NULL)
1956        map = map->l_prev;
1957
1958    while (map != NULL) {
1959        st->print_cr(PTR_FORMAT " \t%s", map->l_addr, map->l_name);
1960        map = map->l_next;
1961    }
1962
1963    dlclose(handle);
1964}
1965
1966  // Loads .dll/.so and
1967  // in case of error it checks if .dll/.so was built for the
1968  // same architecture as Hotspot is running on
1969
1970void * os::dll_load(const char *filename, char *ebuf, int ebuflen)
1971{
1972  void * result= ::dlopen(filename, RTLD_LAZY);
1973  if (result != NULL) {
1974    // Successful loading
1975    return result;
1976  }
1977
1978  Elf32_Ehdr elf_head;
1979
1980  // Read system error message into ebuf
1981  // It may or may not be overwritten below
1982  ::strncpy(ebuf, ::dlerror(), ebuflen-1);
1983  ebuf[ebuflen-1]='\0';
1984  int diag_msg_max_length=ebuflen-strlen(ebuf);
1985  char* diag_msg_buf=ebuf+strlen(ebuf);
1986
1987  if (diag_msg_max_length==0) {
1988    // No more space in ebuf for additional diagnostics message
1989    return NULL;
1990  }
1991
1992
1993  int file_descriptor= ::open(filename, O_RDONLY | O_NONBLOCK);
1994
1995  if (file_descriptor < 0) {
1996    // Can't open library, report dlerror() message
1997    return NULL;
1998  }
1999
2000  bool failed_to_read_elf_head=
2001    (sizeof(elf_head)!=
2002        (::read(file_descriptor, &elf_head,sizeof(elf_head)))) ;
2003
2004  ::close(file_descriptor);
2005  if (failed_to_read_elf_head) {
2006    // file i/o error - report dlerror() msg
2007    return NULL;
2008  }
2009
2010  typedef struct {
2011    Elf32_Half  code;         // Actual value as defined in elf.h
2012    Elf32_Half  compat_class; // Compatibility of archs at VM's sense
2013    char        elf_class;    // 32 or 64 bit
2014    char        endianess;    // MSB or LSB
2015    char*       name;         // String representation
2016  } arch_t;
2017
2018  static const arch_t arch_array[]={
2019    {EM_386,         EM_386,     ELFCLASS32, ELFDATA2LSB, (char*)"IA 32"},
2020    {EM_486,         EM_386,     ELFCLASS32, ELFDATA2LSB, (char*)"IA 32"},
2021    {EM_IA_64,       EM_IA_64,   ELFCLASS64, ELFDATA2LSB, (char*)"IA 64"},
2022    {EM_X86_64,      EM_X86_64,  ELFCLASS64, ELFDATA2LSB, (char*)"AMD 64"},
2023    {EM_SPARC,       EM_SPARC,   ELFCLASS32, ELFDATA2MSB, (char*)"Sparc 32"},
2024    {EM_SPARC32PLUS, EM_SPARC,   ELFCLASS32, ELFDATA2MSB, (char*)"Sparc 32"},
2025    {EM_SPARCV9,     EM_SPARCV9, ELFCLASS64, ELFDATA2MSB, (char*)"Sparc v9 64"},
2026    {EM_PPC,         EM_PPC,     ELFCLASS32, ELFDATA2MSB, (char*)"Power PC 32"},
2027    {EM_PPC64,       EM_PPC64,   ELFCLASS64, ELFDATA2MSB, (char*)"Power PC 64"}
2028  };
2029
2030  #if  (defined IA32)
2031    static  Elf32_Half running_arch_code=EM_386;
2032  #elif   (defined AMD64)
2033    static  Elf32_Half running_arch_code=EM_X86_64;
2034  #elif  (defined IA64)
2035    static  Elf32_Half running_arch_code=EM_IA_64;
2036  #elif  (defined __sparc) && (defined _LP64)
2037    static  Elf32_Half running_arch_code=EM_SPARCV9;
2038  #elif  (defined __sparc) && (!defined _LP64)
2039    static  Elf32_Half running_arch_code=EM_SPARC;
2040  #elif  (defined __powerpc64__)
2041    static  Elf32_Half running_arch_code=EM_PPC64;
2042  #elif  (defined __powerpc__)
2043    static  Elf32_Half running_arch_code=EM_PPC;
2044  #else
2045    #error Method os::dll_load requires that one of following is defined:\
2046         IA32, AMD64, IA64, __sparc, __powerpc__
2047  #endif
2048
2049  // Identify compatability class for VM's architecture and library's architecture
2050  // Obtain string descriptions for architectures
2051
2052  arch_t lib_arch={elf_head.e_machine,0,elf_head.e_ident[EI_CLASS], elf_head.e_ident[EI_DATA], NULL};
2053  int running_arch_index=-1;
2054
2055  for (unsigned int i=0 ; i < ARRAY_SIZE(arch_array) ; i++ ) {
2056    if (running_arch_code == arch_array[i].code) {
2057      running_arch_index    = i;
2058    }
2059    if (lib_arch.code == arch_array[i].code) {
2060      lib_arch.compat_class = arch_array[i].compat_class;
2061      lib_arch.name         = arch_array[i].name;
2062    }
2063  }
2064
2065  assert(running_arch_index != -1,
2066    "Didn't find running architecture code (running_arch_code) in arch_array");
2067  if (running_arch_index == -1) {
2068    // Even though running architecture detection failed
2069    // we may still continue with reporting dlerror() message
2070    return NULL;
2071  }
2072
2073  if (lib_arch.endianess != arch_array[running_arch_index].endianess) {
2074    ::snprintf(diag_msg_buf, diag_msg_max_length-1," (Possible cause: endianness mismatch)");
2075    return NULL;
2076  }
2077
2078  if (lib_arch.elf_class != arch_array[running_arch_index].elf_class) {
2079    ::snprintf(diag_msg_buf, diag_msg_max_length-1," (Possible cause: architecture word width mismatch)");
2080    return NULL;
2081  }
2082
2083  if (lib_arch.compat_class != arch_array[running_arch_index].compat_class) {
2084    if ( lib_arch.name!=NULL ) {
2085      ::snprintf(diag_msg_buf, diag_msg_max_length-1,
2086        " (Possible cause: can't load %s-bit .so on a %s-bit platform)",
2087        lib_arch.name, arch_array[running_arch_index].name);
2088    } else {
2089      ::snprintf(diag_msg_buf, diag_msg_max_length-1,
2090      " (Possible cause: can't load this .so (machine code=0x%x) on a %s-bit platform)",
2091        lib_arch.code,
2092        arch_array[running_arch_index].name);
2093    }
2094  }
2095
2096  return NULL;
2097}
2098
2099void* os::dll_lookup(void* handle, const char* name) {
2100  return dlsym(handle, name);
2101}
2102
2103
2104bool _print_ascii_file(const char* filename, outputStream* st) {
2105  int fd = open(filename, O_RDONLY);
2106  if (fd == -1) {
2107     return false;
2108  }
2109
2110  char buf[32];
2111  int bytes;
2112  while ((bytes = read(fd, buf, sizeof(buf))) > 0) {
2113    st->print_raw(buf, bytes);
2114  }
2115
2116  close(fd);
2117
2118  return true;
2119}
2120
2121void os::print_os_info(outputStream* st) {
2122  st->print("OS:");
2123
2124  if (!_print_ascii_file("/etc/release", st)) {
2125    st->print("Solaris");
2126  }
2127  st->cr();
2128
2129  // kernel
2130  st->print("uname:");
2131  struct utsname name;
2132  uname(&name);
2133  st->print(name.sysname); st->print(" ");
2134  st->print(name.release); st->print(" ");
2135  st->print(name.version); st->print(" ");
2136  st->print(name.machine);
2137
2138  // libthread
2139  if (os::Solaris::T2_libthread()) st->print("  (T2 libthread)");
2140  else st->print("  (T1 libthread)");
2141  st->cr();
2142
2143  // rlimit
2144  st->print("rlimit:");
2145  struct rlimit rlim;
2146
2147  st->print(" STACK ");
2148  getrlimit(RLIMIT_STACK, &rlim);
2149  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2150  else st->print("%uk", rlim.rlim_cur >> 10);
2151
2152  st->print(", CORE ");
2153  getrlimit(RLIMIT_CORE, &rlim);
2154  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2155  else st->print("%uk", rlim.rlim_cur >> 10);
2156
2157  st->print(", NOFILE ");
2158  getrlimit(RLIMIT_NOFILE, &rlim);
2159  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2160  else st->print("%d", rlim.rlim_cur);
2161
2162  st->print(", AS ");
2163  getrlimit(RLIMIT_AS, &rlim);
2164  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2165  else st->print("%uk", rlim.rlim_cur >> 10);
2166  st->cr();
2167
2168  // load average
2169  st->print("load average:");
2170  double loadavg[3];
2171  os::loadavg(loadavg, 3);
2172  st->print("%0.02f %0.02f %0.02f", loadavg[0], loadavg[1], loadavg[2]);
2173  st->cr();
2174}
2175
2176
2177static bool check_addr0(outputStream* st) {
2178  jboolean status = false;
2179  int fd = open("/proc/self/map",O_RDONLY);
2180  if (fd >= 0) {
2181    prmap_t p;
2182    while(read(fd, &p, sizeof(p)) > 0) {
2183      if (p.pr_vaddr == 0x0) {
2184        st->print("Warning: Address: 0x%x, Size: %dK, ",p.pr_vaddr, p.pr_size/1024, p.pr_mapname);
2185        st->print("Mapped file: %s, ", p.pr_mapname[0] == '\0' ? "None" : p.pr_mapname);
2186        st->print("Access:");
2187        st->print("%s",(p.pr_mflags & MA_READ)  ? "r" : "-");
2188        st->print("%s",(p.pr_mflags & MA_WRITE) ? "w" : "-");
2189        st->print("%s",(p.pr_mflags & MA_EXEC)  ? "x" : "-");
2190        st->cr();
2191        status = true;
2192      }
2193      close(fd);
2194    }
2195  }
2196  return status;
2197}
2198
2199void os::print_memory_info(outputStream* st) {
2200  st->print("Memory:");
2201  st->print(" %dk page", os::vm_page_size()>>10);
2202  st->print(", physical " UINT64_FORMAT "k", os::physical_memory()>>10);
2203  st->print("(" UINT64_FORMAT "k free)", os::available_memory() >> 10);
2204  st->cr();
2205  (void) check_addr0(st);
2206}
2207
2208// Taken from /usr/include/sys/machsig.h  Supposed to be architecture specific
2209// but they're the same for all the solaris architectures that we support.
2210const char *ill_names[] = { "ILL0", "ILL_ILLOPC", "ILL_ILLOPN", "ILL_ILLADR",
2211                          "ILL_ILLTRP", "ILL_PRVOPC", "ILL_PRVREG",
2212                          "ILL_COPROC", "ILL_BADSTK" };
2213
2214const char *fpe_names[] = { "FPE0", "FPE_INTDIV", "FPE_INTOVF", "FPE_FLTDIV",
2215                          "FPE_FLTOVF", "FPE_FLTUND", "FPE_FLTRES",
2216                          "FPE_FLTINV", "FPE_FLTSUB" };
2217
2218const char *segv_names[] = { "SEGV0", "SEGV_MAPERR", "SEGV_ACCERR" };
2219
2220const char *bus_names[] = { "BUS0", "BUS_ADRALN", "BUS_ADRERR", "BUS_OBJERR" };
2221
2222void os::print_siginfo(outputStream* st, void* siginfo) {
2223  st->print("siginfo:");
2224
2225  const int buflen = 100;
2226  char buf[buflen];
2227  siginfo_t *si = (siginfo_t*)siginfo;
2228  st->print("si_signo=%s: ", os::exception_name(si->si_signo, buf, buflen));
2229  char *err = strerror(si->si_errno);
2230  if (si->si_errno != 0 && err != NULL) {
2231    st->print("si_errno=%s", err);
2232  } else {
2233    st->print("si_errno=%d", si->si_errno);
2234  }
2235  const int c = si->si_code;
2236  assert(c > 0, "unexpected si_code");
2237  switch (si->si_signo) {
2238  case SIGILL:
2239    st->print(", si_code=%d (%s)", c, c > 8 ? "" : ill_names[c]);
2240    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2241    break;
2242  case SIGFPE:
2243    st->print(", si_code=%d (%s)", c, c > 9 ? "" : fpe_names[c]);
2244    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2245    break;
2246  case SIGSEGV:
2247    st->print(", si_code=%d (%s)", c, c > 2 ? "" : segv_names[c]);
2248    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2249    break;
2250  case SIGBUS:
2251    st->print(", si_code=%d (%s)", c, c > 3 ? "" : bus_names[c]);
2252    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2253    break;
2254  default:
2255    st->print(", si_code=%d", si->si_code);
2256    // no si_addr
2257  }
2258
2259  if ((si->si_signo == SIGBUS || si->si_signo == SIGSEGV) &&
2260      UseSharedSpaces) {
2261    FileMapInfo* mapinfo = FileMapInfo::current_info();
2262    if (mapinfo->is_in_shared_space(si->si_addr)) {
2263      st->print("\n\nError accessing class data sharing archive."   \
2264                " Mapped file inaccessible during execution, "      \
2265                " possible disk/network problem.");
2266    }
2267  }
2268  st->cr();
2269}
2270
2271// Moved from whole group, because we need them here for diagnostic
2272// prints.
2273#define OLDMAXSIGNUM 32
2274static int Maxsignum = 0;
2275static int *ourSigFlags = NULL;
2276
2277extern "C" void sigINTRHandler(int, siginfo_t*, void*);
2278
2279int os::Solaris::get_our_sigflags(int sig) {
2280  assert(ourSigFlags!=NULL, "signal data structure not initialized");
2281  assert(sig > 0 && sig < Maxsignum, "vm signal out of expected range");
2282  return ourSigFlags[sig];
2283}
2284
2285void os::Solaris::set_our_sigflags(int sig, int flags) {
2286  assert(ourSigFlags!=NULL, "signal data structure not initialized");
2287  assert(sig > 0 && sig < Maxsignum, "vm signal out of expected range");
2288  ourSigFlags[sig] = flags;
2289}
2290
2291
2292static const char* get_signal_handler_name(address handler,
2293                                           char* buf, int buflen) {
2294  int offset;
2295  bool found = os::dll_address_to_library_name(handler, buf, buflen, &offset);
2296  if (found) {
2297    // skip directory names
2298    const char *p1, *p2;
2299    p1 = buf;
2300    size_t len = strlen(os::file_separator());
2301    while ((p2 = strstr(p1, os::file_separator())) != NULL) p1 = p2 + len;
2302    jio_snprintf(buf, buflen, "%s+0x%x", p1, offset);
2303  } else {
2304    jio_snprintf(buf, buflen, PTR_FORMAT, handler);
2305  }
2306  return buf;
2307}
2308
2309static void print_signal_handler(outputStream* st, int sig,
2310                                  char* buf, size_t buflen) {
2311  struct sigaction sa;
2312
2313  sigaction(sig, NULL, &sa);
2314
2315  st->print("%s: ", os::exception_name(sig, buf, buflen));
2316
2317  address handler = (sa.sa_flags & SA_SIGINFO)
2318                  ? CAST_FROM_FN_PTR(address, sa.sa_sigaction)
2319                  : CAST_FROM_FN_PTR(address, sa.sa_handler);
2320
2321  if (handler == CAST_FROM_FN_PTR(address, SIG_DFL)) {
2322    st->print("SIG_DFL");
2323  } else if (handler == CAST_FROM_FN_PTR(address, SIG_IGN)) {
2324    st->print("SIG_IGN");
2325  } else {
2326    st->print("[%s]", get_signal_handler_name(handler, buf, buflen));
2327  }
2328
2329  st->print(", sa_mask[0]=" PTR32_FORMAT, *(uint32_t*)&sa.sa_mask);
2330
2331  address rh = VMError::get_resetted_sighandler(sig);
2332  // May be, handler was resetted by VMError?
2333  if(rh != NULL) {
2334    handler = rh;
2335    sa.sa_flags = VMError::get_resetted_sigflags(sig);
2336  }
2337
2338  st->print(", sa_flags="   PTR32_FORMAT, sa.sa_flags);
2339
2340  // Check: is it our handler?
2341  if(handler == CAST_FROM_FN_PTR(address, signalHandler) ||
2342     handler == CAST_FROM_FN_PTR(address, sigINTRHandler)) {
2343    // It is our signal handler
2344    // check for flags
2345    if(sa.sa_flags != os::Solaris::get_our_sigflags(sig)) {
2346      st->print(
2347        ", flags was changed from " PTR32_FORMAT ", consider using jsig library",
2348        os::Solaris::get_our_sigflags(sig));
2349    }
2350  }
2351  st->cr();
2352}
2353
2354void os::print_signal_handlers(outputStream* st, char* buf, size_t buflen) {
2355  st->print_cr("Signal Handlers:");
2356  print_signal_handler(st, SIGSEGV, buf, buflen);
2357  print_signal_handler(st, SIGBUS , buf, buflen);
2358  print_signal_handler(st, SIGFPE , buf, buflen);
2359  print_signal_handler(st, SIGPIPE, buf, buflen);
2360  print_signal_handler(st, SIGXFSZ, buf, buflen);
2361  print_signal_handler(st, SIGILL , buf, buflen);
2362  print_signal_handler(st, INTERRUPT_SIGNAL, buf, buflen);
2363  print_signal_handler(st, ASYNC_SIGNAL, buf, buflen);
2364  print_signal_handler(st, BREAK_SIGNAL, buf, buflen);
2365  print_signal_handler(st, SHUTDOWN1_SIGNAL , buf, buflen);
2366  print_signal_handler(st, SHUTDOWN2_SIGNAL , buf, buflen);
2367  print_signal_handler(st, SHUTDOWN3_SIGNAL, buf, buflen);
2368  print_signal_handler(st, os::Solaris::SIGinterrupt(), buf, buflen);
2369  print_signal_handler(st, os::Solaris::SIGasync(), buf, buflen);
2370}
2371
2372static char saved_jvm_path[MAXPATHLEN] = { 0 };
2373
2374// Find the full path to the current module, libjvm.so or libjvm_g.so
2375void os::jvm_path(char *buf, jint buflen) {
2376  // Error checking.
2377  if (buflen < MAXPATHLEN) {
2378    assert(false, "must use a large-enough buffer");
2379    buf[0] = '\0';
2380    return;
2381  }
2382  // Lazy resolve the path to current module.
2383  if (saved_jvm_path[0] != 0) {
2384    strcpy(buf, saved_jvm_path);
2385    return;
2386  }
2387
2388  Dl_info dlinfo;
2389  int ret = dladdr(CAST_FROM_FN_PTR(void *, os::jvm_path), &dlinfo);
2390  assert(ret != 0, "cannot locate libjvm");
2391  realpath((char *)dlinfo.dli_fname, buf);
2392
2393  if (strcmp(Arguments::sun_java_launcher(), "gamma") == 0) {
2394    // Support for the gamma launcher.  Typical value for buf is
2395    // "<JAVA_HOME>/jre/lib/<arch>/<vmtype>/libjvm.so".  If "/jre/lib/" appears at
2396    // the right place in the string, then assume we are installed in a JDK and
2397    // we're done.  Otherwise, check for a JAVA_HOME environment variable and fix
2398    // up the path so it looks like libjvm.so is installed there (append a
2399    // fake suffix hotspot/libjvm.so).
2400    const char *p = buf + strlen(buf) - 1;
2401    for (int count = 0; p > buf && count < 5; ++count) {
2402      for (--p; p > buf && *p != '/'; --p)
2403        /* empty */ ;
2404    }
2405
2406    if (strncmp(p, "/jre/lib/", 9) != 0) {
2407      // Look for JAVA_HOME in the environment.
2408      char* java_home_var = ::getenv("JAVA_HOME");
2409      if (java_home_var != NULL && java_home_var[0] != 0) {
2410        char cpu_arch[12];
2411        sysinfo(SI_ARCHITECTURE, cpu_arch, sizeof(cpu_arch));
2412#ifdef _LP64
2413        // If we are on sparc running a 64-bit vm, look in jre/lib/sparcv9.
2414        if (strcmp(cpu_arch, "sparc") == 0) {
2415          strcat(cpu_arch, "v9");
2416        } else if (strcmp(cpu_arch, "i386") == 0) {
2417          strcpy(cpu_arch, "amd64");
2418        }
2419#endif
2420        // Check the current module name "libjvm.so" or "libjvm_g.so".
2421        p = strrchr(buf, '/');
2422        assert(strstr(p, "/libjvm") == p, "invalid library name");
2423        p = strstr(p, "_g") ? "_g" : "";
2424
2425        realpath(java_home_var, buf);
2426        sprintf(buf + strlen(buf), "/jre/lib/%s", cpu_arch);
2427        if (0 == access(buf, F_OK)) {
2428          // Use current module name "libjvm[_g].so" instead of
2429          // "libjvm"debug_only("_g")".so" since for fastdebug version
2430          // we should have "libjvm.so" but debug_only("_g") adds "_g"!
2431          // It is used when we are choosing the HPI library's name
2432          // "libhpi[_g].so" in hpi::initialize_get_interface().
2433          sprintf(buf + strlen(buf), "/hotspot/libjvm%s.so", p);
2434        } else {
2435          // Go back to path of .so
2436          realpath((char *)dlinfo.dli_fname, buf);
2437        }
2438      }
2439    }
2440  }
2441
2442  strcpy(saved_jvm_path, buf);
2443}
2444
2445
2446void os::print_jni_name_prefix_on(outputStream* st, int args_size) {
2447  // no prefix required, not even "_"
2448}
2449
2450
2451void os::print_jni_name_suffix_on(outputStream* st, int args_size) {
2452  // no suffix required
2453}
2454
2455
2456// sun.misc.Signal
2457
2458extern "C" {
2459  static void UserHandler(int sig, void *siginfo, void *context) {
2460    // Ctrl-C is pressed during error reporting, likely because the error
2461    // handler fails to abort. Let VM die immediately.
2462    if (sig == SIGINT && is_error_reported()) {
2463       os::die();
2464    }
2465
2466    os::signal_notify(sig);
2467    // We do not need to reinstate the signal handler each time...
2468  }
2469}
2470
2471void* os::user_handler() {
2472  return CAST_FROM_FN_PTR(void*, UserHandler);
2473}
2474
2475extern "C" {
2476  typedef void (*sa_handler_t)(int);
2477  typedef void (*sa_sigaction_t)(int, siginfo_t *, void *);
2478}
2479
2480void* os::signal(int signal_number, void* handler) {
2481  struct sigaction sigAct, oldSigAct;
2482  sigfillset(&(sigAct.sa_mask));
2483  sigAct.sa_flags = SA_RESTART & ~SA_RESETHAND;
2484  sigAct.sa_handler = CAST_TO_FN_PTR(sa_handler_t, handler);
2485
2486  if (sigaction(signal_number, &sigAct, &oldSigAct))
2487    // -1 means registration failed
2488    return (void *)-1;
2489
2490  return CAST_FROM_FN_PTR(void*, oldSigAct.sa_handler);
2491}
2492
2493void os::signal_raise(int signal_number) {
2494  raise(signal_number);
2495}
2496
2497/*
2498 * The following code is moved from os.cpp for making this
2499 * code platform specific, which it is by its very nature.
2500 */
2501
2502// a counter for each possible signal value
2503static int Sigexit = 0;
2504static int Maxlibjsigsigs;
2505static jint *pending_signals = NULL;
2506static int *preinstalled_sigs = NULL;
2507static struct sigaction *chainedsigactions = NULL;
2508static sema_t sig_sem;
2509typedef int (*version_getting_t)();
2510version_getting_t os::Solaris::get_libjsig_version = NULL;
2511static int libjsigversion = NULL;
2512
2513int os::sigexitnum_pd() {
2514  assert(Sigexit > 0, "signal memory not yet initialized");
2515  return Sigexit;
2516}
2517
2518void os::Solaris::init_signal_mem() {
2519  // Initialize signal structures
2520  Maxsignum = SIGRTMAX;
2521  Sigexit = Maxsignum+1;
2522  assert(Maxsignum >0, "Unable to obtain max signal number");
2523
2524  Maxlibjsigsigs = Maxsignum;
2525
2526  // pending_signals has one int per signal
2527  // The additional signal is for SIGEXIT - exit signal to signal_thread
2528  pending_signals = (jint *)os::malloc(sizeof(jint) * (Sigexit+1));
2529  memset(pending_signals, 0, (sizeof(jint) * (Sigexit+1)));
2530
2531  if (UseSignalChaining) {
2532     chainedsigactions = (struct sigaction *)malloc(sizeof(struct sigaction)
2533       * (Maxsignum + 1));
2534     memset(chainedsigactions, 0, (sizeof(struct sigaction) * (Maxsignum + 1)));
2535     preinstalled_sigs = (int *)os::malloc(sizeof(int) * (Maxsignum + 1));
2536     memset(preinstalled_sigs, 0, (sizeof(int) * (Maxsignum + 1)));
2537  }
2538  ourSigFlags = (int*)malloc(sizeof(int) * (Maxsignum + 1 ));
2539  memset(ourSigFlags, 0, sizeof(int) * (Maxsignum + 1));
2540}
2541
2542void os::signal_init_pd() {
2543  int ret;
2544
2545  ret = ::sema_init(&sig_sem, 0, NULL, NULL);
2546  assert(ret == 0, "sema_init() failed");
2547}
2548
2549void os::signal_notify(int signal_number) {
2550  int ret;
2551
2552  Atomic::inc(&pending_signals[signal_number]);
2553  ret = ::sema_post(&sig_sem);
2554  assert(ret == 0, "sema_post() failed");
2555}
2556
2557static int check_pending_signals(bool wait_for_signal) {
2558  int ret;
2559  while (true) {
2560    for (int i = 0; i < Sigexit + 1; i++) {
2561      jint n = pending_signals[i];
2562      if (n > 0 && n == Atomic::cmpxchg(n - 1, &pending_signals[i], n)) {
2563        return i;
2564      }
2565    }
2566    if (!wait_for_signal) {
2567      return -1;
2568    }
2569    JavaThread *thread = JavaThread::current();
2570    ThreadBlockInVM tbivm(thread);
2571
2572    bool threadIsSuspended;
2573    do {
2574      thread->set_suspend_equivalent();
2575      // cleared by handle_special_suspend_equivalent_condition() or java_suspend_self()
2576      while((ret = ::sema_wait(&sig_sem)) == EINTR)
2577          ;
2578      assert(ret == 0, "sema_wait() failed");
2579
2580      // were we externally suspended while we were waiting?
2581      threadIsSuspended = thread->handle_special_suspend_equivalent_condition();
2582      if (threadIsSuspended) {
2583        //
2584        // The semaphore has been incremented, but while we were waiting
2585        // another thread suspended us. We don't want to continue running
2586        // while suspended because that would surprise the thread that
2587        // suspended us.
2588        //
2589        ret = ::sema_post(&sig_sem);
2590        assert(ret == 0, "sema_post() failed");
2591
2592        thread->java_suspend_self();
2593      }
2594    } while (threadIsSuspended);
2595  }
2596}
2597
2598int os::signal_lookup() {
2599  return check_pending_signals(false);
2600}
2601
2602int os::signal_wait() {
2603  return check_pending_signals(true);
2604}
2605
2606////////////////////////////////////////////////////////////////////////////////
2607// Virtual Memory
2608
2609static int page_size = -1;
2610
2611// The mmap MAP_ALIGN flag is supported on Solaris 9 and later.  init_2() will
2612// clear this var if support is not available.
2613static bool has_map_align = true;
2614
2615int os::vm_page_size() {
2616  assert(page_size != -1, "must call os::init");
2617  return page_size;
2618}
2619
2620// Solaris allocates memory by pages.
2621int os::vm_allocation_granularity() {
2622  assert(page_size != -1, "must call os::init");
2623  return page_size;
2624}
2625
2626bool os::commit_memory(char* addr, size_t bytes) {
2627  size_t size = bytes;
2628  return
2629     NULL != Solaris::mmap_chunk(addr, size, MAP_PRIVATE|MAP_FIXED,
2630                                 PROT_READ | PROT_WRITE | PROT_EXEC);
2631}
2632
2633bool os::commit_memory(char* addr, size_t bytes, size_t alignment_hint) {
2634  if (commit_memory(addr, bytes)) {
2635    if (UseMPSS && alignment_hint > (size_t)vm_page_size()) {
2636      // If the large page size has been set and the VM
2637      // is using large pages, use the large page size
2638      // if it is smaller than the alignment hint. This is
2639      // a case where the VM wants to use a larger alignment size
2640      // for its own reasons but still want to use large pages
2641      // (which is what matters to setting the mpss range.
2642      size_t page_size = 0;
2643      if (large_page_size() < alignment_hint) {
2644        assert(UseLargePages, "Expected to be here for large page use only");
2645        page_size = large_page_size();
2646      } else {
2647        // If the alignment hint is less than the large page
2648        // size, the VM wants a particular alignment (thus the hint)
2649        // for internal reasons.  Try to set the mpss range using
2650        // the alignment_hint.
2651        page_size = alignment_hint;
2652      }
2653      // Since this is a hint, ignore any failures.
2654      (void)Solaris::set_mpss_range(addr, bytes, page_size);
2655    }
2656    return true;
2657  }
2658  return false;
2659}
2660
2661// Uncommit the pages in a specified region.
2662void os::free_memory(char* addr, size_t bytes) {
2663  if (madvise(addr, bytes, MADV_FREE) < 0) {
2664    debug_only(warning("MADV_FREE failed."));
2665    return;
2666  }
2667}
2668
2669// Change the page size in a given range.
2670void os::realign_memory(char *addr, size_t bytes, size_t alignment_hint) {
2671  assert((intptr_t)addr % alignment_hint == 0, "Address should be aligned.");
2672  assert((intptr_t)(addr + bytes) % alignment_hint == 0, "End should be aligned.");
2673  Solaris::set_mpss_range(addr, bytes, alignment_hint);
2674}
2675
2676// Tell the OS to make the range local to the first-touching LWP
2677void os::numa_make_local(char *addr, size_t bytes, int lgrp_hint) {
2678  assert((intptr_t)addr % os::vm_page_size() == 0, "Address should be page-aligned.");
2679  if (madvise(addr, bytes, MADV_ACCESS_LWP) < 0) {
2680    debug_only(warning("MADV_ACCESS_LWP failed."));
2681  }
2682}
2683
2684// Tell the OS that this range would be accessed from different LWPs.
2685void os::numa_make_global(char *addr, size_t bytes) {
2686  assert((intptr_t)addr % os::vm_page_size() == 0, "Address should be page-aligned.");
2687  if (madvise(addr, bytes, MADV_ACCESS_MANY) < 0) {
2688    debug_only(warning("MADV_ACCESS_MANY failed."));
2689  }
2690}
2691
2692// Get the number of the locality groups.
2693size_t os::numa_get_groups_num() {
2694  size_t n = Solaris::lgrp_nlgrps(Solaris::lgrp_cookie());
2695  return n != -1 ? n : 1;
2696}
2697
2698// Get a list of leaf locality groups. A leaf lgroup is group that
2699// doesn't have any children. Typical leaf group is a CPU or a CPU/memory
2700// board. An LWP is assigned to one of these groups upon creation.
2701size_t os::numa_get_leaf_groups(int *ids, size_t size) {
2702   if ((ids[0] = Solaris::lgrp_root(Solaris::lgrp_cookie())) == -1) {
2703     ids[0] = 0;
2704     return 1;
2705   }
2706   int result_size = 0, top = 1, bottom = 0, cur = 0;
2707   for (int k = 0; k < size; k++) {
2708     int r = Solaris::lgrp_children(Solaris::lgrp_cookie(), ids[cur],
2709                                    (Solaris::lgrp_id_t*)&ids[top], size - top);
2710     if (r == -1) {
2711       ids[0] = 0;
2712       return 1;
2713     }
2714     if (!r) {
2715       // That's a leaf node.
2716       assert (bottom <= cur, "Sanity check");
2717       // Check if the node has memory
2718       if (Solaris::lgrp_resources(Solaris::lgrp_cookie(), ids[cur],
2719                                   NULL, 0, LGRP_RSRC_MEM) > 0) {
2720         ids[bottom++] = ids[cur];
2721       }
2722     }
2723     top += r;
2724     cur++;
2725   }
2726   if (bottom == 0) {
2727     // Handle a situation, when the OS reports no memory available.
2728     // Assume UMA architecture.
2729     ids[0] = 0;
2730     return 1;
2731   }
2732   return bottom;
2733}
2734
2735// Detect the topology change. Typically happens during CPU plugging-unplugging.
2736bool os::numa_topology_changed() {
2737  int is_stale = Solaris::lgrp_cookie_stale(Solaris::lgrp_cookie());
2738  if (is_stale != -1 && is_stale) {
2739    Solaris::lgrp_fini(Solaris::lgrp_cookie());
2740    Solaris::lgrp_cookie_t c = Solaris::lgrp_init(Solaris::LGRP_VIEW_CALLER);
2741    assert(c != 0, "Failure to initialize LGRP API");
2742    Solaris::set_lgrp_cookie(c);
2743    return true;
2744  }
2745  return false;
2746}
2747
2748// Get the group id of the current LWP.
2749int os::numa_get_group_id() {
2750  int lgrp_id = Solaris::lgrp_home(P_LWPID, P_MYID);
2751  if (lgrp_id == -1) {
2752    return 0;
2753  }
2754  const int size = os::numa_get_groups_num();
2755  int *ids = (int*)alloca(size * sizeof(int));
2756
2757  // Get the ids of all lgroups with memory; r is the count.
2758  int r = Solaris::lgrp_resources(Solaris::lgrp_cookie(), lgrp_id,
2759                                  (Solaris::lgrp_id_t*)ids, size, LGRP_RSRC_MEM);
2760  if (r <= 0) {
2761    return 0;
2762  }
2763  return ids[os::random() % r];
2764}
2765
2766// Request information about the page.
2767bool os::get_page_info(char *start, page_info* info) {
2768  const uint_t info_types[] = { MEMINFO_VLGRP, MEMINFO_VPAGESIZE };
2769  uint64_t addr = (uintptr_t)start;
2770  uint64_t outdata[2];
2771  uint_t validity = 0;
2772
2773  if (os::Solaris::meminfo(&addr, 1, info_types, 2, outdata, &validity) < 0) {
2774    return false;
2775  }
2776
2777  info->size = 0;
2778  info->lgrp_id = -1;
2779
2780  if ((validity & 1) != 0) {
2781    if ((validity & 2) != 0) {
2782      info->lgrp_id = outdata[0];
2783    }
2784    if ((validity & 4) != 0) {
2785      info->size = outdata[1];
2786    }
2787    return true;
2788  }
2789  return false;
2790}
2791
2792// Scan the pages from start to end until a page different than
2793// the one described in the info parameter is encountered.
2794char *os::scan_pages(char *start, char* end, page_info* page_expected, page_info* page_found) {
2795  const uint_t info_types[] = { MEMINFO_VLGRP, MEMINFO_VPAGESIZE };
2796  const size_t types = sizeof(info_types) / sizeof(info_types[0]);
2797  uint64_t addrs[MAX_MEMINFO_CNT], outdata[types * MAX_MEMINFO_CNT];
2798  uint_t validity[MAX_MEMINFO_CNT];
2799
2800  size_t page_size = MAX2((size_t)os::vm_page_size(), page_expected->size);
2801  uint64_t p = (uint64_t)start;
2802  while (p < (uint64_t)end) {
2803    addrs[0] = p;
2804    size_t addrs_count = 1;
2805    while (addrs_count < MAX_MEMINFO_CNT && addrs[addrs_count - 1] < (uint64_t)end) {
2806      addrs[addrs_count] = addrs[addrs_count - 1] + page_size;
2807      addrs_count++;
2808    }
2809
2810    if (os::Solaris::meminfo(addrs, addrs_count, info_types, types, outdata, validity) < 0) {
2811      return NULL;
2812    }
2813
2814    size_t i = 0;
2815    for (; i < addrs_count; i++) {
2816      if ((validity[i] & 1) != 0) {
2817        if ((validity[i] & 4) != 0) {
2818          if (outdata[types * i + 1] != page_expected->size) {
2819            break;
2820          }
2821        } else
2822          if (page_expected->size != 0) {
2823            break;
2824          }
2825
2826        if ((validity[i] & 2) != 0 && page_expected->lgrp_id > 0) {
2827          if (outdata[types * i] != page_expected->lgrp_id) {
2828            break;
2829          }
2830        }
2831      } else {
2832        return NULL;
2833      }
2834    }
2835
2836    if (i != addrs_count) {
2837      if ((validity[i] & 2) != 0) {
2838        page_found->lgrp_id = outdata[types * i];
2839      } else {
2840        page_found->lgrp_id = -1;
2841      }
2842      if ((validity[i] & 4) != 0) {
2843        page_found->size = outdata[types * i + 1];
2844      } else {
2845        page_found->size = 0;
2846      }
2847      return (char*)addrs[i];
2848    }
2849
2850    p = addrs[addrs_count - 1] + page_size;
2851  }
2852  return end;
2853}
2854
2855bool os::uncommit_memory(char* addr, size_t bytes) {
2856  size_t size = bytes;
2857  // Map uncommitted pages PROT_NONE so we fail early if we touch an
2858  // uncommitted page. Otherwise, the read/write might succeed if we
2859  // have enough swap space to back the physical page.
2860  return
2861    NULL != Solaris::mmap_chunk(addr, size,
2862                                MAP_PRIVATE|MAP_FIXED|MAP_NORESERVE,
2863                                PROT_NONE);
2864}
2865
2866char* os::Solaris::mmap_chunk(char *addr, size_t size, int flags, int prot) {
2867  char *b = (char *)mmap(addr, size, prot, flags, os::Solaris::_dev_zero_fd, 0);
2868
2869  if (b == MAP_FAILED) {
2870    return NULL;
2871  }
2872  return b;
2873}
2874
2875char* os::Solaris::anon_mmap(char* requested_addr, size_t bytes, size_t alignment_hint, bool fixed) {
2876  char* addr = requested_addr;
2877  int flags = MAP_PRIVATE | MAP_NORESERVE;
2878
2879  assert(!(fixed && (alignment_hint > 0)), "alignment hint meaningless with fixed mmap");
2880
2881  if (fixed) {
2882    flags |= MAP_FIXED;
2883  } else if (has_map_align && (alignment_hint > (size_t) vm_page_size())) {
2884    flags |= MAP_ALIGN;
2885    addr = (char*) alignment_hint;
2886  }
2887
2888  // Map uncommitted pages PROT_NONE so we fail early if we touch an
2889  // uncommitted page. Otherwise, the read/write might succeed if we
2890  // have enough swap space to back the physical page.
2891  return mmap_chunk(addr, bytes, flags, PROT_NONE);
2892}
2893
2894char* os::reserve_memory(size_t bytes, char* requested_addr, size_t alignment_hint) {
2895  char* addr = Solaris::anon_mmap(requested_addr, bytes, alignment_hint, (requested_addr != NULL));
2896
2897  guarantee(requested_addr == NULL || requested_addr == addr,
2898            "OS failed to return requested mmap address.");
2899  return addr;
2900}
2901
2902// Reserve memory at an arbitrary address, only if that area is
2903// available (and not reserved for something else).
2904
2905char* os::attempt_reserve_memory_at(size_t bytes, char* requested_addr) {
2906  const int max_tries = 10;
2907  char* base[max_tries];
2908  size_t size[max_tries];
2909
2910  // Solaris adds a gap between mmap'ed regions.  The size of the gap
2911  // is dependent on the requested size and the MMU.  Our initial gap
2912  // value here is just a guess and will be corrected later.
2913  bool had_top_overlap = false;
2914  bool have_adjusted_gap = false;
2915  size_t gap = 0x400000;
2916
2917  // Assert only that the size is a multiple of the page size, since
2918  // that's all that mmap requires, and since that's all we really know
2919  // about at this low abstraction level.  If we need higher alignment,
2920  // we can either pass an alignment to this method or verify alignment
2921  // in one of the methods further up the call chain.  See bug 5044738.
2922  assert(bytes % os::vm_page_size() == 0, "reserving unexpected size block");
2923
2924  // Since snv_84, Solaris attempts to honor the address hint - see 5003415.
2925  // Give it a try, if the kernel honors the hint we can return immediately.
2926  char* addr = Solaris::anon_mmap(requested_addr, bytes, 0, false);
2927  volatile int err = errno;
2928  if (addr == requested_addr) {
2929    return addr;
2930  } else if (addr != NULL) {
2931    unmap_memory(addr, bytes);
2932  }
2933
2934  if (PrintMiscellaneous && Verbose) {
2935    char buf[256];
2936    buf[0] = '\0';
2937    if (addr == NULL) {
2938      jio_snprintf(buf, sizeof(buf), ": %s", strerror(err));
2939    }
2940    warning("attempt_reserve_memory_at: couldn't reserve %d bytes at "
2941            PTR_FORMAT ": reserve_memory_helper returned " PTR_FORMAT
2942            "%s", bytes, requested_addr, addr, buf);
2943  }
2944
2945  // Address hint method didn't work.  Fall back to the old method.
2946  // In theory, once SNV becomes our oldest supported platform, this
2947  // code will no longer be needed.
2948  //
2949  // Repeatedly allocate blocks until the block is allocated at the
2950  // right spot. Give up after max_tries.
2951  int i;
2952  for (i = 0; i < max_tries; ++i) {
2953    base[i] = reserve_memory(bytes);
2954
2955    if (base[i] != NULL) {
2956      // Is this the block we wanted?
2957      if (base[i] == requested_addr) {
2958        size[i] = bytes;
2959        break;
2960      }
2961
2962      // check that the gap value is right
2963      if (had_top_overlap && !have_adjusted_gap) {
2964        size_t actual_gap = base[i-1] - base[i] - bytes;
2965        if (gap != actual_gap) {
2966          // adjust the gap value and retry the last 2 allocations
2967          assert(i > 0, "gap adjustment code problem");
2968          have_adjusted_gap = true;  // adjust the gap only once, just in case
2969          gap = actual_gap;
2970          if (PrintMiscellaneous && Verbose) {
2971            warning("attempt_reserve_memory_at: adjusted gap to 0x%lx", gap);
2972          }
2973          unmap_memory(base[i], bytes);
2974          unmap_memory(base[i-1], size[i-1]);
2975          i-=2;
2976          continue;
2977        }
2978      }
2979
2980      // Does this overlap the block we wanted? Give back the overlapped
2981      // parts and try again.
2982      //
2983      // There is still a bug in this code: if top_overlap == bytes,
2984      // the overlap is offset from requested region by the value of gap.
2985      // In this case giving back the overlapped part will not work,
2986      // because we'll give back the entire block at base[i] and
2987      // therefore the subsequent allocation will not generate a new gap.
2988      // This could be fixed with a new algorithm that used larger
2989      // or variable size chunks to find the requested region -
2990      // but such a change would introduce additional complications.
2991      // It's rare enough that the planets align for this bug,
2992      // so we'll just wait for a fix for 6204603/5003415 which
2993      // will provide a mmap flag to allow us to avoid this business.
2994
2995      size_t top_overlap = requested_addr + (bytes + gap) - base[i];
2996      if (top_overlap >= 0 && top_overlap < bytes) {
2997        had_top_overlap = true;
2998        unmap_memory(base[i], top_overlap);
2999        base[i] += top_overlap;
3000        size[i] = bytes - top_overlap;
3001      } else {
3002        size_t bottom_overlap = base[i] + bytes - requested_addr;
3003        if (bottom_overlap >= 0 && bottom_overlap < bytes) {
3004          if (PrintMiscellaneous && Verbose && bottom_overlap == 0) {
3005            warning("attempt_reserve_memory_at: possible alignment bug");
3006          }
3007          unmap_memory(requested_addr, bottom_overlap);
3008          size[i] = bytes - bottom_overlap;
3009        } else {
3010          size[i] = bytes;
3011        }
3012      }
3013    }
3014  }
3015
3016  // Give back the unused reserved pieces.
3017
3018  for (int j = 0; j < i; ++j) {
3019    if (base[j] != NULL) {
3020      unmap_memory(base[j], size[j]);
3021    }
3022  }
3023
3024  return (i < max_tries) ? requested_addr : NULL;
3025}
3026
3027bool os::release_memory(char* addr, size_t bytes) {
3028  size_t size = bytes;
3029  return munmap(addr, size) == 0;
3030}
3031
3032static bool solaris_mprotect(char* addr, size_t bytes, int prot) {
3033  assert(addr == (char*)align_size_down((uintptr_t)addr, os::vm_page_size()),
3034         "addr must be page aligned");
3035  int retVal = mprotect(addr, bytes, prot);
3036  return retVal == 0;
3037}
3038
3039// Protect memory (Used to pass readonly pages through
3040// JNI GetArray<type>Elements with empty arrays.)
3041// Also, used for serialization page and for compressed oops null pointer
3042// checking.
3043bool os::protect_memory(char* addr, size_t bytes, ProtType prot,
3044                        bool is_committed) {
3045  unsigned int p = 0;
3046  switch (prot) {
3047  case MEM_PROT_NONE: p = PROT_NONE; break;
3048  case MEM_PROT_READ: p = PROT_READ; break;
3049  case MEM_PROT_RW:   p = PROT_READ|PROT_WRITE; break;
3050  case MEM_PROT_RWX:  p = PROT_READ|PROT_WRITE|PROT_EXEC; break;
3051  default:
3052    ShouldNotReachHere();
3053  }
3054  // is_committed is unused.
3055  return solaris_mprotect(addr, bytes, p);
3056}
3057
3058// guard_memory and unguard_memory only happens within stack guard pages.
3059// Since ISM pertains only to the heap, guard and unguard memory should not
3060/// happen with an ISM region.
3061bool os::guard_memory(char* addr, size_t bytes) {
3062  return solaris_mprotect(addr, bytes, PROT_NONE);
3063}
3064
3065bool os::unguard_memory(char* addr, size_t bytes) {
3066  return solaris_mprotect(addr, bytes, PROT_READ|PROT_WRITE);
3067}
3068
3069// Large page support
3070
3071// UseLargePages is the master flag to enable/disable large page memory.
3072// UseMPSS and UseISM are supported for compatibility reasons. Their combined
3073// effects can be described in the following table:
3074//
3075// UseLargePages UseMPSS UseISM
3076//    false         *       *   => UseLargePages is the master switch, turning
3077//                                 it off will turn off both UseMPSS and
3078//                                 UseISM. VM will not use large page memory
3079//                                 regardless the settings of UseMPSS/UseISM.
3080//     true      false    false => Unless future Solaris provides other
3081//                                 mechanism to use large page memory, this
3082//                                 combination is equivalent to -UseLargePages,
3083//                                 VM will not use large page memory
3084//     true      true     false => JVM will use MPSS for large page memory.
3085//                                 This is the default behavior.
3086//     true      false    true  => JVM will use ISM for large page memory.
3087//     true      true     true  => JVM will use ISM if it is available.
3088//                                 Otherwise, JVM will fall back to MPSS.
3089//                                 Becaues ISM is now available on all
3090//                                 supported Solaris versions, this combination
3091//                                 is equivalent to +UseISM -UseMPSS.
3092
3093typedef int (*getpagesizes_func_type) (size_t[], int);
3094static size_t _large_page_size = 0;
3095
3096bool os::Solaris::ism_sanity_check(bool warn, size_t * page_size) {
3097  // x86 uses either 2M or 4M page, depending on whether PAE (Physical Address
3098  // Extensions) mode is enabled. AMD64/EM64T uses 2M page in 64bit mode. Sparc
3099  // can support multiple page sizes.
3100
3101  // Don't bother to probe page size because getpagesizes() comes with MPSS.
3102  // ISM is only recommended on old Solaris where there is no MPSS support.
3103  // Simply choose a conservative value as default.
3104  *page_size = LargePageSizeInBytes ? LargePageSizeInBytes :
3105               SPARC_ONLY(4 * M) IA32_ONLY(4 * M) AMD64_ONLY(2 * M);
3106
3107  // ISM is available on all supported Solaris versions
3108  return true;
3109}
3110
3111// Insertion sort for small arrays (descending order).
3112static void insertion_sort_descending(size_t* array, int len) {
3113  for (int i = 0; i < len; i++) {
3114    size_t val = array[i];
3115    for (size_t key = i; key > 0 && array[key - 1] < val; --key) {
3116      size_t tmp = array[key];
3117      array[key] = array[key - 1];
3118      array[key - 1] = tmp;
3119    }
3120  }
3121}
3122
3123bool os::Solaris::mpss_sanity_check(bool warn, size_t * page_size) {
3124  getpagesizes_func_type getpagesizes_func =
3125    CAST_TO_FN_PTR(getpagesizes_func_type, dlsym(RTLD_DEFAULT, "getpagesizes"));
3126  if (getpagesizes_func == NULL) {
3127    if (warn) {
3128      warning("MPSS is not supported by the operating system.");
3129    }
3130    return false;
3131  }
3132
3133  const unsigned int usable_count = VM_Version::page_size_count();
3134  if (usable_count == 1) {
3135    return false;
3136  }
3137
3138  // Fill the array of page sizes.
3139  int n = getpagesizes_func(_page_sizes, page_sizes_max);
3140  assert(n > 0, "Solaris bug?");
3141  if (n == page_sizes_max) {
3142    // Add a sentinel value (necessary only if the array was completely filled
3143    // since it is static (zeroed at initialization)).
3144    _page_sizes[--n] = 0;
3145    DEBUG_ONLY(warning("increase the size of the os::_page_sizes array.");)
3146  }
3147  assert(_page_sizes[n] == 0, "missing sentinel");
3148
3149  if (n == 1) return false;     // Only one page size available.
3150
3151  // Skip sizes larger than 4M (or LargePageSizeInBytes if it was set) and
3152  // select up to usable_count elements.  First sort the array, find the first
3153  // acceptable value, then copy the usable sizes to the top of the array and
3154  // trim the rest.  Make sure to include the default page size :-).
3155  //
3156  // A better policy could get rid of the 4M limit by taking the sizes of the
3157  // important VM memory regions (java heap and possibly the code cache) into
3158  // account.
3159  insertion_sort_descending(_page_sizes, n);
3160  const size_t size_limit =
3161    FLAG_IS_DEFAULT(LargePageSizeInBytes) ? 4 * M : LargePageSizeInBytes;
3162  int beg;
3163  for (beg = 0; beg < n && _page_sizes[beg] > size_limit; ++beg) /* empty */ ;
3164  const int end = MIN2((int)usable_count, n) - 1;
3165  for (int cur = 0; cur < end; ++cur, ++beg) {
3166    _page_sizes[cur] = _page_sizes[beg];
3167  }
3168  _page_sizes[end] = vm_page_size();
3169  _page_sizes[end + 1] = 0;
3170
3171  if (_page_sizes[end] > _page_sizes[end - 1]) {
3172    // Default page size is not the smallest; sort again.
3173    insertion_sort_descending(_page_sizes, end + 1);
3174  }
3175  *page_size = _page_sizes[0];
3176
3177  return true;
3178}
3179
3180bool os::large_page_init() {
3181  if (!UseLargePages) {
3182    UseISM = false;
3183    UseMPSS = false;
3184    return false;
3185  }
3186
3187  // print a warning if any large page related flag is specified on command line
3188  bool warn_on_failure = !FLAG_IS_DEFAULT(UseLargePages)        ||
3189                         !FLAG_IS_DEFAULT(UseISM)               ||
3190                         !FLAG_IS_DEFAULT(UseMPSS)              ||
3191                         !FLAG_IS_DEFAULT(LargePageSizeInBytes);
3192  UseISM = UseISM &&
3193           Solaris::ism_sanity_check(warn_on_failure, &_large_page_size);
3194  if (UseISM) {
3195    // ISM disables MPSS to be compatible with old JDK behavior
3196    UseMPSS = false;
3197    _page_sizes[0] = _large_page_size;
3198    _page_sizes[1] = vm_page_size();
3199  }
3200
3201  UseMPSS = UseMPSS &&
3202            Solaris::mpss_sanity_check(warn_on_failure, &_large_page_size);
3203
3204  UseLargePages = UseISM || UseMPSS;
3205  return UseLargePages;
3206}
3207
3208bool os::Solaris::set_mpss_range(caddr_t start, size_t bytes, size_t align) {
3209  // Signal to OS that we want large pages for addresses
3210  // from addr, addr + bytes
3211  struct memcntl_mha mpss_struct;
3212  mpss_struct.mha_cmd = MHA_MAPSIZE_VA;
3213  mpss_struct.mha_pagesize = align;
3214  mpss_struct.mha_flags = 0;
3215  if (memcntl(start, bytes, MC_HAT_ADVISE,
3216              (caddr_t) &mpss_struct, 0, 0) < 0) {
3217    debug_only(warning("Attempt to use MPSS failed."));
3218    return false;
3219  }
3220  return true;
3221}
3222
3223char* os::reserve_memory_special(size_t bytes) {
3224  assert(UseLargePages && UseISM, "only for ISM large pages");
3225
3226  size_t size = bytes;
3227  char* retAddr = NULL;
3228  int shmid;
3229  key_t ismKey;
3230
3231  bool warn_on_failure = UseISM &&
3232                        (!FLAG_IS_DEFAULT(UseLargePages)         ||
3233                         !FLAG_IS_DEFAULT(UseISM)                ||
3234                         !FLAG_IS_DEFAULT(LargePageSizeInBytes)
3235                        );
3236  char msg[128];
3237
3238  ismKey = IPC_PRIVATE;
3239
3240  // Create a large shared memory region to attach to based on size.
3241  // Currently, size is the total size of the heap
3242  shmid = shmget(ismKey, size, SHM_R | SHM_W | IPC_CREAT);
3243  if (shmid == -1){
3244     if (warn_on_failure) {
3245       jio_snprintf(msg, sizeof(msg), "Failed to reserve shared memory (errno = %d).", errno);
3246       warning(msg);
3247     }
3248     return NULL;
3249  }
3250
3251  // Attach to the region
3252  retAddr = (char *) shmat(shmid, 0, SHM_SHARE_MMU | SHM_R | SHM_W);
3253  int err = errno;
3254
3255  // Remove shmid. If shmat() is successful, the actual shared memory segment
3256  // will be deleted when it's detached by shmdt() or when the process
3257  // terminates. If shmat() is not successful this will remove the shared
3258  // segment immediately.
3259  shmctl(shmid, IPC_RMID, NULL);
3260
3261  if (retAddr == (char *) -1) {
3262    if (warn_on_failure) {
3263      jio_snprintf(msg, sizeof(msg), "Failed to attach shared memory (errno = %d).", err);
3264      warning(msg);
3265    }
3266    return NULL;
3267  }
3268
3269  return retAddr;
3270}
3271
3272bool os::release_memory_special(char* base, size_t bytes) {
3273  // detaching the SHM segment will also delete it, see reserve_memory_special()
3274  int rslt = shmdt(base);
3275  return rslt == 0;
3276}
3277
3278size_t os::large_page_size() {
3279  return _large_page_size;
3280}
3281
3282// MPSS allows application to commit large page memory on demand; with ISM
3283// the entire memory region must be allocated as shared memory.
3284bool os::can_commit_large_page_memory() {
3285  return UseISM ? false : true;
3286}
3287
3288bool os::can_execute_large_page_memory() {
3289  return UseISM ? false : true;
3290}
3291
3292static int os_sleep(jlong millis, bool interruptible) {
3293  const jlong limit = INT_MAX;
3294  jlong prevtime;
3295  int res;
3296
3297  while (millis > limit) {
3298    if ((res = os_sleep(limit, interruptible)) != OS_OK)
3299      return res;
3300    millis -= limit;
3301  }
3302
3303  // Restart interrupted polls with new parameters until the proper delay
3304  // has been completed.
3305
3306  prevtime = getTimeMillis();
3307
3308  while (millis > 0) {
3309    jlong newtime;
3310
3311    if (!interruptible) {
3312      // Following assert fails for os::yield_all:
3313      // assert(!thread->is_Java_thread(), "must not be java thread");
3314      res = poll(NULL, 0, millis);
3315    } else {
3316      JavaThread *jt = JavaThread::current();
3317
3318      INTERRUPTIBLE_NORESTART_VM_ALWAYS(poll(NULL, 0, millis), res, jt,
3319        os::Solaris::clear_interrupted);
3320    }
3321
3322    // INTERRUPTIBLE_NORESTART_VM_ALWAYS returns res == OS_INTRPT for
3323    // thread.Interrupt.
3324
3325    if((res == OS_ERR) && (errno == EINTR)) {
3326      newtime = getTimeMillis();
3327      assert(newtime >= prevtime, "time moving backwards");
3328    /* Doing prevtime and newtime in microseconds doesn't help precision,
3329       and trying to round up to avoid lost milliseconds can result in a
3330       too-short delay. */
3331      millis -= newtime - prevtime;
3332      if(millis <= 0)
3333        return OS_OK;
3334      prevtime = newtime;
3335    } else
3336      return res;
3337  }
3338
3339  return OS_OK;
3340}
3341
3342// Read calls from inside the vm need to perform state transitions
3343size_t os::read(int fd, void *buf, unsigned int nBytes) {
3344  INTERRUPTIBLE_RETURN_INT_VM(::read(fd, buf, nBytes), os::Solaris::clear_interrupted);
3345}
3346
3347int os::sleep(Thread* thread, jlong millis, bool interruptible) {
3348  assert(thread == Thread::current(),  "thread consistency check");
3349
3350  // TODO-FIXME: this should be removed.
3351  // On Solaris machines (especially 2.5.1) we found that sometimes the VM gets into a live lock
3352  // situation with a JavaThread being starved out of a lwp. The kernel doesn't seem to generate
3353  // a SIGWAITING signal which would enable the threads library to create a new lwp for the starving
3354  // thread. We suspect that because the Watcher thread keeps waking up at periodic intervals the kernel
3355  // is fooled into believing that the system is making progress. In the code below we block the
3356  // the watcher thread while safepoint is in progress so that it would not appear as though the
3357  // system is making progress.
3358  if (!Solaris::T2_libthread() &&
3359      thread->is_Watcher_thread() && SafepointSynchronize::is_synchronizing() && !Arguments::has_profile()) {
3360    // We now try to acquire the threads lock. Since this lock is held by the VM thread during
3361    // the entire safepoint, the watcher thread will  line up here during the safepoint.
3362    Threads_lock->lock_without_safepoint_check();
3363    Threads_lock->unlock();
3364  }
3365
3366  if (thread->is_Java_thread()) {
3367    // This is a JavaThread so we honor the _thread_blocked protocol
3368    // even for sleeps of 0 milliseconds. This was originally done
3369    // as a workaround for bug 4338139. However, now we also do it
3370    // to honor the suspend-equivalent protocol.
3371
3372    JavaThread *jt = (JavaThread *) thread;
3373    ThreadBlockInVM tbivm(jt);
3374
3375    jt->set_suspend_equivalent();
3376    // cleared by handle_special_suspend_equivalent_condition() or
3377    // java_suspend_self() via check_and_wait_while_suspended()
3378
3379    int ret_code;
3380    if (millis <= 0) {
3381      thr_yield();
3382      ret_code = 0;
3383    } else {
3384      // The original sleep() implementation did not create an
3385      // OSThreadWaitState helper for sleeps of 0 milliseconds.
3386      // I'm preserving that decision for now.
3387      OSThreadWaitState osts(jt->osthread(), false /* not Object.wait() */);
3388
3389      ret_code = os_sleep(millis, interruptible);
3390    }
3391
3392    // were we externally suspended while we were waiting?
3393    jt->check_and_wait_while_suspended();
3394
3395    return ret_code;
3396  }
3397
3398  // non-JavaThread from this point on:
3399
3400  if (millis <= 0) {
3401    thr_yield();
3402    return 0;
3403  }
3404
3405  OSThreadWaitState osts(thread->osthread(), false /* not Object.wait() */);
3406
3407  return os_sleep(millis, interruptible);
3408}
3409
3410int os::naked_sleep() {
3411  // %% make the sleep time an integer flag. for now use 1 millisec.
3412  return os_sleep(1, false);
3413}
3414
3415// Sleep forever; naked call to OS-specific sleep; use with CAUTION
3416void os::infinite_sleep() {
3417  while (true) {    // sleep forever ...
3418    ::sleep(100);   // ... 100 seconds at a time
3419  }
3420}
3421
3422// Used to convert frequent JVM_Yield() to nops
3423bool os::dont_yield() {
3424  if (DontYieldALot) {
3425    static hrtime_t last_time = 0;
3426    hrtime_t diff = getTimeNanos() - last_time;
3427
3428    if (diff < DontYieldALotInterval * 1000000)
3429      return true;
3430
3431    last_time += diff;
3432
3433    return false;
3434  }
3435  else {
3436    return false;
3437  }
3438}
3439
3440// Caveat: Solaris os::yield() causes a thread-state transition whereas
3441// the linux and win32 implementations do not.  This should be checked.
3442
3443void os::yield() {
3444  // Yields to all threads with same or greater priority
3445  os::sleep(Thread::current(), 0, false);
3446}
3447
3448// Note that yield semantics are defined by the scheduling class to which
3449// the thread currently belongs.  Typically, yield will _not yield to
3450// other equal or higher priority threads that reside on the dispatch queues
3451// of other CPUs.
3452
3453os::YieldResult os::NakedYield() { thr_yield(); return os::YIELD_UNKNOWN; }
3454
3455
3456// On Solaris we found that yield_all doesn't always yield to all other threads.
3457// There have been cases where there is a thread ready to execute but it doesn't
3458// get an lwp as the VM thread continues to spin with sleeps of 1 millisecond.
3459// The 1 millisecond wait doesn't seem long enough for the kernel to issue a
3460// SIGWAITING signal which will cause a new lwp to be created. So we count the
3461// number of times yield_all is called in the one loop and increase the sleep
3462// time after 8 attempts. If this fails too we increase the concurrency level
3463// so that the starving thread would get an lwp
3464
3465void os::yield_all(int attempts) {
3466  // Yields to all threads, including threads with lower priorities
3467  if (attempts == 0) {
3468    os::sleep(Thread::current(), 1, false);
3469  } else {
3470    int iterations = attempts % 30;
3471    if (iterations == 0 && !os::Solaris::T2_libthread()) {
3472      // thr_setconcurrency and _getconcurrency make sense only under T1.
3473      int noofLWPS = thr_getconcurrency();
3474      if (noofLWPS < (Threads::number_of_threads() + 2)) {
3475        thr_setconcurrency(thr_getconcurrency() + 1);
3476      }
3477    } else if (iterations < 25) {
3478      os::sleep(Thread::current(), 1, false);
3479    } else {
3480      os::sleep(Thread::current(), 10, false);
3481    }
3482  }
3483}
3484
3485// Called from the tight loops to possibly influence time-sharing heuristics
3486void os::loop_breaker(int attempts) {
3487  os::yield_all(attempts);
3488}
3489
3490
3491// Interface for setting lwp priorities.  If we are using T2 libthread,
3492// which forces the use of BoundThreads or we manually set UseBoundThreads,
3493// all of our threads will be assigned to real lwp's.  Using the thr_setprio
3494// function is meaningless in this mode so we must adjust the real lwp's priority
3495// The routines below implement the getting and setting of lwp priorities.
3496//
3497// Note: There are three priority scales used on Solaris.  Java priotities
3498//       which range from 1 to 10, libthread "thr_setprio" scale which range
3499//       from 0 to 127, and the current scheduling class of the process we
3500//       are running in.  This is typically from -60 to +60.
3501//       The setting of the lwp priorities in done after a call to thr_setprio
3502//       so Java priorities are mapped to libthread priorities and we map from
3503//       the latter to lwp priorities.  We don't keep priorities stored in
3504//       Java priorities since some of our worker threads want to set priorities
3505//       higher than all Java threads.
3506//
3507// For related information:
3508// (1)  man -s 2 priocntl
3509// (2)  man -s 4 priocntl
3510// (3)  man dispadmin
3511// =    librt.so
3512// =    libthread/common/rtsched.c - thrp_setlwpprio().
3513// =    ps -cL <pid> ... to validate priority.
3514// =    sched_get_priority_min and _max
3515//              pthread_create
3516//              sched_setparam
3517//              pthread_setschedparam
3518//
3519// Assumptions:
3520// +    We assume that all threads in the process belong to the same
3521//              scheduling class.   IE. an homogenous process.
3522// +    Must be root or in IA group to change change "interactive" attribute.
3523//              Priocntl() will fail silently.  The only indication of failure is when
3524//              we read-back the value and notice that it hasn't changed.
3525// +    Interactive threads enter the runq at the head, non-interactive at the tail.
3526// +    For RT, change timeslice as well.  Invariant:
3527//              constant "priority integral"
3528//              Konst == TimeSlice * (60-Priority)
3529//              Given a priority, compute appropriate timeslice.
3530// +    Higher numerical values have higher priority.
3531
3532// sched class attributes
3533typedef struct {
3534        int   schedPolicy;              // classID
3535        int   maxPrio;
3536        int   minPrio;
3537} SchedInfo;
3538
3539
3540static SchedInfo tsLimits, iaLimits, rtLimits;
3541
3542#ifdef ASSERT
3543static int  ReadBackValidate = 1;
3544#endif
3545static int  myClass     = 0;
3546static int  myMin       = 0;
3547static int  myMax       = 0;
3548static int  myCur       = 0;
3549static bool priocntl_enable = false;
3550
3551
3552// Call the version of priocntl suitable for all supported versions
3553// of Solaris. We need to call through this wrapper so that we can
3554// build on Solaris 9 and run on Solaris 8, 9 and 10.
3555//
3556// This code should be removed if we ever stop supporting Solaris 8
3557// and earlier releases.
3558
3559static long priocntl_stub(int pcver, idtype_t idtype, id_t id, int cmd, caddr_t arg);
3560typedef long (*priocntl_type)(int pcver, idtype_t idtype, id_t id, int cmd, caddr_t arg);
3561static priocntl_type priocntl_ptr = priocntl_stub;
3562
3563// Stub to set the value of the real pointer, and then call the real
3564// function.
3565
3566static long priocntl_stub(int pcver, idtype_t idtype, id_t id, int cmd, caddr_t arg) {
3567  // Try Solaris 8- name only.
3568  priocntl_type tmp = (priocntl_type)dlsym(RTLD_DEFAULT, "__priocntl");
3569  guarantee(tmp != NULL, "priocntl function not found.");
3570  priocntl_ptr = tmp;
3571  return (*priocntl_ptr)(PC_VERSION, idtype, id, cmd, arg);
3572}
3573
3574
3575// lwp_priocntl_init
3576//
3577// Try to determine the priority scale for our process.
3578//
3579// Return errno or 0 if OK.
3580//
3581static
3582int     lwp_priocntl_init ()
3583{
3584  int rslt;
3585  pcinfo_t ClassInfo;
3586  pcparms_t ParmInfo;
3587  int i;
3588
3589  if (!UseThreadPriorities) return 0;
3590
3591  // We are using Bound threads, we need to determine our priority ranges
3592  if (os::Solaris::T2_libthread() || UseBoundThreads) {
3593    // If ThreadPriorityPolicy is 1, switch tables
3594    if (ThreadPriorityPolicy == 1) {
3595      for (i = 0 ; i < MaxPriority+1; i++)
3596        os::java_to_os_priority[i] = prio_policy1[i];
3597    }
3598  }
3599  // Not using Bound Threads, set to ThreadPolicy 1
3600  else {
3601    for ( i = 0 ; i < MaxPriority+1; i++ ) {
3602      os::java_to_os_priority[i] = prio_policy1[i];
3603    }
3604    return 0;
3605  }
3606
3607
3608  // Get IDs for a set of well-known scheduling classes.
3609  // TODO-FIXME: GETCLINFO returns the current # of classes in the
3610  // the system.  We should have a loop that iterates over the
3611  // classID values, which are known to be "small" integers.
3612
3613  strcpy(ClassInfo.pc_clname, "TS");
3614  ClassInfo.pc_cid = -1;
3615  rslt = (*priocntl_ptr)(PC_VERSION, P_ALL, 0, PC_GETCID, (caddr_t)&ClassInfo);
3616  if (rslt < 0) return errno;
3617  assert(ClassInfo.pc_cid != -1, "cid for TS class is -1");
3618  tsLimits.schedPolicy = ClassInfo.pc_cid;
3619  tsLimits.maxPrio = ((tsinfo_t*)ClassInfo.pc_clinfo)->ts_maxupri;
3620  tsLimits.minPrio = -tsLimits.maxPrio;
3621
3622  strcpy(ClassInfo.pc_clname, "IA");
3623  ClassInfo.pc_cid = -1;
3624  rslt = (*priocntl_ptr)(PC_VERSION, P_ALL, 0, PC_GETCID, (caddr_t)&ClassInfo);
3625  if (rslt < 0) return errno;
3626  assert(ClassInfo.pc_cid != -1, "cid for IA class is -1");
3627  iaLimits.schedPolicy = ClassInfo.pc_cid;
3628  iaLimits.maxPrio = ((iainfo_t*)ClassInfo.pc_clinfo)->ia_maxupri;
3629  iaLimits.minPrio = -iaLimits.maxPrio;
3630
3631  strcpy(ClassInfo.pc_clname, "RT");
3632  ClassInfo.pc_cid = -1;
3633  rslt = (*priocntl_ptr)(PC_VERSION, P_ALL, 0, PC_GETCID, (caddr_t)&ClassInfo);
3634  if (rslt < 0) return errno;
3635  assert(ClassInfo.pc_cid != -1, "cid for RT class is -1");
3636  rtLimits.schedPolicy = ClassInfo.pc_cid;
3637  rtLimits.maxPrio = ((rtinfo_t*)ClassInfo.pc_clinfo)->rt_maxpri;
3638  rtLimits.minPrio = 0;
3639
3640
3641  // Query our "current" scheduling class.
3642  // This will normally be IA,TS or, rarely, RT.
3643  memset (&ParmInfo, 0, sizeof(ParmInfo));
3644  ParmInfo.pc_cid = PC_CLNULL;
3645  rslt = (*priocntl_ptr) (PC_VERSION, P_PID, P_MYID, PC_GETPARMS, (caddr_t)&ParmInfo );
3646  if ( rslt < 0 ) return errno;
3647  myClass = ParmInfo.pc_cid;
3648
3649  // We now know our scheduling classId, get specific information
3650  // the class.
3651  ClassInfo.pc_cid = myClass;
3652  ClassInfo.pc_clname[0] = 0;
3653  rslt = (*priocntl_ptr) (PC_VERSION, (idtype)0, 0, PC_GETCLINFO, (caddr_t)&ClassInfo );
3654  if ( rslt < 0 ) return errno;
3655
3656  if (ThreadPriorityVerbose)
3657    tty->print_cr ("lwp_priocntl_init: Class=%d(%s)...", myClass, ClassInfo.pc_clname);
3658
3659  memset(&ParmInfo, 0, sizeof(pcparms_t));
3660  ParmInfo.pc_cid = PC_CLNULL;
3661  rslt = (*priocntl_ptr)(PC_VERSION, P_PID, P_MYID, PC_GETPARMS, (caddr_t)&ParmInfo);
3662  if (rslt < 0) return errno;
3663
3664  if (ParmInfo.pc_cid == rtLimits.schedPolicy) {
3665    myMin = rtLimits.minPrio;
3666    myMax = rtLimits.maxPrio;
3667  } else if (ParmInfo.pc_cid == iaLimits.schedPolicy) {
3668    iaparms_t *iaInfo  = (iaparms_t*)ParmInfo.pc_clparms;
3669    myMin = iaLimits.minPrio;
3670    myMax = iaLimits.maxPrio;
3671    myMax = MIN2(myMax, (int)iaInfo->ia_uprilim);       // clamp - restrict
3672  } else if (ParmInfo.pc_cid == tsLimits.schedPolicy) {
3673    tsparms_t *tsInfo  = (tsparms_t*)ParmInfo.pc_clparms;
3674    myMin = tsLimits.minPrio;
3675    myMax = tsLimits.maxPrio;
3676    myMax = MIN2(myMax, (int)tsInfo->ts_uprilim);       // clamp - restrict
3677  } else {
3678    // No clue - punt
3679    if (ThreadPriorityVerbose)
3680      tty->print_cr ("Unknown scheduling class: %s ... \n", ClassInfo.pc_clname);
3681    return EINVAL;      // no clue, punt
3682  }
3683
3684  if (ThreadPriorityVerbose)
3685        tty->print_cr ("Thread priority Range: [%d..%d]\n", myMin, myMax);
3686
3687  priocntl_enable = true;  // Enable changing priorities
3688  return 0;
3689}
3690
3691#define IAPRI(x)        ((iaparms_t *)((x).pc_clparms))
3692#define RTPRI(x)        ((rtparms_t *)((x).pc_clparms))
3693#define TSPRI(x)        ((tsparms_t *)((x).pc_clparms))
3694
3695
3696// scale_to_lwp_priority
3697//
3698// Convert from the libthread "thr_setprio" scale to our current
3699// lwp scheduling class scale.
3700//
3701static
3702int     scale_to_lwp_priority (int rMin, int rMax, int x)
3703{
3704  int v;
3705
3706  if (x == 127) return rMax;            // avoid round-down
3707    v = (((x*(rMax-rMin)))/128)+rMin;
3708  return v;
3709}
3710
3711
3712// set_lwp_priority
3713//
3714// Set the priority of the lwp.  This call should only be made
3715// when using bound threads (T2 threads are bound by default).
3716//
3717int     set_lwp_priority (int ThreadID, int lwpid, int newPrio )
3718{
3719  int rslt;
3720  int Actual, Expected, prv;
3721  pcparms_t ParmInfo;                   // for GET-SET
3722#ifdef ASSERT
3723  pcparms_t ReadBack;                   // for readback
3724#endif
3725
3726  // Set priority via PC_GETPARMS, update, PC_SETPARMS
3727  // Query current values.
3728  // TODO: accelerate this by eliminating the PC_GETPARMS call.
3729  // Cache "pcparms_t" in global ParmCache.
3730  // TODO: elide set-to-same-value
3731
3732  // If something went wrong on init, don't change priorities.
3733  if ( !priocntl_enable ) {
3734    if (ThreadPriorityVerbose)
3735      tty->print_cr("Trying to set priority but init failed, ignoring");
3736    return EINVAL;
3737  }
3738
3739
3740  // If lwp hasn't started yet, just return
3741  // the _start routine will call us again.
3742  if ( lwpid <= 0 ) {
3743    if (ThreadPriorityVerbose) {
3744      tty->print_cr ("deferring the set_lwp_priority of thread " INTPTR_FORMAT " to %d, lwpid not set",
3745                     ThreadID, newPrio);
3746    }
3747    return 0;
3748  }
3749
3750  if (ThreadPriorityVerbose) {
3751    tty->print_cr ("set_lwp_priority(" INTPTR_FORMAT "@" INTPTR_FORMAT " %d) ",
3752                   ThreadID, lwpid, newPrio);
3753  }
3754
3755  memset(&ParmInfo, 0, sizeof(pcparms_t));
3756  ParmInfo.pc_cid = PC_CLNULL;
3757  rslt = (*priocntl_ptr)(PC_VERSION, P_LWPID, lwpid, PC_GETPARMS, (caddr_t)&ParmInfo);
3758  if (rslt < 0) return errno;
3759
3760  if (ParmInfo.pc_cid == rtLimits.schedPolicy) {
3761    rtparms_t *rtInfo  = (rtparms_t*)ParmInfo.pc_clparms;
3762    rtInfo->rt_pri     = scale_to_lwp_priority (rtLimits.minPrio, rtLimits.maxPrio, newPrio);
3763    rtInfo->rt_tqsecs  = RT_NOCHANGE;
3764    rtInfo->rt_tqnsecs = RT_NOCHANGE;
3765    if (ThreadPriorityVerbose) {
3766      tty->print_cr("RT: %d->%d\n", newPrio, rtInfo->rt_pri);
3767    }
3768  } else if (ParmInfo.pc_cid == iaLimits.schedPolicy) {
3769    iaparms_t *iaInfo  = (iaparms_t*)ParmInfo.pc_clparms;
3770    int maxClamped     = MIN2(iaLimits.maxPrio, (int)iaInfo->ia_uprilim);
3771    iaInfo->ia_upri    = scale_to_lwp_priority(iaLimits.minPrio, maxClamped, newPrio);
3772    iaInfo->ia_uprilim = IA_NOCHANGE;
3773    iaInfo->ia_mode    = IA_NOCHANGE;
3774    if (ThreadPriorityVerbose) {
3775      tty->print_cr ("IA: [%d...%d] %d->%d\n",
3776               iaLimits.minPrio, maxClamped, newPrio, iaInfo->ia_upri);
3777    }
3778  } else if (ParmInfo.pc_cid == tsLimits.schedPolicy) {
3779    tsparms_t *tsInfo  = (tsparms_t*)ParmInfo.pc_clparms;
3780    int maxClamped     = MIN2(tsLimits.maxPrio, (int)tsInfo->ts_uprilim);
3781    prv                = tsInfo->ts_upri;
3782    tsInfo->ts_upri    = scale_to_lwp_priority(tsLimits.minPrio, maxClamped, newPrio);
3783    tsInfo->ts_uprilim = IA_NOCHANGE;
3784    if (ThreadPriorityVerbose) {
3785      tty->print_cr ("TS: %d [%d...%d] %d->%d\n",
3786               prv, tsLimits.minPrio, maxClamped, newPrio, tsInfo->ts_upri);
3787    }
3788    if (prv == tsInfo->ts_upri) return 0;
3789  } else {
3790    if ( ThreadPriorityVerbose ) {
3791      tty->print_cr ("Unknown scheduling class\n");
3792    }
3793      return EINVAL;    // no clue, punt
3794  }
3795
3796  rslt = (*priocntl_ptr)(PC_VERSION, P_LWPID, lwpid, PC_SETPARMS, (caddr_t)&ParmInfo);
3797  if (ThreadPriorityVerbose && rslt) {
3798    tty->print_cr ("PC_SETPARMS ->%d %d\n", rslt, errno);
3799  }
3800  if (rslt < 0) return errno;
3801
3802#ifdef ASSERT
3803  // Sanity check: read back what we just attempted to set.
3804  // In theory it could have changed in the interim ...
3805  //
3806  // The priocntl system call is tricky.
3807  // Sometimes it'll validate the priority value argument and
3808  // return EINVAL if unhappy.  At other times it fails silently.
3809  // Readbacks are prudent.
3810
3811  if (!ReadBackValidate) return 0;
3812
3813  memset(&ReadBack, 0, sizeof(pcparms_t));
3814  ReadBack.pc_cid = PC_CLNULL;
3815  rslt = (*priocntl_ptr)(PC_VERSION, P_LWPID, lwpid, PC_GETPARMS, (caddr_t)&ReadBack);
3816  assert(rslt >= 0, "priocntl failed");
3817  Actual = Expected = 0xBAD;
3818  assert(ParmInfo.pc_cid == ReadBack.pc_cid, "cid's don't match");
3819  if (ParmInfo.pc_cid == rtLimits.schedPolicy) {
3820    Actual   = RTPRI(ReadBack)->rt_pri;
3821    Expected = RTPRI(ParmInfo)->rt_pri;
3822  } else if (ParmInfo.pc_cid == iaLimits.schedPolicy) {
3823    Actual   = IAPRI(ReadBack)->ia_upri;
3824    Expected = IAPRI(ParmInfo)->ia_upri;
3825  } else if (ParmInfo.pc_cid == tsLimits.schedPolicy) {
3826    Actual   = TSPRI(ReadBack)->ts_upri;
3827    Expected = TSPRI(ParmInfo)->ts_upri;
3828  } else {
3829    if ( ThreadPriorityVerbose ) {
3830      tty->print_cr("set_lwp_priority: unexpected class in readback: %d\n", ParmInfo.pc_cid);
3831    }
3832  }
3833
3834  if (Actual != Expected) {
3835    if ( ThreadPriorityVerbose ) {
3836      tty->print_cr ("set_lwp_priority(%d %d) Class=%d: actual=%d vs expected=%d\n",
3837             lwpid, newPrio, ReadBack.pc_cid, Actual, Expected);
3838    }
3839  }
3840#endif
3841
3842  return 0;
3843}
3844
3845
3846
3847// Solaris only gives access to 128 real priorities at a time,
3848// so we expand Java's ten to fill this range.  This would be better
3849// if we dynamically adjusted relative priorities.
3850//
3851// The ThreadPriorityPolicy option allows us to select 2 different
3852// priority scales.
3853//
3854// ThreadPriorityPolicy=0
3855// Since the Solaris' default priority is MaximumPriority, we do not
3856// set a priority lower than Max unless a priority lower than
3857// NormPriority is requested.
3858//
3859// ThreadPriorityPolicy=1
3860// This mode causes the priority table to get filled with
3861// linear values.  NormPriority get's mapped to 50% of the
3862// Maximum priority an so on.  This will cause VM threads
3863// to get unfair treatment against other Solaris processes
3864// which do not explicitly alter their thread priorities.
3865//
3866
3867
3868int os::java_to_os_priority[MaxPriority + 1] = {
3869  -99999,         // 0 Entry should never be used
3870
3871  0,              // 1 MinPriority
3872  32,             // 2
3873  64,             // 3
3874
3875  96,             // 4
3876  127,            // 5 NormPriority
3877  127,            // 6
3878
3879  127,            // 7
3880  127,            // 8
3881  127,            // 9 NearMaxPriority
3882
3883  127             // 10 MaxPriority
3884};
3885
3886
3887OSReturn os::set_native_priority(Thread* thread, int newpri) {
3888  assert(newpri >= MinimumPriority && newpri <= MaximumPriority, "bad priority mapping");
3889  if ( !UseThreadPriorities ) return OS_OK;
3890  int status = thr_setprio(thread->osthread()->thread_id(), newpri);
3891  if ( os::Solaris::T2_libthread() || (UseBoundThreads && thread->osthread()->is_vm_created()) )
3892    status |= (set_lwp_priority (thread->osthread()->thread_id(),
3893                    thread->osthread()->lwp_id(), newpri ));
3894  return (status == 0) ? OS_OK : OS_ERR;
3895}
3896
3897
3898OSReturn os::get_native_priority(const Thread* const thread, int *priority_ptr) {
3899  int p;
3900  if ( !UseThreadPriorities ) {
3901    *priority_ptr = NormalPriority;
3902    return OS_OK;
3903  }
3904  int status = thr_getprio(thread->osthread()->thread_id(), &p);
3905  if (status != 0) {
3906    return OS_ERR;
3907  }
3908  *priority_ptr = p;
3909  return OS_OK;
3910}
3911
3912
3913// Hint to the underlying OS that a task switch would not be good.
3914// Void return because it's a hint and can fail.
3915void os::hint_no_preempt() {
3916  schedctl_start(schedctl_init());
3917}
3918
3919void os::interrupt(Thread* thread) {
3920  assert(Thread::current() == thread || Threads_lock->owned_by_self(), "possibility of dangling Thread pointer");
3921
3922  OSThread* osthread = thread->osthread();
3923
3924  int isInterrupted = osthread->interrupted();
3925  if (!isInterrupted) {
3926      osthread->set_interrupted(true);
3927      OrderAccess::fence();
3928      // os::sleep() is implemented with either poll (NULL,0,timeout) or
3929      // by parking on _SleepEvent.  If the former, thr_kill will unwedge
3930      // the sleeper by SIGINTR, otherwise the unpark() will wake the sleeper.
3931      ParkEvent * const slp = thread->_SleepEvent ;
3932      if (slp != NULL) slp->unpark() ;
3933  }
3934
3935  // For JSR166:  unpark after setting status but before thr_kill -dl
3936  if (thread->is_Java_thread()) {
3937    ((JavaThread*)thread)->parker()->unpark();
3938  }
3939
3940  // Handle interruptible wait() ...
3941  ParkEvent * const ev = thread->_ParkEvent ;
3942  if (ev != NULL) ev->unpark() ;
3943
3944  // When events are used everywhere for os::sleep, then this thr_kill
3945  // will only be needed if UseVMInterruptibleIO is true.
3946
3947  if (!isInterrupted) {
3948    int status = thr_kill(osthread->thread_id(), os::Solaris::SIGinterrupt());
3949    assert_status(status == 0, status, "thr_kill");
3950
3951    // Bump thread interruption counter
3952    RuntimeService::record_thread_interrupt_signaled_count();
3953  }
3954}
3955
3956
3957bool os::is_interrupted(Thread* thread, bool clear_interrupted) {
3958  assert(Thread::current() == thread || Threads_lock->owned_by_self(), "possibility of dangling Thread pointer");
3959
3960  OSThread* osthread = thread->osthread();
3961
3962  bool res = osthread->interrupted();
3963
3964  // NOTE that since there is no "lock" around these two operations,
3965  // there is the possibility that the interrupted flag will be
3966  // "false" but that the interrupt event will be set. This is
3967  // intentional. The effect of this is that Object.wait() will appear
3968  // to have a spurious wakeup, which is not harmful, and the
3969  // possibility is so rare that it is not worth the added complexity
3970  // to add yet another lock. It has also been recommended not to put
3971  // the interrupted flag into the os::Solaris::Event structure,
3972  // because it hides the issue.
3973  if (res && clear_interrupted) {
3974    osthread->set_interrupted(false);
3975  }
3976  return res;
3977}
3978
3979
3980void os::print_statistics() {
3981}
3982
3983int os::message_box(const char* title, const char* message) {
3984  int i;
3985  fdStream err(defaultStream::error_fd());
3986  for (i = 0; i < 78; i++) err.print_raw("=");
3987  err.cr();
3988  err.print_raw_cr(title);
3989  for (i = 0; i < 78; i++) err.print_raw("-");
3990  err.cr();
3991  err.print_raw_cr(message);
3992  for (i = 0; i < 78; i++) err.print_raw("=");
3993  err.cr();
3994
3995  char buf[16];
3996  // Prevent process from exiting upon "read error" without consuming all CPU
3997  while (::read(0, buf, sizeof(buf)) <= 0) { ::sleep(100); }
3998
3999  return buf[0] == 'y' || buf[0] == 'Y';
4000}
4001
4002// A lightweight implementation that does not suspend the target thread and
4003// thus returns only a hint. Used for profiling only!
4004ExtendedPC os::get_thread_pc(Thread* thread) {
4005  // Make sure that it is called by the watcher and the Threads lock is owned.
4006  assert(Thread::current()->is_Watcher_thread(), "Must be watcher and own Threads_lock");
4007  // For now, is only used to profile the VM Thread
4008  assert(thread->is_VM_thread(), "Can only be called for VMThread");
4009  ExtendedPC epc;
4010
4011  GetThreadPC_Callback  cb(ProfileVM_lock);
4012  OSThread *osthread = thread->osthread();
4013  const int time_to_wait = 400; // 400ms wait for initial response
4014  int status = cb.interrupt(thread, time_to_wait);
4015
4016  if (cb.is_done() ) {
4017    epc = cb.addr();
4018  } else {
4019    DEBUG_ONLY(tty->print_cr("Failed to get pc for thread: %d got %d status",
4020                              osthread->thread_id(), status););
4021    // epc is already NULL
4022  }
4023  return epc;
4024}
4025
4026
4027// This does not do anything on Solaris. This is basically a hook for being
4028// able to use structured exception handling (thread-local exception filters) on, e.g., Win32.
4029void os::os_exception_wrapper(java_call_t f, JavaValue* value, methodHandle* method, JavaCallArguments* args, Thread* thread) {
4030  f(value, method, args, thread);
4031}
4032
4033// This routine may be used by user applications as a "hook" to catch signals.
4034// The user-defined signal handler must pass unrecognized signals to this
4035// routine, and if it returns true (non-zero), then the signal handler must
4036// return immediately.  If the flag "abort_if_unrecognized" is true, then this
4037// routine will never retun false (zero), but instead will execute a VM panic
4038// routine kill the process.
4039//
4040// If this routine returns false, it is OK to call it again.  This allows
4041// the user-defined signal handler to perform checks either before or after
4042// the VM performs its own checks.  Naturally, the user code would be making
4043// a serious error if it tried to handle an exception (such as a null check
4044// or breakpoint) that the VM was generating for its own correct operation.
4045//
4046// This routine may recognize any of the following kinds of signals:
4047// SIGBUS, SIGSEGV, SIGILL, SIGFPE, BREAK_SIGNAL, SIGPIPE, SIGXFSZ,
4048// os::Solaris::SIGasync
4049// It should be consulted by handlers for any of those signals.
4050// It explicitly does not recognize os::Solaris::SIGinterrupt
4051//
4052// The caller of this routine must pass in the three arguments supplied
4053// to the function referred to in the "sa_sigaction" (not the "sa_handler")
4054// field of the structure passed to sigaction().  This routine assumes that
4055// the sa_flags field passed to sigaction() includes SA_SIGINFO and SA_RESTART.
4056//
4057// Note that the VM will print warnings if it detects conflicting signal
4058// handlers, unless invoked with the option "-XX:+AllowUserSignalHandlers".
4059//
4060extern "C" int JVM_handle_solaris_signal(int signo, siginfo_t* siginfo, void* ucontext, int abort_if_unrecognized);
4061
4062
4063void signalHandler(int sig, siginfo_t* info, void* ucVoid) {
4064  JVM_handle_solaris_signal(sig, info, ucVoid, true);
4065}
4066
4067/* Do not delete - if guarantee is ever removed,  a signal handler (even empty)
4068   is needed to provoke threads blocked on IO to return an EINTR
4069   Note: this explicitly does NOT call JVM_handle_solaris_signal and
4070   does NOT participate in signal chaining due to requirement for
4071   NOT setting SA_RESTART to make EINTR work. */
4072extern "C" void sigINTRHandler(int sig, siginfo_t* info, void* ucVoid) {
4073   if (UseSignalChaining) {
4074      struct sigaction *actp = os::Solaris::get_chained_signal_action(sig);
4075      if (actp && actp->sa_handler) {
4076        vm_exit_during_initialization("Signal chaining detected for VM interrupt signal, try -XX:+UseAltSigs");
4077      }
4078   }
4079}
4080
4081// This boolean allows users to forward their own non-matching signals
4082// to JVM_handle_solaris_signal, harmlessly.
4083bool os::Solaris::signal_handlers_are_installed = false;
4084
4085// For signal-chaining
4086bool os::Solaris::libjsig_is_loaded = false;
4087typedef struct sigaction *(*get_signal_t)(int);
4088get_signal_t os::Solaris::get_signal_action = NULL;
4089
4090struct sigaction* os::Solaris::get_chained_signal_action(int sig) {
4091  struct sigaction *actp = NULL;
4092
4093  if ((libjsig_is_loaded)  && (sig <= Maxlibjsigsigs)) {
4094    // Retrieve the old signal handler from libjsig
4095    actp = (*get_signal_action)(sig);
4096  }
4097  if (actp == NULL) {
4098    // Retrieve the preinstalled signal handler from jvm
4099    actp = get_preinstalled_handler(sig);
4100  }
4101
4102  return actp;
4103}
4104
4105static bool call_chained_handler(struct sigaction *actp, int sig,
4106                                 siginfo_t *siginfo, void *context) {
4107  // Call the old signal handler
4108  if (actp->sa_handler == SIG_DFL) {
4109    // It's more reasonable to let jvm treat it as an unexpected exception
4110    // instead of taking the default action.
4111    return false;
4112  } else if (actp->sa_handler != SIG_IGN) {
4113    if ((actp->sa_flags & SA_NODEFER) == 0) {
4114      // automaticlly block the signal
4115      sigaddset(&(actp->sa_mask), sig);
4116    }
4117
4118    sa_handler_t hand;
4119    sa_sigaction_t sa;
4120    bool siginfo_flag_set = (actp->sa_flags & SA_SIGINFO) != 0;
4121    // retrieve the chained handler
4122    if (siginfo_flag_set) {
4123      sa = actp->sa_sigaction;
4124    } else {
4125      hand = actp->sa_handler;
4126    }
4127
4128    if ((actp->sa_flags & SA_RESETHAND) != 0) {
4129      actp->sa_handler = SIG_DFL;
4130    }
4131
4132    // try to honor the signal mask
4133    sigset_t oset;
4134    thr_sigsetmask(SIG_SETMASK, &(actp->sa_mask), &oset);
4135
4136    // call into the chained handler
4137    if (siginfo_flag_set) {
4138      (*sa)(sig, siginfo, context);
4139    } else {
4140      (*hand)(sig);
4141    }
4142
4143    // restore the signal mask
4144    thr_sigsetmask(SIG_SETMASK, &oset, 0);
4145  }
4146  // Tell jvm's signal handler the signal is taken care of.
4147  return true;
4148}
4149
4150bool os::Solaris::chained_handler(int sig, siginfo_t* siginfo, void* context) {
4151  bool chained = false;
4152  // signal-chaining
4153  if (UseSignalChaining) {
4154    struct sigaction *actp = get_chained_signal_action(sig);
4155    if (actp != NULL) {
4156      chained = call_chained_handler(actp, sig, siginfo, context);
4157    }
4158  }
4159  return chained;
4160}
4161
4162struct sigaction* os::Solaris::get_preinstalled_handler(int sig) {
4163  assert((chainedsigactions != (struct sigaction *)NULL) && (preinstalled_sigs != (int *)NULL) , "signals not yet initialized");
4164  if (preinstalled_sigs[sig] != 0) {
4165    return &chainedsigactions[sig];
4166  }
4167  return NULL;
4168}
4169
4170void os::Solaris::save_preinstalled_handler(int sig, struct sigaction& oldAct) {
4171
4172  assert(sig > 0 && sig <= Maxsignum, "vm signal out of expected range");
4173  assert((chainedsigactions != (struct sigaction *)NULL) && (preinstalled_sigs != (int *)NULL) , "signals not yet initialized");
4174  chainedsigactions[sig] = oldAct;
4175  preinstalled_sigs[sig] = 1;
4176}
4177
4178void os::Solaris::set_signal_handler(int sig, bool set_installed, bool oktochain) {
4179  // Check for overwrite.
4180  struct sigaction oldAct;
4181  sigaction(sig, (struct sigaction*)NULL, &oldAct);
4182  void* oldhand = oldAct.sa_sigaction ? CAST_FROM_FN_PTR(void*,  oldAct.sa_sigaction)
4183                                      : CAST_FROM_FN_PTR(void*,  oldAct.sa_handler);
4184  if (oldhand != CAST_FROM_FN_PTR(void*, SIG_DFL) &&
4185      oldhand != CAST_FROM_FN_PTR(void*, SIG_IGN) &&
4186      oldhand != CAST_FROM_FN_PTR(void*, signalHandler)) {
4187    if (AllowUserSignalHandlers || !set_installed) {
4188      // Do not overwrite; user takes responsibility to forward to us.
4189      return;
4190    } else if (UseSignalChaining) {
4191      if (oktochain) {
4192        // save the old handler in jvm
4193        save_preinstalled_handler(sig, oldAct);
4194      } else {
4195        vm_exit_during_initialization("Signal chaining not allowed for VM interrupt signal, try -XX:+UseAltSigs.");
4196      }
4197      // libjsig also interposes the sigaction() call below and saves the
4198      // old sigaction on it own.
4199    } else {
4200      fatal2("Encountered unexpected pre-existing sigaction handler %#lx for signal %d.", (long)oldhand, sig);
4201    }
4202  }
4203
4204  struct sigaction sigAct;
4205  sigfillset(&(sigAct.sa_mask));
4206  sigAct.sa_handler = SIG_DFL;
4207
4208  sigAct.sa_sigaction = signalHandler;
4209  // Handle SIGSEGV on alternate signal stack if
4210  // not using stack banging
4211  if (!UseStackBanging && sig == SIGSEGV) {
4212    sigAct.sa_flags = SA_SIGINFO | SA_RESTART | SA_ONSTACK;
4213  // Interruptible i/o requires SA_RESTART cleared so EINTR
4214  // is returned instead of restarting system calls
4215  } else if (sig == os::Solaris::SIGinterrupt()) {
4216    sigemptyset(&sigAct.sa_mask);
4217    sigAct.sa_handler = NULL;
4218    sigAct.sa_flags = SA_SIGINFO;
4219    sigAct.sa_sigaction = sigINTRHandler;
4220  } else {
4221    sigAct.sa_flags = SA_SIGINFO | SA_RESTART;
4222  }
4223  os::Solaris::set_our_sigflags(sig, sigAct.sa_flags);
4224
4225  sigaction(sig, &sigAct, &oldAct);
4226
4227  void* oldhand2 = oldAct.sa_sigaction ? CAST_FROM_FN_PTR(void*, oldAct.sa_sigaction)
4228                                       : CAST_FROM_FN_PTR(void*, oldAct.sa_handler);
4229  assert(oldhand2 == oldhand, "no concurrent signal handler installation");
4230}
4231
4232
4233#define DO_SIGNAL_CHECK(sig) \
4234  if (!sigismember(&check_signal_done, sig)) \
4235    os::Solaris::check_signal_handler(sig)
4236
4237// This method is a periodic task to check for misbehaving JNI applications
4238// under CheckJNI, we can add any periodic checks here
4239
4240void os::run_periodic_checks() {
4241  // A big source of grief is hijacking virt. addr 0x0 on Solaris,
4242  // thereby preventing a NULL checks.
4243  if(!check_addr0_done) check_addr0_done = check_addr0(tty);
4244
4245  if (check_signals == false) return;
4246
4247  // SEGV and BUS if overridden could potentially prevent
4248  // generation of hs*.log in the event of a crash, debugging
4249  // such a case can be very challenging, so we absolutely
4250  // check for the following for a good measure:
4251  DO_SIGNAL_CHECK(SIGSEGV);
4252  DO_SIGNAL_CHECK(SIGILL);
4253  DO_SIGNAL_CHECK(SIGFPE);
4254  DO_SIGNAL_CHECK(SIGBUS);
4255  DO_SIGNAL_CHECK(SIGPIPE);
4256  DO_SIGNAL_CHECK(SIGXFSZ);
4257
4258  // ReduceSignalUsage allows the user to override these handlers
4259  // see comments at the very top and jvm_solaris.h
4260  if (!ReduceSignalUsage) {
4261    DO_SIGNAL_CHECK(SHUTDOWN1_SIGNAL);
4262    DO_SIGNAL_CHECK(SHUTDOWN2_SIGNAL);
4263    DO_SIGNAL_CHECK(SHUTDOWN3_SIGNAL);
4264    DO_SIGNAL_CHECK(BREAK_SIGNAL);
4265  }
4266
4267  // See comments above for using JVM1/JVM2 and UseAltSigs
4268  DO_SIGNAL_CHECK(os::Solaris::SIGinterrupt());
4269  DO_SIGNAL_CHECK(os::Solaris::SIGasync());
4270
4271}
4272
4273typedef int (*os_sigaction_t)(int, const struct sigaction *, struct sigaction *);
4274
4275static os_sigaction_t os_sigaction = NULL;
4276
4277void os::Solaris::check_signal_handler(int sig) {
4278  char buf[O_BUFLEN];
4279  address jvmHandler = NULL;
4280
4281  struct sigaction act;
4282  if (os_sigaction == NULL) {
4283    // only trust the default sigaction, in case it has been interposed
4284    os_sigaction = (os_sigaction_t)dlsym(RTLD_DEFAULT, "sigaction");
4285    if (os_sigaction == NULL) return;
4286  }
4287
4288  os_sigaction(sig, (struct sigaction*)NULL, &act);
4289
4290  address thisHandler = (act.sa_flags & SA_SIGINFO)
4291    ? CAST_FROM_FN_PTR(address, act.sa_sigaction)
4292    : CAST_FROM_FN_PTR(address, act.sa_handler) ;
4293
4294
4295  switch(sig) {
4296    case SIGSEGV:
4297    case SIGBUS:
4298    case SIGFPE:
4299    case SIGPIPE:
4300    case SIGXFSZ:
4301    case SIGILL:
4302      jvmHandler = CAST_FROM_FN_PTR(address, signalHandler);
4303      break;
4304
4305    case SHUTDOWN1_SIGNAL:
4306    case SHUTDOWN2_SIGNAL:
4307    case SHUTDOWN3_SIGNAL:
4308    case BREAK_SIGNAL:
4309      jvmHandler = (address)user_handler();
4310      break;
4311
4312    default:
4313      int intrsig = os::Solaris::SIGinterrupt();
4314      int asynsig = os::Solaris::SIGasync();
4315
4316      if (sig == intrsig) {
4317        jvmHandler = CAST_FROM_FN_PTR(address, sigINTRHandler);
4318      } else if (sig == asynsig) {
4319        jvmHandler = CAST_FROM_FN_PTR(address, signalHandler);
4320      } else {
4321        return;
4322      }
4323      break;
4324  }
4325
4326
4327  if (thisHandler != jvmHandler) {
4328    tty->print("Warning: %s handler ", exception_name(sig, buf, O_BUFLEN));
4329    tty->print("expected:%s", get_signal_handler_name(jvmHandler, buf, O_BUFLEN));
4330    tty->print_cr("  found:%s", get_signal_handler_name(thisHandler, buf, O_BUFLEN));
4331    // No need to check this sig any longer
4332    sigaddset(&check_signal_done, sig);
4333  } else if(os::Solaris::get_our_sigflags(sig) != 0 && act.sa_flags != os::Solaris::get_our_sigflags(sig)) {
4334    tty->print("Warning: %s handler flags ", exception_name(sig, buf, O_BUFLEN));
4335    tty->print("expected:" PTR32_FORMAT, os::Solaris::get_our_sigflags(sig));
4336    tty->print_cr("  found:" PTR32_FORMAT, act.sa_flags);
4337    // No need to check this sig any longer
4338    sigaddset(&check_signal_done, sig);
4339  }
4340
4341  // Print all the signal handler state
4342  if (sigismember(&check_signal_done, sig)) {
4343    print_signal_handlers(tty, buf, O_BUFLEN);
4344  }
4345
4346}
4347
4348void os::Solaris::install_signal_handlers() {
4349  bool libjsigdone = false;
4350  signal_handlers_are_installed = true;
4351
4352  // signal-chaining
4353  typedef void (*signal_setting_t)();
4354  signal_setting_t begin_signal_setting = NULL;
4355  signal_setting_t end_signal_setting = NULL;
4356  begin_signal_setting = CAST_TO_FN_PTR(signal_setting_t,
4357                                        dlsym(RTLD_DEFAULT, "JVM_begin_signal_setting"));
4358  if (begin_signal_setting != NULL) {
4359    end_signal_setting = CAST_TO_FN_PTR(signal_setting_t,
4360                                        dlsym(RTLD_DEFAULT, "JVM_end_signal_setting"));
4361    get_signal_action = CAST_TO_FN_PTR(get_signal_t,
4362                                       dlsym(RTLD_DEFAULT, "JVM_get_signal_action"));
4363    get_libjsig_version = CAST_TO_FN_PTR(version_getting_t,
4364                                         dlsym(RTLD_DEFAULT, "JVM_get_libjsig_version"));
4365    libjsig_is_loaded = true;
4366    if (os::Solaris::get_libjsig_version != NULL) {
4367      libjsigversion =  (*os::Solaris::get_libjsig_version)();
4368    }
4369    assert(UseSignalChaining, "should enable signal-chaining");
4370  }
4371  if (libjsig_is_loaded) {
4372    // Tell libjsig jvm is setting signal handlers
4373    (*begin_signal_setting)();
4374  }
4375
4376  set_signal_handler(SIGSEGV, true, true);
4377  set_signal_handler(SIGPIPE, true, true);
4378  set_signal_handler(SIGXFSZ, true, true);
4379  set_signal_handler(SIGBUS, true, true);
4380  set_signal_handler(SIGILL, true, true);
4381  set_signal_handler(SIGFPE, true, true);
4382
4383
4384  if (os::Solaris::SIGinterrupt() > OLDMAXSIGNUM || os::Solaris::SIGasync() > OLDMAXSIGNUM) {
4385
4386    // Pre-1.4.1 Libjsig limited to signal chaining signals <= 32 so
4387    // can not register overridable signals which might be > 32
4388    if (libjsig_is_loaded && libjsigversion <= JSIG_VERSION_1_4_1) {
4389    // Tell libjsig jvm has finished setting signal handlers
4390      (*end_signal_setting)();
4391      libjsigdone = true;
4392    }
4393  }
4394
4395  // Never ok to chain our SIGinterrupt
4396  set_signal_handler(os::Solaris::SIGinterrupt(), true, false);
4397  set_signal_handler(os::Solaris::SIGasync(), true, true);
4398
4399  if (libjsig_is_loaded && !libjsigdone) {
4400    // Tell libjsig jvm finishes setting signal handlers
4401    (*end_signal_setting)();
4402  }
4403
4404  // We don't activate signal checker if libjsig is in place, we trust ourselves
4405  // and if UserSignalHandler is installed all bets are off
4406  if (CheckJNICalls) {
4407    if (libjsig_is_loaded) {
4408      tty->print_cr("Info: libjsig is activated, all active signal checking is disabled");
4409      check_signals = false;
4410    }
4411    if (AllowUserSignalHandlers) {
4412      tty->print_cr("Info: AllowUserSignalHandlers is activated, all active signal checking is disabled");
4413      check_signals = false;
4414    }
4415  }
4416}
4417
4418
4419void report_error(const char* file_name, int line_no, const char* title, const char* format, ...);
4420
4421const char * signames[] = {
4422  "SIG0",
4423  "SIGHUP", "SIGINT", "SIGQUIT", "SIGILL", "SIGTRAP",
4424  "SIGABRT", "SIGEMT", "SIGFPE", "SIGKILL", "SIGBUS",
4425  "SIGSEGV", "SIGSYS", "SIGPIPE", "SIGALRM", "SIGTERM",
4426  "SIGUSR1", "SIGUSR2", "SIGCLD", "SIGPWR", "SIGWINCH",
4427  "SIGURG", "SIGPOLL", "SIGSTOP", "SIGTSTP", "SIGCONT",
4428  "SIGTTIN", "SIGTTOU", "SIGVTALRM", "SIGPROF", "SIGXCPU",
4429  "SIGXFSZ", "SIGWAITING", "SIGLWP", "SIGFREEZE", "SIGTHAW",
4430  "SIGCANCEL", "SIGLOST"
4431};
4432
4433const char* os::exception_name(int exception_code, char* buf, size_t size) {
4434  if (0 < exception_code && exception_code <= SIGRTMAX) {
4435    // signal
4436    if (exception_code < sizeof(signames)/sizeof(const char*)) {
4437       jio_snprintf(buf, size, "%s", signames[exception_code]);
4438    } else {
4439       jio_snprintf(buf, size, "SIG%d", exception_code);
4440    }
4441    return buf;
4442  } else {
4443    return NULL;
4444  }
4445}
4446
4447// (Static) wrappers for the new libthread API
4448int_fnP_thread_t_iP_uP_stack_tP_gregset_t os::Solaris::_thr_getstate;
4449int_fnP_thread_t_i_gregset_t os::Solaris::_thr_setstate;
4450int_fnP_thread_t_i os::Solaris::_thr_setmutator;
4451int_fnP_thread_t os::Solaris::_thr_suspend_mutator;
4452int_fnP_thread_t os::Solaris::_thr_continue_mutator;
4453
4454// (Static) wrappers for the liblgrp API
4455os::Solaris::lgrp_home_func_t os::Solaris::_lgrp_home;
4456os::Solaris::lgrp_init_func_t os::Solaris::_lgrp_init;
4457os::Solaris::lgrp_fini_func_t os::Solaris::_lgrp_fini;
4458os::Solaris::lgrp_root_func_t os::Solaris::_lgrp_root;
4459os::Solaris::lgrp_children_func_t os::Solaris::_lgrp_children;
4460os::Solaris::lgrp_resources_func_t os::Solaris::_lgrp_resources;
4461os::Solaris::lgrp_nlgrps_func_t os::Solaris::_lgrp_nlgrps;
4462os::Solaris::lgrp_cookie_stale_func_t os::Solaris::_lgrp_cookie_stale;
4463os::Solaris::lgrp_cookie_t os::Solaris::_lgrp_cookie = 0;
4464
4465// (Static) wrapper for meminfo() call.
4466os::Solaris::meminfo_func_t os::Solaris::_meminfo = 0;
4467
4468static address resolve_symbol(const char *name) {
4469  address addr;
4470
4471  addr = (address) dlsym(RTLD_DEFAULT, name);
4472  if(addr == NULL) {
4473    // RTLD_DEFAULT was not defined on some early versions of 2.5.1
4474    addr = (address) dlsym(RTLD_NEXT, name);
4475    if(addr == NULL) {
4476      fatal(dlerror());
4477    }
4478  }
4479  return addr;
4480}
4481
4482
4483
4484// isT2_libthread()
4485//
4486// Routine to determine if we are currently using the new T2 libthread.
4487//
4488// We determine if we are using T2 by reading /proc/self/lstatus and
4489// looking for a thread with the ASLWP bit set.  If we find this status
4490// bit set, we must assume that we are NOT using T2.  The T2 team
4491// has approved this algorithm.
4492//
4493// We need to determine if we are running with the new T2 libthread
4494// since setting native thread priorities is handled differently
4495// when using this library.  All threads created using T2 are bound
4496// threads. Calling thr_setprio is meaningless in this case.
4497//
4498bool isT2_libthread() {
4499  static prheader_t * lwpArray = NULL;
4500  static int lwpSize = 0;
4501  static int lwpFile = -1;
4502  lwpstatus_t * that;
4503  char lwpName [128];
4504  bool isT2 = false;
4505
4506#define ADR(x)  ((uintptr_t)(x))
4507#define LWPINDEX(ary,ix)   ((lwpstatus_t *)(((ary)->pr_entsize * (ix)) + (ADR((ary) + 1))))
4508
4509  lwpFile = open("/proc/self/lstatus", O_RDONLY, 0);
4510  if (lwpFile < 0) {
4511      if (ThreadPriorityVerbose) warning ("Couldn't open /proc/self/lstatus\n");
4512      return false;
4513  }
4514  lwpSize = 16*1024;
4515  for (;;) {
4516    lseek (lwpFile, 0, SEEK_SET);
4517    lwpArray = (prheader_t *)NEW_C_HEAP_ARRAY(char, lwpSize);
4518    if (read(lwpFile, lwpArray, lwpSize) < 0) {
4519      if (ThreadPriorityVerbose) warning("Error reading /proc/self/lstatus\n");
4520      break;
4521    }
4522    if ((lwpArray->pr_nent * lwpArray->pr_entsize) <= lwpSize) {
4523       // We got a good snapshot - now iterate over the list.
4524      int aslwpcount = 0;
4525      for (int i = 0; i < lwpArray->pr_nent; i++ ) {
4526        that = LWPINDEX(lwpArray,i);
4527        if (that->pr_flags & PR_ASLWP) {
4528          aslwpcount++;
4529        }
4530      }
4531      if (aslwpcount == 0) isT2 = true;
4532      break;
4533    }
4534    lwpSize = lwpArray->pr_nent * lwpArray->pr_entsize;
4535    FREE_C_HEAP_ARRAY(char, lwpArray);  // retry.
4536  }
4537
4538  FREE_C_HEAP_ARRAY(char, lwpArray);
4539  close (lwpFile);
4540  if (ThreadPriorityVerbose) {
4541    if (isT2) tty->print_cr("We are running with a T2 libthread\n");
4542    else tty->print_cr("We are not running with a T2 libthread\n");
4543  }
4544  return isT2;
4545}
4546
4547
4548void os::Solaris::libthread_init() {
4549  address func = (address)dlsym(RTLD_DEFAULT, "_thr_suspend_allmutators");
4550
4551  // Determine if we are running with the new T2 libthread
4552  os::Solaris::set_T2_libthread(isT2_libthread());
4553
4554  lwp_priocntl_init();
4555
4556  // RTLD_DEFAULT was not defined on some early versions of 5.5.1
4557  if(func == NULL) {
4558    func = (address) dlsym(RTLD_NEXT, "_thr_suspend_allmutators");
4559    // Guarantee that this VM is running on an new enough OS (5.6 or
4560    // later) that it will have a new enough libthread.so.
4561    guarantee(func != NULL, "libthread.so is too old.");
4562  }
4563
4564  // Initialize the new libthread getstate API wrappers
4565  func = resolve_symbol("thr_getstate");
4566  os::Solaris::set_thr_getstate(CAST_TO_FN_PTR(int_fnP_thread_t_iP_uP_stack_tP_gregset_t, func));
4567
4568  func = resolve_symbol("thr_setstate");
4569  os::Solaris::set_thr_setstate(CAST_TO_FN_PTR(int_fnP_thread_t_i_gregset_t, func));
4570
4571  func = resolve_symbol("thr_setmutator");
4572  os::Solaris::set_thr_setmutator(CAST_TO_FN_PTR(int_fnP_thread_t_i, func));
4573
4574  func = resolve_symbol("thr_suspend_mutator");
4575  os::Solaris::set_thr_suspend_mutator(CAST_TO_FN_PTR(int_fnP_thread_t, func));
4576
4577  func = resolve_symbol("thr_continue_mutator");
4578  os::Solaris::set_thr_continue_mutator(CAST_TO_FN_PTR(int_fnP_thread_t, func));
4579
4580  int size;
4581  void (*handler_info_func)(address *, int *);
4582  handler_info_func = CAST_TO_FN_PTR(void (*)(address *, int *), resolve_symbol("thr_sighndlrinfo"));
4583  handler_info_func(&handler_start, &size);
4584  handler_end = handler_start + size;
4585}
4586
4587
4588int_fnP_mutex_tP os::Solaris::_mutex_lock;
4589int_fnP_mutex_tP os::Solaris::_mutex_trylock;
4590int_fnP_mutex_tP os::Solaris::_mutex_unlock;
4591int_fnP_mutex_tP_i_vP os::Solaris::_mutex_init;
4592int_fnP_mutex_tP os::Solaris::_mutex_destroy;
4593int os::Solaris::_mutex_scope = USYNC_THREAD;
4594
4595int_fnP_cond_tP_mutex_tP_timestruc_tP os::Solaris::_cond_timedwait;
4596int_fnP_cond_tP_mutex_tP os::Solaris::_cond_wait;
4597int_fnP_cond_tP os::Solaris::_cond_signal;
4598int_fnP_cond_tP os::Solaris::_cond_broadcast;
4599int_fnP_cond_tP_i_vP os::Solaris::_cond_init;
4600int_fnP_cond_tP os::Solaris::_cond_destroy;
4601int os::Solaris::_cond_scope = USYNC_THREAD;
4602
4603void os::Solaris::synchronization_init() {
4604  if(UseLWPSynchronization) {
4605    os::Solaris::set_mutex_lock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("_lwp_mutex_lock")));
4606    os::Solaris::set_mutex_trylock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("_lwp_mutex_trylock")));
4607    os::Solaris::set_mutex_unlock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("_lwp_mutex_unlock")));
4608    os::Solaris::set_mutex_init(lwp_mutex_init);
4609    os::Solaris::set_mutex_destroy(lwp_mutex_destroy);
4610    os::Solaris::set_mutex_scope(USYNC_THREAD);
4611
4612    os::Solaris::set_cond_timedwait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP_timestruc_tP, resolve_symbol("_lwp_cond_timedwait")));
4613    os::Solaris::set_cond_wait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP, resolve_symbol("_lwp_cond_wait")));
4614    os::Solaris::set_cond_signal(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("_lwp_cond_signal")));
4615    os::Solaris::set_cond_broadcast(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("_lwp_cond_broadcast")));
4616    os::Solaris::set_cond_init(lwp_cond_init);
4617    os::Solaris::set_cond_destroy(lwp_cond_destroy);
4618    os::Solaris::set_cond_scope(USYNC_THREAD);
4619  }
4620  else {
4621    os::Solaris::set_mutex_scope(USYNC_THREAD);
4622    os::Solaris::set_cond_scope(USYNC_THREAD);
4623
4624    if(UsePthreads) {
4625      os::Solaris::set_mutex_lock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_lock")));
4626      os::Solaris::set_mutex_trylock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_trylock")));
4627      os::Solaris::set_mutex_unlock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_unlock")));
4628      os::Solaris::set_mutex_init(pthread_mutex_default_init);
4629      os::Solaris::set_mutex_destroy(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_destroy")));
4630
4631      os::Solaris::set_cond_timedwait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP_timestruc_tP, resolve_symbol("pthread_cond_timedwait")));
4632      os::Solaris::set_cond_wait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP, resolve_symbol("pthread_cond_wait")));
4633      os::Solaris::set_cond_signal(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("pthread_cond_signal")));
4634      os::Solaris::set_cond_broadcast(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("pthread_cond_broadcast")));
4635      os::Solaris::set_cond_init(pthread_cond_default_init);
4636      os::Solaris::set_cond_destroy(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("pthread_cond_destroy")));
4637    }
4638    else {
4639      os::Solaris::set_mutex_lock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("mutex_lock")));
4640      os::Solaris::set_mutex_trylock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("mutex_trylock")));
4641      os::Solaris::set_mutex_unlock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("mutex_unlock")));
4642      os::Solaris::set_mutex_init(::mutex_init);
4643      os::Solaris::set_mutex_destroy(::mutex_destroy);
4644
4645      os::Solaris::set_cond_timedwait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP_timestruc_tP, resolve_symbol("cond_timedwait")));
4646      os::Solaris::set_cond_wait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP, resolve_symbol("cond_wait")));
4647      os::Solaris::set_cond_signal(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("cond_signal")));
4648      os::Solaris::set_cond_broadcast(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("cond_broadcast")));
4649      os::Solaris::set_cond_init(::cond_init);
4650      os::Solaris::set_cond_destroy(::cond_destroy);
4651    }
4652  }
4653}
4654
4655bool os::Solaris::liblgrp_init() {
4656  void *handle = dlopen("liblgrp.so.1", RTLD_LAZY);
4657  if (handle != NULL) {
4658    os::Solaris::set_lgrp_home(CAST_TO_FN_PTR(lgrp_home_func_t, dlsym(handle, "lgrp_home")));
4659    os::Solaris::set_lgrp_init(CAST_TO_FN_PTR(lgrp_init_func_t, dlsym(handle, "lgrp_init")));
4660    os::Solaris::set_lgrp_fini(CAST_TO_FN_PTR(lgrp_fini_func_t, dlsym(handle, "lgrp_fini")));
4661    os::Solaris::set_lgrp_root(CAST_TO_FN_PTR(lgrp_root_func_t, dlsym(handle, "lgrp_root")));
4662    os::Solaris::set_lgrp_children(CAST_TO_FN_PTR(lgrp_children_func_t, dlsym(handle, "lgrp_children")));
4663    os::Solaris::set_lgrp_resources(CAST_TO_FN_PTR(lgrp_resources_func_t, dlsym(handle, "lgrp_resources")));
4664    os::Solaris::set_lgrp_nlgrps(CAST_TO_FN_PTR(lgrp_nlgrps_func_t, dlsym(handle, "lgrp_nlgrps")));
4665    os::Solaris::set_lgrp_cookie_stale(CAST_TO_FN_PTR(lgrp_cookie_stale_func_t,
4666                                       dlsym(handle, "lgrp_cookie_stale")));
4667
4668    lgrp_cookie_t c = lgrp_init(LGRP_VIEW_CALLER);
4669    set_lgrp_cookie(c);
4670    return true;
4671  }
4672  return false;
4673}
4674
4675void os::Solaris::misc_sym_init() {
4676  address func = (address)dlsym(RTLD_DEFAULT, "meminfo");
4677  if(func == NULL) {
4678    func = (address) dlsym(RTLD_NEXT, "meminfo");
4679  }
4680  if (func != NULL) {
4681    os::Solaris::set_meminfo(CAST_TO_FN_PTR(meminfo_func_t, func));
4682  }
4683}
4684
4685// Symbol doesn't exist in Solaris 8 pset.h
4686#ifndef PS_MYID
4687#define PS_MYID -3
4688#endif
4689
4690// int pset_getloadavg(psetid_t pset, double loadavg[], int nelem);
4691typedef long (*pset_getloadavg_type)(psetid_t pset, double loadavg[], int nelem);
4692static pset_getloadavg_type pset_getloadavg_ptr = NULL;
4693
4694void init_pset_getloadavg_ptr(void) {
4695  pset_getloadavg_ptr =
4696    (pset_getloadavg_type)dlsym(RTLD_DEFAULT, "pset_getloadavg");
4697  if (PrintMiscellaneous && Verbose && pset_getloadavg_ptr == NULL) {
4698    warning("pset_getloadavg function not found");
4699  }
4700}
4701
4702int os::Solaris::_dev_zero_fd = -1;
4703
4704// this is called _before_ the global arguments have been parsed
4705void os::init(void) {
4706  _initial_pid = getpid();
4707
4708  max_hrtime = first_hrtime = gethrtime();
4709
4710  init_random(1234567);
4711
4712  page_size = sysconf(_SC_PAGESIZE);
4713  if (page_size == -1)
4714    fatal1("os_solaris.cpp: os::init: sysconf failed (%s)", strerror(errno));
4715  init_page_sizes((size_t) page_size);
4716
4717  Solaris::initialize_system_info();
4718
4719  int fd = open("/dev/zero", O_RDWR);
4720  if (fd < 0) {
4721    fatal1("os::init: cannot open /dev/zero (%s)", strerror(errno));
4722  } else {
4723    Solaris::set_dev_zero_fd(fd);
4724
4725    // Close on exec, child won't inherit.
4726    fcntl(fd, F_SETFD, FD_CLOEXEC);
4727  }
4728
4729  clock_tics_per_sec = CLK_TCK;
4730
4731  // check if dladdr1() exists; dladdr1 can provide more information than
4732  // dladdr for os::dll_address_to_function_name. It comes with SunOS 5.9
4733  // and is available on linker patches for 5.7 and 5.8.
4734  // libdl.so must have been loaded, this call is just an entry lookup
4735  void * hdl = dlopen("libdl.so", RTLD_NOW);
4736  if (hdl)
4737    dladdr1_func = CAST_TO_FN_PTR(dladdr1_func_type, dlsym(hdl, "dladdr1"));
4738
4739  // (Solaris only) this switches to calls that actually do locking.
4740  ThreadCritical::initialize();
4741
4742  main_thread = thr_self();
4743
4744  // Constant minimum stack size allowed. It must be at least
4745  // the minimum of what the OS supports (thr_min_stack()), and
4746  // enough to allow the thread to get to user bytecode execution.
4747  Solaris::min_stack_allowed = MAX2(thr_min_stack(), Solaris::min_stack_allowed);
4748  // If the pagesize of the VM is greater than 8K determine the appropriate
4749  // number of initial guard pages.  The user can change this with the
4750  // command line arguments, if needed.
4751  if (vm_page_size() > 8*K) {
4752    StackYellowPages = 1;
4753    StackRedPages = 1;
4754    StackShadowPages = round_to((StackShadowPages*8*K), vm_page_size()) / vm_page_size();
4755  }
4756}
4757
4758// To install functions for atexit system call
4759extern "C" {
4760  static void perfMemory_exit_helper() {
4761    perfMemory_exit();
4762  }
4763}
4764
4765// this is called _after_ the global arguments have been parsed
4766jint os::init_2(void) {
4767  // try to enable extended file IO ASAP, see 6431278
4768  os::Solaris::try_enable_extended_io();
4769
4770  // Allocate a single page and mark it as readable for safepoint polling.  Also
4771  // use this first mmap call to check support for MAP_ALIGN.
4772  address polling_page = (address)Solaris::mmap_chunk((char*)page_size,
4773                                                      page_size,
4774                                                      MAP_PRIVATE | MAP_ALIGN,
4775                                                      PROT_READ);
4776  if (polling_page == NULL) {
4777    has_map_align = false;
4778    polling_page = (address)Solaris::mmap_chunk(NULL, page_size, MAP_PRIVATE,
4779                                                PROT_READ);
4780  }
4781
4782  os::set_polling_page(polling_page);
4783
4784#ifndef PRODUCT
4785  if( Verbose && PrintMiscellaneous )
4786    tty->print("[SafePoint Polling address: " INTPTR_FORMAT "]\n", (intptr_t)polling_page);
4787#endif
4788
4789  if (!UseMembar) {
4790    address mem_serialize_page = (address)Solaris::mmap_chunk( NULL, page_size, MAP_PRIVATE, PROT_READ | PROT_WRITE );
4791    guarantee( mem_serialize_page != NULL, "mmap Failed for memory serialize page");
4792    os::set_memory_serialize_page( mem_serialize_page );
4793
4794#ifndef PRODUCT
4795    if(Verbose && PrintMiscellaneous)
4796      tty->print("[Memory Serialize  Page address: " INTPTR_FORMAT "]\n", (intptr_t)mem_serialize_page);
4797#endif
4798}
4799
4800  FLAG_SET_DEFAULT(UseLargePages, os::large_page_init());
4801
4802  // Check minimum allowable stack size for thread creation and to initialize
4803  // the java system classes, including StackOverflowError - depends on page
4804  // size.  Add a page for compiler2 recursion in main thread.
4805  // Add in BytesPerWord times page size to account for VM stack during
4806  // class initialization depending on 32 or 64 bit VM.
4807  guarantee((Solaris::min_stack_allowed >=
4808    (StackYellowPages+StackRedPages+StackShadowPages+BytesPerWord
4809     COMPILER2_PRESENT(+1)) * page_size),
4810    "need to increase Solaris::min_stack_allowed on this platform");
4811
4812  size_t threadStackSizeInBytes = ThreadStackSize * K;
4813  if (threadStackSizeInBytes != 0 &&
4814    threadStackSizeInBytes < Solaris::min_stack_allowed) {
4815    tty->print_cr("\nThe stack size specified is too small, Specify at least %dk",
4816                  Solaris::min_stack_allowed/K);
4817    return JNI_ERR;
4818  }
4819
4820  // For 64kbps there will be a 64kb page size, which makes
4821  // the usable default stack size quite a bit less.  Increase the
4822  // stack for 64kb (or any > than 8kb) pages, this increases
4823  // virtual memory fragmentation (since we're not creating the
4824  // stack on a power of 2 boundary.  The real fix for this
4825  // should be to fix the guard page mechanism.
4826
4827  if (vm_page_size() > 8*K) {
4828      threadStackSizeInBytes = (threadStackSizeInBytes != 0)
4829         ? threadStackSizeInBytes +
4830           ((StackYellowPages + StackRedPages) * vm_page_size())
4831         : 0;
4832      ThreadStackSize = threadStackSizeInBytes/K;
4833  }
4834
4835  // Make the stack size a multiple of the page size so that
4836  // the yellow/red zones can be guarded.
4837  JavaThread::set_stack_size_at_create(round_to(threadStackSizeInBytes,
4838        vm_page_size()));
4839
4840  Solaris::libthread_init();
4841
4842  if (UseNUMA) {
4843    if (!Solaris::liblgrp_init()) {
4844      UseNUMA = false;
4845    } else {
4846      size_t lgrp_limit = os::numa_get_groups_num();
4847      int *lgrp_ids = NEW_C_HEAP_ARRAY(int, lgrp_limit);
4848      size_t lgrp_num = os::numa_get_leaf_groups(lgrp_ids, lgrp_limit);
4849      FREE_C_HEAP_ARRAY(int, lgrp_ids);
4850      if (lgrp_num < 2) {
4851        // There's only one locality group, disable NUMA.
4852        UseNUMA = false;
4853      }
4854    }
4855    if (!UseNUMA && ForceNUMA) {
4856      UseNUMA = true;
4857    }
4858  }
4859
4860  Solaris::misc_sym_init();
4861  Solaris::signal_sets_init();
4862  Solaris::init_signal_mem();
4863  Solaris::install_signal_handlers();
4864
4865  if (libjsigversion < JSIG_VERSION_1_4_1) {
4866    Maxlibjsigsigs = OLDMAXSIGNUM;
4867  }
4868
4869  // initialize synchronization primitives to use either thread or
4870  // lwp synchronization (controlled by UseLWPSynchronization)
4871  Solaris::synchronization_init();
4872
4873  if (MaxFDLimit) {
4874    // set the number of file descriptors to max. print out error
4875    // if getrlimit/setrlimit fails but continue regardless.
4876    struct rlimit nbr_files;
4877    int status = getrlimit(RLIMIT_NOFILE, &nbr_files);
4878    if (status != 0) {
4879      if (PrintMiscellaneous && (Verbose || WizardMode))
4880        perror("os::init_2 getrlimit failed");
4881    } else {
4882      nbr_files.rlim_cur = nbr_files.rlim_max;
4883      status = setrlimit(RLIMIT_NOFILE, &nbr_files);
4884      if (status != 0) {
4885        if (PrintMiscellaneous && (Verbose || WizardMode))
4886          perror("os::init_2 setrlimit failed");
4887      }
4888    }
4889  }
4890
4891  // Initialize HPI.
4892  jint hpi_result = hpi::initialize();
4893  if (hpi_result != JNI_OK) {
4894    tty->print_cr("There was an error trying to initialize the HPI library.");
4895    return hpi_result;
4896  }
4897
4898  // Calculate theoretical max. size of Threads to guard gainst
4899  // artifical out-of-memory situations, where all available address-
4900  // space has been reserved by thread stacks. Default stack size is 1Mb.
4901  size_t pre_thread_stack_size = (JavaThread::stack_size_at_create()) ?
4902    JavaThread::stack_size_at_create() : (1*K*K);
4903  assert(pre_thread_stack_size != 0, "Must have a stack");
4904  // Solaris has a maximum of 4Gb of user programs. Calculate the thread limit when
4905  // we should start doing Virtual Memory banging. Currently when the threads will
4906  // have used all but 200Mb of space.
4907  size_t max_address_space = ((unsigned int)4 * K * K * K) - (200 * K * K);
4908  Solaris::_os_thread_limit = max_address_space / pre_thread_stack_size;
4909
4910  // at-exit methods are called in the reverse order of their registration.
4911  // In Solaris 7 and earlier, atexit functions are called on return from
4912  // main or as a result of a call to exit(3C). There can be only 32 of
4913  // these functions registered and atexit() does not set errno. In Solaris
4914  // 8 and later, there is no limit to the number of functions registered
4915  // and atexit() sets errno. In addition, in Solaris 8 and later, atexit
4916  // functions are called upon dlclose(3DL) in addition to return from main
4917  // and exit(3C).
4918
4919  if (PerfAllowAtExitRegistration) {
4920    // only register atexit functions if PerfAllowAtExitRegistration is set.
4921    // atexit functions can be delayed until process exit time, which
4922    // can be problematic for embedded VM situations. Embedded VMs should
4923    // call DestroyJavaVM() to assure that VM resources are released.
4924
4925    // note: perfMemory_exit_helper atexit function may be removed in
4926    // the future if the appropriate cleanup code can be added to the
4927    // VM_Exit VMOperation's doit method.
4928    if (atexit(perfMemory_exit_helper) != 0) {
4929      warning("os::init2 atexit(perfMemory_exit_helper) failed");
4930    }
4931  }
4932
4933  // Init pset_loadavg function pointer
4934  init_pset_getloadavg_ptr();
4935
4936  return JNI_OK;
4937}
4938
4939
4940// Mark the polling page as unreadable
4941void os::make_polling_page_unreadable(void) {
4942  if( mprotect((char *)_polling_page, page_size, PROT_NONE) != 0 )
4943    fatal("Could not disable polling page");
4944};
4945
4946// Mark the polling page as readable
4947void os::make_polling_page_readable(void) {
4948  if( mprotect((char *)_polling_page, page_size, PROT_READ) != 0 )
4949    fatal("Could not enable polling page");
4950};
4951
4952// OS interface.
4953
4954int os::stat(const char *path, struct stat *sbuf) {
4955  char pathbuf[MAX_PATH];
4956  if (strlen(path) > MAX_PATH - 1) {
4957    errno = ENAMETOOLONG;
4958    return -1;
4959  }
4960  hpi::native_path(strcpy(pathbuf, path));
4961  return ::stat(pathbuf, sbuf);
4962}
4963
4964
4965bool os::check_heap(bool force) { return true; }
4966
4967typedef int (*vsnprintf_t)(char* buf, size_t count, const char* fmt, va_list argptr);
4968static vsnprintf_t sol_vsnprintf = NULL;
4969
4970int local_vsnprintf(char* buf, size_t count, const char* fmt, va_list argptr) {
4971  if (!sol_vsnprintf) {
4972    //search  for the named symbol in the objects that were loaded after libjvm
4973    void* where = RTLD_NEXT;
4974    if ((sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "__vsnprintf"))) == NULL)
4975        sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "vsnprintf"));
4976    if (!sol_vsnprintf){
4977      //search  for the named symbol in the objects that were loaded before libjvm
4978      where = RTLD_DEFAULT;
4979      if ((sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "__vsnprintf"))) == NULL)
4980        sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "vsnprintf"));
4981      assert(sol_vsnprintf != NULL, "vsnprintf not found");
4982    }
4983  }
4984  return (*sol_vsnprintf)(buf, count, fmt, argptr);
4985}
4986
4987
4988// Is a (classpath) directory empty?
4989bool os::dir_is_empty(const char* path) {
4990  DIR *dir = NULL;
4991  struct dirent *ptr;
4992
4993  dir = opendir(path);
4994  if (dir == NULL) return true;
4995
4996  /* Scan the directory */
4997  bool result = true;
4998  char buf[sizeof(struct dirent) + MAX_PATH];
4999  struct dirent *dbuf = (struct dirent *) buf;
5000  while (result && (ptr = readdir(dir, dbuf)) != NULL) {
5001    if (strcmp(ptr->d_name, ".") != 0 && strcmp(ptr->d_name, "..") != 0) {
5002      result = false;
5003    }
5004  }
5005  closedir(dir);
5006  return result;
5007}
5008
5009// create binary file, rewriting existing file if required
5010int os::create_binary_file(const char* path, bool rewrite_existing) {
5011  int oflags = O_WRONLY | O_CREAT;
5012  if (!rewrite_existing) {
5013    oflags |= O_EXCL;
5014  }
5015  return ::open64(path, oflags, S_IREAD | S_IWRITE);
5016}
5017
5018// return current position of file pointer
5019jlong os::current_file_offset(int fd) {
5020  return (jlong)::lseek64(fd, (off64_t)0, SEEK_CUR);
5021}
5022
5023// move file pointer to the specified offset
5024jlong os::seek_to_file_offset(int fd, jlong offset) {
5025  return (jlong)::lseek64(fd, (off64_t)offset, SEEK_SET);
5026}
5027
5028// Map a block of memory.
5029char* os::map_memory(int fd, const char* file_name, size_t file_offset,
5030                     char *addr, size_t bytes, bool read_only,
5031                     bool allow_exec) {
5032  int prot;
5033  int flags;
5034
5035  if (read_only) {
5036    prot = PROT_READ;
5037    flags = MAP_SHARED;
5038  } else {
5039    prot = PROT_READ | PROT_WRITE;
5040    flags = MAP_PRIVATE;
5041  }
5042
5043  if (allow_exec) {
5044    prot |= PROT_EXEC;
5045  }
5046
5047  if (addr != NULL) {
5048    flags |= MAP_FIXED;
5049  }
5050
5051  char* mapped_address = (char*)mmap(addr, (size_t)bytes, prot, flags,
5052                                     fd, file_offset);
5053  if (mapped_address == MAP_FAILED) {
5054    return NULL;
5055  }
5056  return mapped_address;
5057}
5058
5059
5060// Remap a block of memory.
5061char* os::remap_memory(int fd, const char* file_name, size_t file_offset,
5062                       char *addr, size_t bytes, bool read_only,
5063                       bool allow_exec) {
5064  // same as map_memory() on this OS
5065  return os::map_memory(fd, file_name, file_offset, addr, bytes, read_only,
5066                        allow_exec);
5067}
5068
5069
5070// Unmap a block of memory.
5071bool os::unmap_memory(char* addr, size_t bytes) {
5072  return munmap(addr, bytes) == 0;
5073}
5074
5075void os::pause() {
5076  char filename[MAX_PATH];
5077  if (PauseAtStartupFile && PauseAtStartupFile[0]) {
5078    jio_snprintf(filename, MAX_PATH, PauseAtStartupFile);
5079  } else {
5080    jio_snprintf(filename, MAX_PATH, "./vm.paused.%d", current_process_id());
5081  }
5082
5083  int fd = ::open(filename, O_WRONLY | O_CREAT | O_TRUNC, 0666);
5084  if (fd != -1) {
5085    struct stat buf;
5086    close(fd);
5087    while (::stat(filename, &buf) == 0) {
5088      (void)::poll(NULL, 0, 100);
5089    }
5090  } else {
5091    jio_fprintf(stderr,
5092      "Could not open pause file '%s', continuing immediately.\n", filename);
5093  }
5094}
5095
5096#ifndef PRODUCT
5097#ifdef INTERPOSE_ON_SYSTEM_SYNCH_FUNCTIONS
5098// Turn this on if you need to trace synch operations.
5099// Set RECORD_SYNCH_LIMIT to a large-enough value,
5100// and call record_synch_enable and record_synch_disable
5101// around the computation of interest.
5102
5103void record_synch(char* name, bool returning);  // defined below
5104
5105class RecordSynch {
5106  char* _name;
5107 public:
5108  RecordSynch(char* name) :_name(name)
5109                 { record_synch(_name, false); }
5110  ~RecordSynch() { record_synch(_name,   true);  }
5111};
5112
5113#define CHECK_SYNCH_OP(ret, name, params, args, inner)          \
5114extern "C" ret name params {                                    \
5115  typedef ret name##_t params;                                  \
5116  static name##_t* implem = NULL;                               \
5117  static int callcount = 0;                                     \
5118  if (implem == NULL) {                                         \
5119    implem = (name##_t*) dlsym(RTLD_NEXT, #name);               \
5120    if (implem == NULL)  fatal(dlerror());                      \
5121  }                                                             \
5122  ++callcount;                                                  \
5123  RecordSynch _rs(#name);                                       \
5124  inner;                                                        \
5125  return implem args;                                           \
5126}
5127// in dbx, examine callcounts this way:
5128// for n in $(eval whereis callcount | awk '{print $2}'); do print $n; done
5129
5130#define CHECK_POINTER_OK(p) \
5131  (Universe::perm_gen() == NULL || !Universe::is_reserved_heap((oop)(p)))
5132#define CHECK_MU \
5133  if (!CHECK_POINTER_OK(mu)) fatal("Mutex must be in C heap only.");
5134#define CHECK_CV \
5135  if (!CHECK_POINTER_OK(cv)) fatal("Condvar must be in C heap only.");
5136#define CHECK_P(p) \
5137  if (!CHECK_POINTER_OK(p))  fatal(false,  "Pointer must be in C heap only.");
5138
5139#define CHECK_MUTEX(mutex_op) \
5140CHECK_SYNCH_OP(int, mutex_op, (mutex_t *mu), (mu), CHECK_MU);
5141
5142CHECK_MUTEX(   mutex_lock)
5143CHECK_MUTEX(  _mutex_lock)
5144CHECK_MUTEX( mutex_unlock)
5145CHECK_MUTEX(_mutex_unlock)
5146CHECK_MUTEX( mutex_trylock)
5147CHECK_MUTEX(_mutex_trylock)
5148
5149#define CHECK_COND(cond_op) \
5150CHECK_SYNCH_OP(int, cond_op, (cond_t *cv, mutex_t *mu), (cv, mu), CHECK_MU;CHECK_CV);
5151
5152CHECK_COND( cond_wait);
5153CHECK_COND(_cond_wait);
5154CHECK_COND(_cond_wait_cancel);
5155
5156#define CHECK_COND2(cond_op) \
5157CHECK_SYNCH_OP(int, cond_op, (cond_t *cv, mutex_t *mu, timestruc_t* ts), (cv, mu, ts), CHECK_MU;CHECK_CV);
5158
5159CHECK_COND2( cond_timedwait);
5160CHECK_COND2(_cond_timedwait);
5161CHECK_COND2(_cond_timedwait_cancel);
5162
5163// do the _lwp_* versions too
5164#define mutex_t lwp_mutex_t
5165#define cond_t  lwp_cond_t
5166CHECK_MUTEX(  _lwp_mutex_lock)
5167CHECK_MUTEX(  _lwp_mutex_unlock)
5168CHECK_MUTEX(  _lwp_mutex_trylock)
5169CHECK_MUTEX( __lwp_mutex_lock)
5170CHECK_MUTEX( __lwp_mutex_unlock)
5171CHECK_MUTEX( __lwp_mutex_trylock)
5172CHECK_MUTEX(___lwp_mutex_lock)
5173CHECK_MUTEX(___lwp_mutex_unlock)
5174
5175CHECK_COND(  _lwp_cond_wait);
5176CHECK_COND( __lwp_cond_wait);
5177CHECK_COND(___lwp_cond_wait);
5178
5179CHECK_COND2(  _lwp_cond_timedwait);
5180CHECK_COND2( __lwp_cond_timedwait);
5181#undef mutex_t
5182#undef cond_t
5183
5184CHECK_SYNCH_OP(int, _lwp_suspend2,       (int lwp, int *n), (lwp, n), 0);
5185CHECK_SYNCH_OP(int,__lwp_suspend2,       (int lwp, int *n), (lwp, n), 0);
5186CHECK_SYNCH_OP(int, _lwp_kill,           (int lwp, int n),  (lwp, n), 0);
5187CHECK_SYNCH_OP(int,__lwp_kill,           (int lwp, int n),  (lwp, n), 0);
5188CHECK_SYNCH_OP(int, _lwp_sema_wait,      (lwp_sema_t* p),   (p),  CHECK_P(p));
5189CHECK_SYNCH_OP(int,__lwp_sema_wait,      (lwp_sema_t* p),   (p),  CHECK_P(p));
5190CHECK_SYNCH_OP(int, _lwp_cond_broadcast, (lwp_cond_t* cv),  (cv), CHECK_CV);
5191CHECK_SYNCH_OP(int,__lwp_cond_broadcast, (lwp_cond_t* cv),  (cv), CHECK_CV);
5192
5193
5194// recording machinery:
5195
5196enum { RECORD_SYNCH_LIMIT = 200 };
5197char* record_synch_name[RECORD_SYNCH_LIMIT];
5198void* record_synch_arg0ptr[RECORD_SYNCH_LIMIT];
5199bool record_synch_returning[RECORD_SYNCH_LIMIT];
5200thread_t record_synch_thread[RECORD_SYNCH_LIMIT];
5201int record_synch_count = 0;
5202bool record_synch_enabled = false;
5203
5204// in dbx, examine recorded data this way:
5205// for n in name arg0ptr returning thread; do print record_synch_$n[0..record_synch_count-1]; done
5206
5207void record_synch(char* name, bool returning) {
5208  if (record_synch_enabled) {
5209    if (record_synch_count < RECORD_SYNCH_LIMIT) {
5210      record_synch_name[record_synch_count] = name;
5211      record_synch_returning[record_synch_count] = returning;
5212      record_synch_thread[record_synch_count] = thr_self();
5213      record_synch_arg0ptr[record_synch_count] = &name;
5214      record_synch_count++;
5215    }
5216    // put more checking code here:
5217    // ...
5218  }
5219}
5220
5221void record_synch_enable() {
5222  // start collecting trace data, if not already doing so
5223  if (!record_synch_enabled)  record_synch_count = 0;
5224  record_synch_enabled = true;
5225}
5226
5227void record_synch_disable() {
5228  // stop collecting trace data
5229  record_synch_enabled = false;
5230}
5231
5232#endif // INTERPOSE_ON_SYSTEM_SYNCH_FUNCTIONS
5233#endif // PRODUCT
5234
5235const intptr_t thr_time_off  = (intptr_t)(&((prusage_t *)(NULL))->pr_utime);
5236const intptr_t thr_time_size = (intptr_t)(&((prusage_t *)(NULL))->pr_ttime) -
5237                               (intptr_t)(&((prusage_t *)(NULL))->pr_utime);
5238
5239
5240// JVMTI & JVM monitoring and management support
5241// The thread_cpu_time() and current_thread_cpu_time() are only
5242// supported if is_thread_cpu_time_supported() returns true.
5243// They are not supported on Solaris T1.
5244
5245// current_thread_cpu_time(bool) and thread_cpu_time(Thread*, bool)
5246// are used by JVM M&M and JVMTI to get user+sys or user CPU time
5247// of a thread.
5248//
5249// current_thread_cpu_time() and thread_cpu_time(Thread *)
5250// returns the fast estimate available on the platform.
5251
5252// hrtime_t gethrvtime() return value includes
5253// user time but does not include system time
5254jlong os::current_thread_cpu_time() {
5255  return (jlong) gethrvtime();
5256}
5257
5258jlong os::thread_cpu_time(Thread *thread) {
5259  // return user level CPU time only to be consistent with
5260  // what current_thread_cpu_time returns.
5261  // thread_cpu_time_info() must be changed if this changes
5262  return os::thread_cpu_time(thread, false /* user time only */);
5263}
5264
5265jlong os::current_thread_cpu_time(bool user_sys_cpu_time) {
5266  if (user_sys_cpu_time) {
5267    return os::thread_cpu_time(Thread::current(), user_sys_cpu_time);
5268  } else {
5269    return os::current_thread_cpu_time();
5270  }
5271}
5272
5273jlong os::thread_cpu_time(Thread *thread, bool user_sys_cpu_time) {
5274  char proc_name[64];
5275  int count;
5276  prusage_t prusage;
5277  jlong lwp_time;
5278  int fd;
5279
5280  sprintf(proc_name, "/proc/%d/lwp/%d/lwpusage",
5281                     getpid(),
5282                     thread->osthread()->lwp_id());
5283  fd = open(proc_name, O_RDONLY);
5284  if ( fd == -1 ) return -1;
5285
5286  do {
5287    count = pread(fd,
5288                  (void *)&prusage.pr_utime,
5289                  thr_time_size,
5290                  thr_time_off);
5291  } while (count < 0 && errno == EINTR);
5292  close(fd);
5293  if ( count < 0 ) return -1;
5294
5295  if (user_sys_cpu_time) {
5296    // user + system CPU time
5297    lwp_time = (((jlong)prusage.pr_stime.tv_sec +
5298                 (jlong)prusage.pr_utime.tv_sec) * (jlong)1000000000) +
5299                 (jlong)prusage.pr_stime.tv_nsec +
5300                 (jlong)prusage.pr_utime.tv_nsec;
5301  } else {
5302    // user level CPU time only
5303    lwp_time = ((jlong)prusage.pr_utime.tv_sec * (jlong)1000000000) +
5304                (jlong)prusage.pr_utime.tv_nsec;
5305  }
5306
5307  return(lwp_time);
5308}
5309
5310void os::current_thread_cpu_time_info(jvmtiTimerInfo *info_ptr) {
5311  info_ptr->max_value = ALL_64_BITS;      // will not wrap in less than 64 bits
5312  info_ptr->may_skip_backward = false;    // elapsed time not wall time
5313  info_ptr->may_skip_forward = false;     // elapsed time not wall time
5314  info_ptr->kind = JVMTI_TIMER_USER_CPU;  // only user time is returned
5315}
5316
5317void os::thread_cpu_time_info(jvmtiTimerInfo *info_ptr) {
5318  info_ptr->max_value = ALL_64_BITS;      // will not wrap in less than 64 bits
5319  info_ptr->may_skip_backward = false;    // elapsed time not wall time
5320  info_ptr->may_skip_forward = false;     // elapsed time not wall time
5321  info_ptr->kind = JVMTI_TIMER_USER_CPU;  // only user time is returned
5322}
5323
5324bool os::is_thread_cpu_time_supported() {
5325  if ( os::Solaris::T2_libthread() || UseBoundThreads ) {
5326    return true;
5327  } else {
5328    return false;
5329  }
5330}
5331
5332// System loadavg support.  Returns -1 if load average cannot be obtained.
5333// Return the load average for our processor set if the primitive exists
5334// (Solaris 9 and later).  Otherwise just return system wide loadavg.
5335int os::loadavg(double loadavg[], int nelem) {
5336  if (pset_getloadavg_ptr != NULL) {
5337    return (*pset_getloadavg_ptr)(PS_MYID, loadavg, nelem);
5338  } else {
5339    return ::getloadavg(loadavg, nelem);
5340  }
5341}
5342
5343//---------------------------------------------------------------------------------
5344#ifndef PRODUCT
5345
5346static address same_page(address x, address y) {
5347  intptr_t page_bits = -os::vm_page_size();
5348  if ((intptr_t(x) & page_bits) == (intptr_t(y) & page_bits))
5349    return x;
5350  else if (x > y)
5351    return (address)(intptr_t(y) | ~page_bits) + 1;
5352  else
5353    return (address)(intptr_t(y) & page_bits);
5354}
5355
5356bool os::find(address addr) {
5357  Dl_info dlinfo;
5358  memset(&dlinfo, 0, sizeof(dlinfo));
5359  if (dladdr(addr, &dlinfo)) {
5360#ifdef _LP64
5361    tty->print("0x%016lx: ", addr);
5362#else
5363    tty->print("0x%08x: ", addr);
5364#endif
5365    if (dlinfo.dli_sname != NULL)
5366      tty->print("%s+%#lx", dlinfo.dli_sname, addr-(intptr_t)dlinfo.dli_saddr);
5367    else if (dlinfo.dli_fname)
5368      tty->print("<offset %#lx>", addr-(intptr_t)dlinfo.dli_fbase);
5369    else
5370      tty->print("<absolute address>");
5371    if (dlinfo.dli_fname)  tty->print(" in %s", dlinfo.dli_fname);
5372#ifdef _LP64
5373    if (dlinfo.dli_fbase)  tty->print(" at 0x%016lx", dlinfo.dli_fbase);
5374#else
5375    if (dlinfo.dli_fbase)  tty->print(" at 0x%08x", dlinfo.dli_fbase);
5376#endif
5377    tty->cr();
5378
5379    if (Verbose) {
5380      // decode some bytes around the PC
5381      address begin = same_page(addr-40, addr);
5382      address end   = same_page(addr+40, addr);
5383      address       lowest = (address) dlinfo.dli_sname;
5384      if (!lowest)  lowest = (address) dlinfo.dli_fbase;
5385      if (begin < lowest)  begin = lowest;
5386      Dl_info dlinfo2;
5387      if (dladdr(end, &dlinfo2) && dlinfo2.dli_saddr != dlinfo.dli_saddr
5388          && end > dlinfo2.dli_saddr && dlinfo2.dli_saddr > begin)
5389        end = (address) dlinfo2.dli_saddr;
5390      Disassembler::decode(begin, end);
5391    }
5392    return true;
5393  }
5394  return false;
5395}
5396
5397#endif
5398
5399
5400// Following function has been added to support HotSparc's libjvm.so running
5401// under Solaris production JDK 1.2.2 / 1.3.0.  These came from
5402// src/solaris/hpi/native_threads in the EVM codebase.
5403//
5404// NOTE: This is no longer needed in the 1.3.1 and 1.4 production release
5405// libraries and should thus be removed. We will leave it behind for a while
5406// until we no longer want to able to run on top of 1.3.0 Solaris production
5407// JDK. See 4341971.
5408
5409#define STACK_SLACK 0x800
5410
5411extern "C" {
5412  intptr_t sysThreadAvailableStackWithSlack() {
5413    stack_t st;
5414    intptr_t retval, stack_top;
5415    retval = thr_stksegment(&st);
5416    assert(retval == 0, "incorrect return value from thr_stksegment");
5417    assert((address)&st < (address)st.ss_sp, "Invalid stack base returned");
5418    assert((address)&st > (address)st.ss_sp-st.ss_size, "Invalid stack size returned");
5419    stack_top=(intptr_t)st.ss_sp-st.ss_size;
5420    return ((intptr_t)&stack_top - stack_top - STACK_SLACK);
5421  }
5422}
5423
5424// Just to get the Kernel build to link on solaris for testing.
5425
5426extern "C" {
5427class ASGCT_CallTrace;
5428void AsyncGetCallTrace(ASGCT_CallTrace *trace, jint depth, void* ucontext)
5429  KERNEL_RETURN;
5430}
5431
5432
5433// ObjectMonitor park-unpark infrastructure ...
5434//
5435// We implement Solaris and Linux PlatformEvents with the
5436// obvious condvar-mutex-flag triple.
5437// Another alternative that works quite well is pipes:
5438// Each PlatformEvent consists of a pipe-pair.
5439// The thread associated with the PlatformEvent
5440// calls park(), which reads from the input end of the pipe.
5441// Unpark() writes into the other end of the pipe.
5442// The write-side of the pipe must be set NDELAY.
5443// Unfortunately pipes consume a large # of handles.
5444// Native solaris lwp_park() and lwp_unpark() work nicely, too.
5445// Using pipes for the 1st few threads might be workable, however.
5446//
5447// park() is permitted to return spuriously.
5448// Callers of park() should wrap the call to park() in
5449// an appropriate loop.  A litmus test for the correct
5450// usage of park is the following: if park() were modified
5451// to immediately return 0 your code should still work,
5452// albeit degenerating to a spin loop.
5453//
5454// An interesting optimization for park() is to use a trylock()
5455// to attempt to acquire the mutex.  If the trylock() fails
5456// then we know that a concurrent unpark() operation is in-progress.
5457// in that case the park() code could simply set _count to 0
5458// and return immediately.  The subsequent park() operation *might*
5459// return immediately.  That's harmless as the caller of park() is
5460// expected to loop.  By using trylock() we will have avoided a
5461// avoided a context switch caused by contention on the per-thread mutex.
5462//
5463// TODO-FIXME:
5464// 1.  Reconcile Doug's JSR166 j.u.c park-unpark with the
5465//     objectmonitor implementation.
5466// 2.  Collapse the JSR166 parker event, and the
5467//     objectmonitor ParkEvent into a single "Event" construct.
5468// 3.  In park() and unpark() add:
5469//     assert (Thread::current() == AssociatedWith).
5470// 4.  add spurious wakeup injection on a -XX:EarlyParkReturn=N switch.
5471//     1-out-of-N park() operations will return immediately.
5472//
5473// _Event transitions in park()
5474//   -1 => -1 : illegal
5475//    1 =>  0 : pass - return immediately
5476//    0 => -1 : block
5477//
5478// _Event serves as a restricted-range semaphore.
5479//
5480// Another possible encoding of _Event would be with
5481// explicit "PARKED" == 01b and "SIGNALED" == 10b bits.
5482//
5483// TODO-FIXME: add DTRACE probes for:
5484// 1.   Tx parks
5485// 2.   Ty unparks Tx
5486// 3.   Tx resumes from park
5487
5488
5489// value determined through experimentation
5490#define ROUNDINGFIX 11
5491
5492// utility to compute the abstime argument to timedwait.
5493// TODO-FIXME: switch from compute_abstime() to unpackTime().
5494
5495static timestruc_t* compute_abstime(timestruc_t* abstime, jlong millis) {
5496  // millis is the relative timeout time
5497  // abstime will be the absolute timeout time
5498  if (millis < 0)  millis = 0;
5499  struct timeval now;
5500  int status = gettimeofday(&now, NULL);
5501  assert(status == 0, "gettimeofday");
5502  jlong seconds = millis / 1000;
5503  jlong max_wait_period;
5504
5505  if (UseLWPSynchronization) {
5506    // forward port of fix for 4275818 (not sleeping long enough)
5507    // There was a bug in Solaris 6, 7 and pre-patch 5 of 8 where
5508    // _lwp_cond_timedwait() used a round_down algorithm rather
5509    // than a round_up. For millis less than our roundfactor
5510    // it rounded down to 0 which doesn't meet the spec.
5511    // For millis > roundfactor we may return a bit sooner, but
5512    // since we can not accurately identify the patch level and
5513    // this has already been fixed in Solaris 9 and 8 we will
5514    // leave it alone rather than always rounding down.
5515
5516    if (millis > 0 && millis < ROUNDINGFIX) millis = ROUNDINGFIX;
5517       // It appears that when we go directly through Solaris _lwp_cond_timedwait()
5518           // the acceptable max time threshold is smaller than for libthread on 2.5.1 and 2.6
5519           max_wait_period = 21000000;
5520  } else {
5521    max_wait_period = 50000000;
5522  }
5523  millis %= 1000;
5524  if (seconds > max_wait_period) {      // see man cond_timedwait(3T)
5525     seconds = max_wait_period;
5526  }
5527  abstime->tv_sec = now.tv_sec  + seconds;
5528  long       usec = now.tv_usec + millis * 1000;
5529  if (usec >= 1000000) {
5530    abstime->tv_sec += 1;
5531    usec -= 1000000;
5532  }
5533  abstime->tv_nsec = usec * 1000;
5534  return abstime;
5535}
5536
5537// Test-and-clear _Event, always leaves _Event set to 0, returns immediately.
5538// Conceptually TryPark() should be equivalent to park(0).
5539
5540int os::PlatformEvent::TryPark() {
5541  for (;;) {
5542    const int v = _Event ;
5543    guarantee ((v == 0) || (v == 1), "invariant") ;
5544    if (Atomic::cmpxchg (0, &_Event, v) == v) return v  ;
5545  }
5546}
5547
5548void os::PlatformEvent::park() {           // AKA: down()
5549  // Invariant: Only the thread associated with the Event/PlatformEvent
5550  // may call park().
5551  int v ;
5552  for (;;) {
5553      v = _Event ;
5554      if (Atomic::cmpxchg (v-1, &_Event, v) == v) break ;
5555  }
5556  guarantee (v >= 0, "invariant") ;
5557  if (v == 0) {
5558     // Do this the hard way by blocking ...
5559     // See http://monaco.sfbay/detail.jsf?cr=5094058.
5560     // TODO-FIXME: for Solaris SPARC set fprs.FEF=0 prior to parking.
5561     // Only for SPARC >= V8PlusA
5562#if defined(__sparc) && defined(COMPILER2)
5563     if (ClearFPUAtPark) { _mark_fpu_nosave() ; }
5564#endif
5565     int status = os::Solaris::mutex_lock(_mutex);
5566     assert_status(status == 0, status,  "mutex_lock");
5567     guarantee (_nParked == 0, "invariant") ;
5568     ++ _nParked ;
5569     while (_Event < 0) {
5570        // for some reason, under 2.7 lwp_cond_wait() may return ETIME ...
5571        // Treat this the same as if the wait was interrupted
5572        // With usr/lib/lwp going to kernel, always handle ETIME
5573        status = os::Solaris::cond_wait(_cond, _mutex);
5574        if (status == ETIME) status = EINTR ;
5575        assert_status(status == 0 || status == EINTR, status, "cond_wait");
5576     }
5577     -- _nParked ;
5578     _Event = 0 ;
5579     status = os::Solaris::mutex_unlock(_mutex);
5580     assert_status(status == 0, status, "mutex_unlock");
5581  }
5582}
5583
5584int os::PlatformEvent::park(jlong millis) {
5585  guarantee (_nParked == 0, "invariant") ;
5586  int v ;
5587  for (;;) {
5588      v = _Event ;
5589      if (Atomic::cmpxchg (v-1, &_Event, v) == v) break ;
5590  }
5591  guarantee (v >= 0, "invariant") ;
5592  if (v != 0) return OS_OK ;
5593
5594  int ret = OS_TIMEOUT;
5595  timestruc_t abst;
5596  compute_abstime (&abst, millis);
5597
5598  // See http://monaco.sfbay/detail.jsf?cr=5094058.
5599  // For Solaris SPARC set fprs.FEF=0 prior to parking.
5600  // Only for SPARC >= V8PlusA
5601#if defined(__sparc) && defined(COMPILER2)
5602 if (ClearFPUAtPark) { _mark_fpu_nosave() ; }
5603#endif
5604  int status = os::Solaris::mutex_lock(_mutex);
5605  assert_status(status == 0, status, "mutex_lock");
5606  guarantee (_nParked == 0, "invariant") ;
5607  ++ _nParked ;
5608  while (_Event < 0) {
5609     int status = os::Solaris::cond_timedwait(_cond, _mutex, &abst);
5610     assert_status(status == 0 || status == EINTR ||
5611                   status == ETIME || status == ETIMEDOUT,
5612                   status, "cond_timedwait");
5613     if (!FilterSpuriousWakeups) break ;                // previous semantics
5614     if (status == ETIME || status == ETIMEDOUT) break ;
5615     // We consume and ignore EINTR and spurious wakeups.
5616  }
5617  -- _nParked ;
5618  if (_Event >= 0) ret = OS_OK ;
5619  _Event = 0 ;
5620  status = os::Solaris::mutex_unlock(_mutex);
5621  assert_status(status == 0, status, "mutex_unlock");
5622  return ret;
5623}
5624
5625void os::PlatformEvent::unpark() {
5626  int v, AnyWaiters;
5627
5628  // Increment _Event.
5629  // Another acceptable implementation would be to simply swap 1
5630  // into _Event:
5631  //   if (Swap (&_Event, 1) < 0) {
5632  //      mutex_lock (_mutex) ; AnyWaiters = nParked; mutex_unlock (_mutex) ;
5633  //      if (AnyWaiters) cond_signal (_cond) ;
5634  //   }
5635
5636  for (;;) {
5637    v = _Event ;
5638    if (v > 0) {
5639       // The LD of _Event could have reordered or be satisfied
5640       // by a read-aside from this processor's write buffer.
5641       // To avoid problems execute a barrier and then
5642       // ratify the value.  A degenerate CAS() would also work.
5643       // Viz., CAS (v+0, &_Event, v) == v).
5644       OrderAccess::fence() ;
5645       if (_Event == v) return ;
5646       continue ;
5647    }
5648    if (Atomic::cmpxchg (v+1, &_Event, v) == v) break ;
5649  }
5650
5651  // If the thread associated with the event was parked, wake it.
5652  if (v < 0) {
5653     int status ;
5654     // Wait for the thread assoc with the PlatformEvent to vacate.
5655     status = os::Solaris::mutex_lock(_mutex);
5656     assert_status(status == 0, status, "mutex_lock");
5657     AnyWaiters = _nParked ;
5658     status = os::Solaris::mutex_unlock(_mutex);
5659     assert_status(status == 0, status, "mutex_unlock");
5660     guarantee (AnyWaiters == 0 || AnyWaiters == 1, "invariant") ;
5661     if (AnyWaiters != 0) {
5662       // We intentional signal *after* dropping the lock
5663       // to avoid a common class of futile wakeups.
5664       status = os::Solaris::cond_signal(_cond);
5665       assert_status(status == 0, status, "cond_signal");
5666     }
5667  }
5668}
5669
5670// JSR166
5671// -------------------------------------------------------
5672
5673/*
5674 * The solaris and linux implementations of park/unpark are fairly
5675 * conservative for now, but can be improved. They currently use a
5676 * mutex/condvar pair, plus _counter.
5677 * Park decrements _counter if > 0, else does a condvar wait.  Unpark
5678 * sets count to 1 and signals condvar.  Only one thread ever waits
5679 * on the condvar. Contention seen when trying to park implies that someone
5680 * is unparking you, so don't wait. And spurious returns are fine, so there
5681 * is no need to track notifications.
5682 */
5683
5684#define NANOSECS_PER_SEC 1000000000
5685#define NANOSECS_PER_MILLISEC 1000000
5686#define MAX_SECS 100000000
5687
5688/*
5689 * This code is common to linux and solaris and will be moved to a
5690 * common place in dolphin.
5691 *
5692 * The passed in time value is either a relative time in nanoseconds
5693 * or an absolute time in milliseconds. Either way it has to be unpacked
5694 * into suitable seconds and nanoseconds components and stored in the
5695 * given timespec structure.
5696 * Given time is a 64-bit value and the time_t used in the timespec is only
5697 * a signed-32-bit value (except on 64-bit Linux) we have to watch for
5698 * overflow if times way in the future are given. Further on Solaris versions
5699 * prior to 10 there is a restriction (see cond_timedwait) that the specified
5700 * number of seconds, in abstime, is less than current_time  + 100,000,000.
5701 * As it will be 28 years before "now + 100000000" will overflow we can
5702 * ignore overflow and just impose a hard-limit on seconds using the value
5703 * of "now + 100,000,000". This places a limit on the timeout of about 3.17
5704 * years from "now".
5705 */
5706static void unpackTime(timespec* absTime, bool isAbsolute, jlong time) {
5707  assert (time > 0, "convertTime");
5708
5709  struct timeval now;
5710  int status = gettimeofday(&now, NULL);
5711  assert(status == 0, "gettimeofday");
5712
5713  time_t max_secs = now.tv_sec + MAX_SECS;
5714
5715  if (isAbsolute) {
5716    jlong secs = time / 1000;
5717    if (secs > max_secs) {
5718      absTime->tv_sec = max_secs;
5719    }
5720    else {
5721      absTime->tv_sec = secs;
5722    }
5723    absTime->tv_nsec = (time % 1000) * NANOSECS_PER_MILLISEC;
5724  }
5725  else {
5726    jlong secs = time / NANOSECS_PER_SEC;
5727    if (secs >= MAX_SECS) {
5728      absTime->tv_sec = max_secs;
5729      absTime->tv_nsec = 0;
5730    }
5731    else {
5732      absTime->tv_sec = now.tv_sec + secs;
5733      absTime->tv_nsec = (time % NANOSECS_PER_SEC) + now.tv_usec*1000;
5734      if (absTime->tv_nsec >= NANOSECS_PER_SEC) {
5735        absTime->tv_nsec -= NANOSECS_PER_SEC;
5736        ++absTime->tv_sec; // note: this must be <= max_secs
5737      }
5738    }
5739  }
5740  assert(absTime->tv_sec >= 0, "tv_sec < 0");
5741  assert(absTime->tv_sec <= max_secs, "tv_sec > max_secs");
5742  assert(absTime->tv_nsec >= 0, "tv_nsec < 0");
5743  assert(absTime->tv_nsec < NANOSECS_PER_SEC, "tv_nsec >= nanos_per_sec");
5744}
5745
5746void Parker::park(bool isAbsolute, jlong time) {
5747
5748  // Optional fast-path check:
5749  // Return immediately if a permit is available.
5750  if (_counter > 0) {
5751      _counter = 0 ;
5752      return ;
5753  }
5754
5755  // Optional fast-exit: Check interrupt before trying to wait
5756  Thread* thread = Thread::current();
5757  assert(thread->is_Java_thread(), "Must be JavaThread");
5758  JavaThread *jt = (JavaThread *)thread;
5759  if (Thread::is_interrupted(thread, false)) {
5760    return;
5761  }
5762
5763  // First, demultiplex/decode time arguments
5764  timespec absTime;
5765  if (time < 0) { // don't wait at all
5766    return;
5767  }
5768  if (time > 0) {
5769    // Warning: this code might be exposed to the old Solaris time
5770    // round-down bugs.  Grep "roundingFix" for details.
5771    unpackTime(&absTime, isAbsolute, time);
5772  }
5773
5774  // Enter safepoint region
5775  // Beware of deadlocks such as 6317397.
5776  // The per-thread Parker:: _mutex is a classic leaf-lock.
5777  // In particular a thread must never block on the Threads_lock while
5778  // holding the Parker:: mutex.  If safepoints are pending both the
5779  // the ThreadBlockInVM() CTOR and DTOR may grab Threads_lock.
5780  ThreadBlockInVM tbivm(jt);
5781
5782  // Don't wait if cannot get lock since interference arises from
5783  // unblocking.  Also. check interrupt before trying wait
5784  if (Thread::is_interrupted(thread, false) ||
5785      os::Solaris::mutex_trylock(_mutex) != 0) {
5786    return;
5787  }
5788
5789  int status ;
5790
5791  if (_counter > 0)  { // no wait needed
5792    _counter = 0;
5793    status = os::Solaris::mutex_unlock(_mutex);
5794    assert (status == 0, "invariant") ;
5795    return;
5796  }
5797
5798#ifdef ASSERT
5799  // Don't catch signals while blocked; let the running threads have the signals.
5800  // (This allows a debugger to break into the running thread.)
5801  sigset_t oldsigs;
5802  sigset_t* allowdebug_blocked = os::Solaris::allowdebug_blocked_signals();
5803  thr_sigsetmask(SIG_BLOCK, allowdebug_blocked, &oldsigs);
5804#endif
5805
5806  OSThreadWaitState osts(thread->osthread(), false /* not Object.wait() */);
5807  jt->set_suspend_equivalent();
5808  // cleared by handle_special_suspend_equivalent_condition() or java_suspend_self()
5809
5810  // Do this the hard way by blocking ...
5811  // See http://monaco.sfbay/detail.jsf?cr=5094058.
5812  // TODO-FIXME: for Solaris SPARC set fprs.FEF=0 prior to parking.
5813  // Only for SPARC >= V8PlusA
5814#if defined(__sparc) && defined(COMPILER2)
5815  if (ClearFPUAtPark) { _mark_fpu_nosave() ; }
5816#endif
5817
5818  if (time == 0) {
5819    status = os::Solaris::cond_wait (_cond, _mutex) ;
5820  } else {
5821    status = os::Solaris::cond_timedwait (_cond, _mutex, &absTime);
5822  }
5823  // Note that an untimed cond_wait() can sometimes return ETIME on older
5824  // versions of the Solaris.
5825  assert_status(status == 0 || status == EINTR ||
5826                status == ETIME || status == ETIMEDOUT,
5827                status, "cond_timedwait");
5828
5829#ifdef ASSERT
5830  thr_sigsetmask(SIG_SETMASK, &oldsigs, NULL);
5831#endif
5832  _counter = 0 ;
5833  status = os::Solaris::mutex_unlock(_mutex);
5834  assert_status(status == 0, status, "mutex_unlock") ;
5835
5836  // If externally suspended while waiting, re-suspend
5837  if (jt->handle_special_suspend_equivalent_condition()) {
5838    jt->java_suspend_self();
5839  }
5840
5841}
5842
5843void Parker::unpark() {
5844  int s, status ;
5845  status = os::Solaris::mutex_lock (_mutex) ;
5846  assert (status == 0, "invariant") ;
5847  s = _counter;
5848  _counter = 1;
5849  status = os::Solaris::mutex_unlock (_mutex) ;
5850  assert (status == 0, "invariant") ;
5851
5852  if (s < 1) {
5853    status = os::Solaris::cond_signal (_cond) ;
5854    assert (status == 0, "invariant") ;
5855  }
5856}
5857
5858extern char** environ;
5859
5860// Run the specified command in a separate process. Return its exit value,
5861// or -1 on failure (e.g. can't fork a new process).
5862// Unlike system(), this function can be called from signal handler. It
5863// doesn't block SIGINT et al.
5864int os::fork_and_exec(char* cmd) {
5865  char * argv[4];
5866  argv[0] = (char *)"sh";
5867  argv[1] = (char *)"-c";
5868  argv[2] = cmd;
5869  argv[3] = NULL;
5870
5871  // fork is async-safe, fork1 is not so can't use in signal handler
5872  pid_t pid;
5873  Thread* t = ThreadLocalStorage::get_thread_slow();
5874  if (t != NULL && t->is_inside_signal_handler()) {
5875    pid = fork();
5876  } else {
5877    pid = fork1();
5878  }
5879
5880  if (pid < 0) {
5881    // fork failed
5882    warning("fork failed: %s", strerror(errno));
5883    return -1;
5884
5885  } else if (pid == 0) {
5886    // child process
5887
5888    // try to be consistent with system(), which uses "/usr/bin/sh" on Solaris
5889    execve("/usr/bin/sh", argv, environ);
5890
5891    // execve failed
5892    _exit(-1);
5893
5894  } else  {
5895    // copied from J2SE ..._waitForProcessExit() in UNIXProcess_md.c; we don't
5896    // care about the actual exit code, for now.
5897
5898    int status;
5899
5900    // Wait for the child process to exit.  This returns immediately if
5901    // the child has already exited. */
5902    while (waitpid(pid, &status, 0) < 0) {
5903        switch (errno) {
5904        case ECHILD: return 0;
5905        case EINTR: break;
5906        default: return -1;
5907        }
5908    }
5909
5910    if (WIFEXITED(status)) {
5911       // The child exited normally; get its exit code.
5912       return WEXITSTATUS(status);
5913    } else if (WIFSIGNALED(status)) {
5914       // The child exited because of a signal
5915       // The best value to return is 0x80 + signal number,
5916       // because that is what all Unix shells do, and because
5917       // it allows callers to distinguish between process exit and
5918       // process death by signal.
5919       return 0x80 + WTERMSIG(status);
5920    } else {
5921       // Unknown exit code; pass it through
5922       return status;
5923    }
5924  }
5925}
5926