os_solaris.cpp revision 1123:167c2986d91b
1/*
2 * Copyright 1997-2009 Sun Microsystems, Inc.  All Rights Reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation.
8 *
9 * This code is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
12 * version 2 for more details (a copy is included in the LICENSE file that
13 * accompanied this code).
14 *
15 * You should have received a copy of the GNU General Public License version
16 * 2 along with this work; if not, write to the Free Software Foundation,
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18 *
19 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
20 * CA 95054 USA or visit www.sun.com if you need additional information or
21 * have any questions.
22 *
23 */
24
25// do not include  precompiled  header file
26# include "incls/_os_solaris.cpp.incl"
27
28// put OS-includes here
29# include <dlfcn.h>
30# include <errno.h>
31# include <link.h>
32# include <poll.h>
33# include <pthread.h>
34# include <pwd.h>
35# include <schedctl.h>
36# include <setjmp.h>
37# include <signal.h>
38# include <stdio.h>
39# include <alloca.h>
40# include <sys/filio.h>
41# include <sys/ipc.h>
42# include <sys/lwp.h>
43# include <sys/machelf.h>     // for elf Sym structure used by dladdr1
44# include <sys/mman.h>
45# include <sys/processor.h>
46# include <sys/procset.h>
47# include <sys/pset.h>
48# include <sys/resource.h>
49# include <sys/shm.h>
50# include <sys/socket.h>
51# include <sys/stat.h>
52# include <sys/systeminfo.h>
53# include <sys/time.h>
54# include <sys/times.h>
55# include <sys/types.h>
56# include <sys/wait.h>
57# include <sys/utsname.h>
58# include <thread.h>
59# include <unistd.h>
60# include <sys/priocntl.h>
61# include <sys/rtpriocntl.h>
62# include <sys/tspriocntl.h>
63# include <sys/iapriocntl.h>
64# include <sys/loadavg.h>
65# include <string.h>
66
67# define _STRUCTURED_PROC 1  //  this gets us the new structured proc interfaces of 5.6 & later
68# include <sys/procfs.h>     //  see comment in <sys/procfs.h>
69
70#define MAX_PATH (2 * K)
71
72// for timer info max values which include all bits
73#define ALL_64_BITS CONST64(0xFFFFFFFFFFFFFFFF)
74
75#ifdef _GNU_SOURCE
76// See bug #6514594
77extern "C" int madvise(caddr_t, size_t, int);
78extern "C"  int memcntl(caddr_t addr, size_t len, int cmd, caddr_t  arg,
79     int attr, int mask);
80#endif //_GNU_SOURCE
81
82/*
83  MPSS Changes Start.
84  The JVM binary needs to be built and run on pre-Solaris 9
85  systems, but the constants needed by MPSS are only in Solaris 9
86  header files.  They are textually replicated here to allow
87  building on earlier systems.  Once building on Solaris 8 is
88  no longer a requirement, these #defines can be replaced by ordinary
89  system .h inclusion.
90
91  In earlier versions of the  JDK and Solaris, we used ISM for large pages.
92  But ISM requires shared memory to achieve this and thus has many caveats.
93  MPSS is a fully transparent and is a cleaner way to get large pages.
94  Although we still require keeping ISM for backward compatiblitiy as well as
95  giving the opportunity to use large pages on older systems it is
96  recommended that MPSS be used for Solaris 9 and above.
97
98*/
99
100#ifndef MC_HAT_ADVISE
101
102struct memcntl_mha {
103  uint_t          mha_cmd;        /* command(s) */
104  uint_t          mha_flags;
105  size_t          mha_pagesize;
106};
107#define MC_HAT_ADVISE   7       /* advise hat map size */
108#define MHA_MAPSIZE_VA  0x1     /* set preferred page size */
109#define MAP_ALIGN       0x200   /* addr specifies alignment */
110
111#endif
112// MPSS Changes End.
113
114
115// Here are some liblgrp types from sys/lgrp_user.h to be able to
116// compile on older systems without this header file.
117
118#ifndef MADV_ACCESS_LWP
119# define  MADV_ACCESS_LWP         7       /* next LWP to access heavily */
120#endif
121#ifndef MADV_ACCESS_MANY
122# define  MADV_ACCESS_MANY        8       /* many processes to access heavily */
123#endif
124
125#ifndef LGRP_RSRC_CPU
126# define LGRP_RSRC_CPU           0       /* CPU resources */
127#endif
128#ifndef LGRP_RSRC_MEM
129# define LGRP_RSRC_MEM           1       /* memory resources */
130#endif
131
132// Some more macros from sys/mman.h that are not present in Solaris 8.
133
134#ifndef MAX_MEMINFO_CNT
135/*
136 * info_req request type definitions for meminfo
137 * request types starting with MEMINFO_V are used for Virtual addresses
138 * and should not be mixed with MEMINFO_PLGRP which is targeted for Physical
139 * addresses
140 */
141# define MEMINFO_SHIFT           16
142# define MEMINFO_MASK            (0xFF << MEMINFO_SHIFT)
143# define MEMINFO_VPHYSICAL       (0x01 << MEMINFO_SHIFT) /* get physical addr */
144# define MEMINFO_VLGRP           (0x02 << MEMINFO_SHIFT) /* get lgroup */
145# define MEMINFO_VPAGESIZE       (0x03 << MEMINFO_SHIFT) /* size of phys page */
146# define MEMINFO_VREPLCNT        (0x04 << MEMINFO_SHIFT) /* no. of replica */
147# define MEMINFO_VREPL           (0x05 << MEMINFO_SHIFT) /* physical replica */
148# define MEMINFO_VREPL_LGRP      (0x06 << MEMINFO_SHIFT) /* lgrp of replica */
149# define MEMINFO_PLGRP           (0x07 << MEMINFO_SHIFT) /* lgroup for paddr */
150
151/* maximum number of addresses meminfo() can process at a time */
152# define MAX_MEMINFO_CNT 256
153
154/* maximum number of request types */
155# define MAX_MEMINFO_REQ 31
156#endif
157
158// see thr_setprio(3T) for the basis of these numbers
159#define MinimumPriority 0
160#define NormalPriority  64
161#define MaximumPriority 127
162
163// Values for ThreadPriorityPolicy == 1
164int prio_policy1[MaxPriority+1] = { -99999, 0, 16, 32, 48, 64,
165                                        80, 96, 112, 124, 127 };
166
167// System parameters used internally
168static clock_t clock_tics_per_sec = 100;
169
170// For diagnostics to print a message once. see run_periodic_checks
171static bool check_addr0_done = false;
172static sigset_t check_signal_done;
173static bool check_signals = true;
174
175address os::Solaris::handler_start;  // start pc of thr_sighndlrinfo
176address os::Solaris::handler_end;    // end pc of thr_sighndlrinfo
177
178address os::Solaris::_main_stack_base = NULL;  // 4352906 workaround
179
180
181// "default" initializers for missing libc APIs
182extern "C" {
183  static int lwp_mutex_init(mutex_t *mx, int scope, void *arg) { memset(mx, 0, sizeof(mutex_t)); return 0; }
184  static int lwp_mutex_destroy(mutex_t *mx)                 { return 0; }
185
186  static int lwp_cond_init(cond_t *cv, int scope, void *arg){ memset(cv, 0, sizeof(cond_t)); return 0; }
187  static int lwp_cond_destroy(cond_t *cv)                   { return 0; }
188}
189
190// "default" initializers for pthread-based synchronization
191extern "C" {
192  static int pthread_mutex_default_init(mutex_t *mx, int scope, void *arg) { memset(mx, 0, sizeof(mutex_t)); return 0; }
193  static int pthread_cond_default_init(cond_t *cv, int scope, void *arg){ memset(cv, 0, sizeof(cond_t)); return 0; }
194}
195
196// Thread Local Storage
197// This is common to all Solaris platforms so it is defined here,
198// in this common file.
199// The declarations are in the os_cpu threadLS*.hpp files.
200//
201// Static member initialization for TLS
202Thread* ThreadLocalStorage::_get_thread_cache[ThreadLocalStorage::_pd_cache_size] = {NULL};
203
204#ifndef PRODUCT
205#define _PCT(n,d)       ((100.0*(double)(n))/(double)(d))
206
207int ThreadLocalStorage::_tcacheHit = 0;
208int ThreadLocalStorage::_tcacheMiss = 0;
209
210void ThreadLocalStorage::print_statistics() {
211  int total = _tcacheMiss+_tcacheHit;
212  tty->print_cr("Thread cache hits %d misses %d total %d percent %f\n",
213                _tcacheHit, _tcacheMiss, total, _PCT(_tcacheHit, total));
214}
215#undef _PCT
216#endif // PRODUCT
217
218Thread* ThreadLocalStorage::get_thread_via_cache_slowly(uintptr_t raw_id,
219                                                        int index) {
220  Thread *thread = get_thread_slow();
221  if (thread != NULL) {
222    address sp = os::current_stack_pointer();
223    guarantee(thread->_stack_base == NULL ||
224              (sp <= thread->_stack_base &&
225                 sp >= thread->_stack_base - thread->_stack_size) ||
226               is_error_reported(),
227              "sp must be inside of selected thread stack");
228
229    thread->_self_raw_id = raw_id;  // mark for quick retrieval
230    _get_thread_cache[ index ] = thread;
231  }
232  return thread;
233}
234
235
236static const double all_zero[ sizeof(Thread) / sizeof(double) + 1 ] = {0};
237#define NO_CACHED_THREAD ((Thread*)all_zero)
238
239void ThreadLocalStorage::pd_set_thread(Thread* thread) {
240
241  // Store the new value before updating the cache to prevent a race
242  // between get_thread_via_cache_slowly() and this store operation.
243  os::thread_local_storage_at_put(ThreadLocalStorage::thread_index(), thread);
244
245  // Update thread cache with new thread if setting on thread create,
246  // or NO_CACHED_THREAD (zeroed) thread if resetting thread on exit.
247  uintptr_t raw = pd_raw_thread_id();
248  int ix = pd_cache_index(raw);
249  _get_thread_cache[ix] = thread == NULL ? NO_CACHED_THREAD : thread;
250}
251
252void ThreadLocalStorage::pd_init() {
253  for (int i = 0; i < _pd_cache_size; i++) {
254    _get_thread_cache[i] = NO_CACHED_THREAD;
255  }
256}
257
258// Invalidate all the caches (happens to be the same as pd_init).
259void ThreadLocalStorage::pd_invalidate_all() { pd_init(); }
260
261#undef NO_CACHED_THREAD
262
263// END Thread Local Storage
264
265static inline size_t adjust_stack_size(address base, size_t size) {
266  if ((ssize_t)size < 0) {
267    // 4759953: Compensate for ridiculous stack size.
268    size = max_intx;
269  }
270  if (size > (size_t)base) {
271    // 4812466: Make sure size doesn't allow the stack to wrap the address space.
272    size = (size_t)base;
273  }
274  return size;
275}
276
277static inline stack_t get_stack_info() {
278  stack_t st;
279  int retval = thr_stksegment(&st);
280  st.ss_size = adjust_stack_size((address)st.ss_sp, st.ss_size);
281  assert(retval == 0, "incorrect return value from thr_stksegment");
282  assert((address)&st < (address)st.ss_sp, "Invalid stack base returned");
283  assert((address)&st > (address)st.ss_sp-st.ss_size, "Invalid stack size returned");
284  return st;
285}
286
287address os::current_stack_base() {
288  int r = thr_main() ;
289  guarantee (r == 0 || r == 1, "CR6501650 or CR6493689") ;
290  bool is_primordial_thread = r;
291
292  // Workaround 4352906, avoid calls to thr_stksegment by
293  // thr_main after the first one (it looks like we trash
294  // some data, causing the value for ss_sp to be incorrect).
295  if (!is_primordial_thread || os::Solaris::_main_stack_base == NULL) {
296    stack_t st = get_stack_info();
297    if (is_primordial_thread) {
298      // cache initial value of stack base
299      os::Solaris::_main_stack_base = (address)st.ss_sp;
300    }
301    return (address)st.ss_sp;
302  } else {
303    guarantee(os::Solaris::_main_stack_base != NULL, "Attempt to use null cached stack base");
304    return os::Solaris::_main_stack_base;
305  }
306}
307
308size_t os::current_stack_size() {
309  size_t size;
310
311  int r = thr_main() ;
312  guarantee (r == 0 || r == 1, "CR6501650 or CR6493689") ;
313  if(!r) {
314    size = get_stack_info().ss_size;
315  } else {
316    struct rlimit limits;
317    getrlimit(RLIMIT_STACK, &limits);
318    size = adjust_stack_size(os::Solaris::_main_stack_base, (size_t)limits.rlim_cur);
319  }
320  // base may not be page aligned
321  address base = current_stack_base();
322  address bottom = (address)align_size_up((intptr_t)(base - size), os::vm_page_size());;
323  return (size_t)(base - bottom);
324}
325
326struct tm* os::localtime_pd(const time_t* clock, struct tm*  res) {
327  return localtime_r(clock, res);
328}
329
330// interruptible infrastructure
331
332// setup_interruptible saves the thread state before going into an
333// interruptible system call.
334// The saved state is used to restore the thread to
335// its former state whether or not an interrupt is received.
336// Used by classloader os::read
337// hpi calls skip this layer and stay in _thread_in_native
338
339void os::Solaris::setup_interruptible(JavaThread* thread) {
340
341  JavaThreadState thread_state = thread->thread_state();
342
343  assert(thread_state != _thread_blocked, "Coming from the wrong thread");
344  assert(thread_state != _thread_in_native, "Native threads skip setup_interruptible");
345  OSThread* osthread = thread->osthread();
346  osthread->set_saved_interrupt_thread_state(thread_state);
347  thread->frame_anchor()->make_walkable(thread);
348  ThreadStateTransition::transition(thread, thread_state, _thread_blocked);
349}
350
351// Version of setup_interruptible() for threads that are already in
352// _thread_blocked. Used by os_sleep().
353void os::Solaris::setup_interruptible_already_blocked(JavaThread* thread) {
354  thread->frame_anchor()->make_walkable(thread);
355}
356
357JavaThread* os::Solaris::setup_interruptible() {
358  JavaThread* thread = (JavaThread*)ThreadLocalStorage::thread();
359  setup_interruptible(thread);
360  return thread;
361}
362
363void os::Solaris::try_enable_extended_io() {
364  typedef int (*enable_extended_FILE_stdio_t)(int, int);
365
366  if (!UseExtendedFileIO) {
367    return;
368  }
369
370  enable_extended_FILE_stdio_t enabler =
371    (enable_extended_FILE_stdio_t) dlsym(RTLD_DEFAULT,
372                                         "enable_extended_FILE_stdio");
373  if (enabler) {
374    enabler(-1, -1);
375  }
376}
377
378
379#ifdef ASSERT
380
381JavaThread* os::Solaris::setup_interruptible_native() {
382  JavaThread* thread = (JavaThread*)ThreadLocalStorage::thread();
383  JavaThreadState thread_state = thread->thread_state();
384  assert(thread_state == _thread_in_native, "Assumed thread_in_native");
385  return thread;
386}
387
388void os::Solaris::cleanup_interruptible_native(JavaThread* thread) {
389  JavaThreadState thread_state = thread->thread_state();
390  assert(thread_state == _thread_in_native, "Assumed thread_in_native");
391}
392#endif
393
394// cleanup_interruptible reverses the effects of setup_interruptible
395// setup_interruptible_already_blocked() does not need any cleanup.
396
397void os::Solaris::cleanup_interruptible(JavaThread* thread) {
398  OSThread* osthread = thread->osthread();
399
400  ThreadStateTransition::transition(thread, _thread_blocked, osthread->saved_interrupt_thread_state());
401}
402
403// I/O interruption related counters called in _INTERRUPTIBLE
404
405void os::Solaris::bump_interrupted_before_count() {
406  RuntimeService::record_interrupted_before_count();
407}
408
409void os::Solaris::bump_interrupted_during_count() {
410  RuntimeService::record_interrupted_during_count();
411}
412
413static int _processors_online = 0;
414
415         jint os::Solaris::_os_thread_limit = 0;
416volatile jint os::Solaris::_os_thread_count = 0;
417
418julong os::available_memory() {
419  return Solaris::available_memory();
420}
421
422julong os::Solaris::available_memory() {
423  return (julong)sysconf(_SC_AVPHYS_PAGES) * os::vm_page_size();
424}
425
426julong os::Solaris::_physical_memory = 0;
427
428julong os::physical_memory() {
429   return Solaris::physical_memory();
430}
431
432julong os::allocatable_physical_memory(julong size) {
433#ifdef _LP64
434   return size;
435#else
436   julong result = MIN2(size, (julong)3835*M);
437   if (!is_allocatable(result)) {
438     // Memory allocations will be aligned but the alignment
439     // is not known at this point.  Alignments will
440     // be at most to LargePageSizeInBytes.  Protect
441     // allocations from alignments up to illegal
442     // values. If at this point 2G is illegal.
443     julong reasonable_size = (julong)2*G - 2 * LargePageSizeInBytes;
444     result =  MIN2(size, reasonable_size);
445   }
446   return result;
447#endif
448}
449
450static hrtime_t first_hrtime = 0;
451static const hrtime_t hrtime_hz = 1000*1000*1000;
452const int LOCK_BUSY = 1;
453const int LOCK_FREE = 0;
454const int LOCK_INVALID = -1;
455static volatile hrtime_t max_hrtime = 0;
456static volatile int max_hrtime_lock = LOCK_FREE;     // Update counter with LSB as lock-in-progress
457
458
459void os::Solaris::initialize_system_info() {
460  set_processor_count(sysconf(_SC_NPROCESSORS_CONF));
461  _processors_online = sysconf (_SC_NPROCESSORS_ONLN);
462  _physical_memory = (julong)sysconf(_SC_PHYS_PAGES) * (julong)sysconf(_SC_PAGESIZE);
463}
464
465int os::active_processor_count() {
466  int online_cpus = sysconf(_SC_NPROCESSORS_ONLN);
467  pid_t pid = getpid();
468  psetid_t pset = PS_NONE;
469  // Are we running in a processor set or is there any processor set around?
470  if (pset_bind(PS_QUERY, P_PID, pid, &pset) == 0) {
471    uint_t pset_cpus;
472    // Query the number of cpus available to us.
473    if (pset_info(pset, NULL, &pset_cpus, NULL) == 0) {
474      assert(pset_cpus > 0 && pset_cpus <= online_cpus, "sanity check");
475      _processors_online = pset_cpus;
476      return pset_cpus;
477    }
478  }
479  // Otherwise return number of online cpus
480  return online_cpus;
481}
482
483static bool find_processors_in_pset(psetid_t        pset,
484                                    processorid_t** id_array,
485                                    uint_t*         id_length) {
486  bool result = false;
487  // Find the number of processors in the processor set.
488  if (pset_info(pset, NULL, id_length, NULL) == 0) {
489    // Make up an array to hold their ids.
490    *id_array = NEW_C_HEAP_ARRAY(processorid_t, *id_length);
491    // Fill in the array with their processor ids.
492    if (pset_info(pset, NULL, id_length, *id_array) == 0) {
493      result = true;
494    }
495  }
496  return result;
497}
498
499// Callers of find_processors_online() must tolerate imprecise results --
500// the system configuration can change asynchronously because of DR
501// or explicit psradm operations.
502//
503// We also need to take care that the loop (below) terminates as the
504// number of processors online can change between the _SC_NPROCESSORS_ONLN
505// request and the loop that builds the list of processor ids.   Unfortunately
506// there's no reliable way to determine the maximum valid processor id,
507// so we use a manifest constant, MAX_PROCESSOR_ID, instead.  See p_online
508// man pages, which claim the processor id set is "sparse, but
509// not too sparse".  MAX_PROCESSOR_ID is used to ensure that we eventually
510// exit the loop.
511//
512// In the future we'll be able to use sysconf(_SC_CPUID_MAX), but that's
513// not available on S8.0.
514
515static bool find_processors_online(processorid_t** id_array,
516                                   uint*           id_length) {
517  const processorid_t MAX_PROCESSOR_ID = 100000 ;
518  // Find the number of processors online.
519  *id_length = sysconf(_SC_NPROCESSORS_ONLN);
520  // Make up an array to hold their ids.
521  *id_array = NEW_C_HEAP_ARRAY(processorid_t, *id_length);
522  // Processors need not be numbered consecutively.
523  long found = 0;
524  processorid_t next = 0;
525  while (found < *id_length && next < MAX_PROCESSOR_ID) {
526    processor_info_t info;
527    if (processor_info(next, &info) == 0) {
528      // NB, PI_NOINTR processors are effectively online ...
529      if (info.pi_state == P_ONLINE || info.pi_state == P_NOINTR) {
530        (*id_array)[found] = next;
531        found += 1;
532      }
533    }
534    next += 1;
535  }
536  if (found < *id_length) {
537      // The loop above didn't identify the expected number of processors.
538      // We could always retry the operation, calling sysconf(_SC_NPROCESSORS_ONLN)
539      // and re-running the loop, above, but there's no guarantee of progress
540      // if the system configuration is in flux.  Instead, we just return what
541      // we've got.  Note that in the worst case find_processors_online() could
542      // return an empty set.  (As a fall-back in the case of the empty set we
543      // could just return the ID of the current processor).
544      *id_length = found ;
545  }
546
547  return true;
548}
549
550static bool assign_distribution(processorid_t* id_array,
551                                uint           id_length,
552                                uint*          distribution,
553                                uint           distribution_length) {
554  // We assume we can assign processorid_t's to uint's.
555  assert(sizeof(processorid_t) == sizeof(uint),
556         "can't convert processorid_t to uint");
557  // Quick check to see if we won't succeed.
558  if (id_length < distribution_length) {
559    return false;
560  }
561  // Assign processor ids to the distribution.
562  // Try to shuffle processors to distribute work across boards,
563  // assuming 4 processors per board.
564  const uint processors_per_board = ProcessDistributionStride;
565  // Find the maximum processor id.
566  processorid_t max_id = 0;
567  for (uint m = 0; m < id_length; m += 1) {
568    max_id = MAX2(max_id, id_array[m]);
569  }
570  // The next id, to limit loops.
571  const processorid_t limit_id = max_id + 1;
572  // Make up markers for available processors.
573  bool* available_id = NEW_C_HEAP_ARRAY(bool, limit_id);
574  for (uint c = 0; c < limit_id; c += 1) {
575    available_id[c] = false;
576  }
577  for (uint a = 0; a < id_length; a += 1) {
578    available_id[id_array[a]] = true;
579  }
580  // Step by "boards", then by "slot", copying to "assigned".
581  // NEEDS_CLEANUP: The assignment of processors should be stateful,
582  //                remembering which processors have been assigned by
583  //                previous calls, etc., so as to distribute several
584  //                independent calls of this method.  What we'd like is
585  //                It would be nice to have an API that let us ask
586  //                how many processes are bound to a processor,
587  //                but we don't have that, either.
588  //                In the short term, "board" is static so that
589  //                subsequent distributions don't all start at board 0.
590  static uint board = 0;
591  uint assigned = 0;
592  // Until we've found enough processors ....
593  while (assigned < distribution_length) {
594    // ... find the next available processor in the board.
595    for (uint slot = 0; slot < processors_per_board; slot += 1) {
596      uint try_id = board * processors_per_board + slot;
597      if ((try_id < limit_id) && (available_id[try_id] == true)) {
598        distribution[assigned] = try_id;
599        available_id[try_id] = false;
600        assigned += 1;
601        break;
602      }
603    }
604    board += 1;
605    if (board * processors_per_board + 0 >= limit_id) {
606      board = 0;
607    }
608  }
609  if (available_id != NULL) {
610    FREE_C_HEAP_ARRAY(bool, available_id);
611  }
612  return true;
613}
614
615bool os::distribute_processes(uint length, uint* distribution) {
616  bool result = false;
617  // Find the processor id's of all the available CPUs.
618  processorid_t* id_array  = NULL;
619  uint           id_length = 0;
620  // There are some races between querying information and using it,
621  // since processor sets can change dynamically.
622  psetid_t pset = PS_NONE;
623  // Are we running in a processor set?
624  if ((pset_bind(PS_QUERY, P_PID, P_MYID, &pset) == 0) && pset != PS_NONE) {
625    result = find_processors_in_pset(pset, &id_array, &id_length);
626  } else {
627    result = find_processors_online(&id_array, &id_length);
628  }
629  if (result == true) {
630    if (id_length >= length) {
631      result = assign_distribution(id_array, id_length, distribution, length);
632    } else {
633      result = false;
634    }
635  }
636  if (id_array != NULL) {
637    FREE_C_HEAP_ARRAY(processorid_t, id_array);
638  }
639  return result;
640}
641
642bool os::bind_to_processor(uint processor_id) {
643  // We assume that a processorid_t can be stored in a uint.
644  assert(sizeof(uint) == sizeof(processorid_t),
645         "can't convert uint to processorid_t");
646  int bind_result =
647    processor_bind(P_LWPID,                       // bind LWP.
648                   P_MYID,                        // bind current LWP.
649                   (processorid_t) processor_id,  // id.
650                   NULL);                         // don't return old binding.
651  return (bind_result == 0);
652}
653
654bool os::getenv(const char* name, char* buffer, int len) {
655  char* val = ::getenv( name );
656  if ( val == NULL
657  ||   strlen(val) + 1  >  len ) {
658    if (len > 0)  buffer[0] = 0; // return a null string
659    return false;
660  }
661  strcpy( buffer, val );
662  return true;
663}
664
665
666// Return true if user is running as root.
667
668bool os::have_special_privileges() {
669  static bool init = false;
670  static bool privileges = false;
671  if (!init) {
672    privileges = (getuid() != geteuid()) || (getgid() != getegid());
673    init = true;
674  }
675  return privileges;
676}
677
678
679static char* get_property(char* name, char* buffer, int buffer_size) {
680  if (os::getenv(name, buffer, buffer_size)) {
681    return buffer;
682  }
683  static char empty[] = "";
684  return empty;
685}
686
687
688void os::init_system_properties_values() {
689  char arch[12];
690  sysinfo(SI_ARCHITECTURE, arch, sizeof(arch));
691
692  // The next steps are taken in the product version:
693  //
694  // Obtain the JAVA_HOME value from the location of libjvm[_g].so.
695  // This library should be located at:
696  // <JAVA_HOME>/jre/lib/<arch>/{client|server}/libjvm[_g].so.
697  //
698  // If "/jre/lib/" appears at the right place in the path, then we
699  // assume libjvm[_g].so is installed in a JDK and we use this path.
700  //
701  // Otherwise exit with message: "Could not create the Java virtual machine."
702  //
703  // The following extra steps are taken in the debugging version:
704  //
705  // If "/jre/lib/" does NOT appear at the right place in the path
706  // instead of exit check for $JAVA_HOME environment variable.
707  //
708  // If it is defined and we are able to locate $JAVA_HOME/jre/lib/<arch>,
709  // then we append a fake suffix "hotspot/libjvm[_g].so" to this path so
710  // it looks like libjvm[_g].so is installed there
711  // <JAVA_HOME>/jre/lib/<arch>/hotspot/libjvm[_g].so.
712  //
713  // Otherwise exit.
714  //
715  // Important note: if the location of libjvm.so changes this
716  // code needs to be changed accordingly.
717
718  // The next few definitions allow the code to be verbatim:
719#define malloc(n) (char*)NEW_C_HEAP_ARRAY(char, (n))
720#define free(p) FREE_C_HEAP_ARRAY(char, p)
721#define getenv(n) ::getenv(n)
722
723#define EXTENSIONS_DIR  "/lib/ext"
724#define ENDORSED_DIR    "/lib/endorsed"
725#define COMMON_DIR      "/usr/jdk/packages"
726
727  {
728    /* sysclasspath, java_home, dll_dir */
729    {
730        char *home_path;
731        char *dll_path;
732        char *pslash;
733        char buf[MAXPATHLEN];
734        os::jvm_path(buf, sizeof(buf));
735
736        // Found the full path to libjvm.so.
737        // Now cut the path to <java_home>/jre if we can.
738        *(strrchr(buf, '/')) = '\0';  /* get rid of /libjvm.so */
739        pslash = strrchr(buf, '/');
740        if (pslash != NULL)
741            *pslash = '\0';           /* get rid of /{client|server|hotspot} */
742        dll_path = malloc(strlen(buf) + 1);
743        if (dll_path == NULL)
744            return;
745        strcpy(dll_path, buf);
746        Arguments::set_dll_dir(dll_path);
747
748        if (pslash != NULL) {
749            pslash = strrchr(buf, '/');
750            if (pslash != NULL) {
751                *pslash = '\0';       /* get rid of /<arch> */
752                pslash = strrchr(buf, '/');
753                if (pslash != NULL)
754                    *pslash = '\0';   /* get rid of /lib */
755            }
756        }
757
758        home_path = malloc(strlen(buf) + 1);
759        if (home_path == NULL)
760            return;
761        strcpy(home_path, buf);
762        Arguments::set_java_home(home_path);
763
764        if (!set_boot_path('/', ':'))
765            return;
766    }
767
768    /*
769     * Where to look for native libraries
770     */
771    {
772      // Use dlinfo() to determine the correct java.library.path.
773      //
774      // If we're launched by the Java launcher, and the user
775      // does not set java.library.path explicitly on the commandline,
776      // the Java launcher sets LD_LIBRARY_PATH for us and unsets
777      // LD_LIBRARY_PATH_32 and LD_LIBRARY_PATH_64.  In this case
778      // dlinfo returns LD_LIBRARY_PATH + crle settings (including
779      // /usr/lib), which is exactly what we want.
780      //
781      // If the user does set java.library.path, it completely
782      // overwrites this setting, and always has.
783      //
784      // If we're not launched by the Java launcher, we may
785      // get here with any/all of the LD_LIBRARY_PATH[_32|64]
786      // settings.  Again, dlinfo does exactly what we want.
787
788      Dl_serinfo     _info, *info = &_info;
789      Dl_serpath     *path;
790      char*          library_path;
791      char           *common_path;
792      int            i;
793
794      // determine search path count and required buffer size
795      if (dlinfo(RTLD_SELF, RTLD_DI_SERINFOSIZE, (void *)info) == -1) {
796        vm_exit_during_initialization("dlinfo SERINFOSIZE request", dlerror());
797      }
798
799      // allocate new buffer and initialize
800      info = (Dl_serinfo*)malloc(_info.dls_size);
801      if (info == NULL) {
802        vm_exit_out_of_memory(_info.dls_size,
803                              "init_system_properties_values info");
804      }
805      info->dls_size = _info.dls_size;
806      info->dls_cnt = _info.dls_cnt;
807
808      // obtain search path information
809      if (dlinfo(RTLD_SELF, RTLD_DI_SERINFO, (void *)info) == -1) {
810        free(info);
811        vm_exit_during_initialization("dlinfo SERINFO request", dlerror());
812      }
813
814      path = &info->dls_serpath[0];
815
816      // Note: Due to a legacy implementation, most of the library path
817      // is set in the launcher.  This was to accomodate linking restrictions
818      // on legacy Solaris implementations (which are no longer supported).
819      // Eventually, all the library path setting will be done here.
820      //
821      // However, to prevent the proliferation of improperly built native
822      // libraries, the new path component /usr/jdk/packages is added here.
823
824      // Determine the actual CPU architecture.
825      char cpu_arch[12];
826      sysinfo(SI_ARCHITECTURE, cpu_arch, sizeof(cpu_arch));
827#ifdef _LP64
828      // If we are a 64-bit vm, perform the following translations:
829      //   sparc   -> sparcv9
830      //   i386    -> amd64
831      if (strcmp(cpu_arch, "sparc") == 0)
832        strcat(cpu_arch, "v9");
833      else if (strcmp(cpu_arch, "i386") == 0)
834        strcpy(cpu_arch, "amd64");
835#endif
836
837      // Construct the invariant part of ld_library_path. Note that the
838      // space for the colon and the trailing null are provided by the
839      // nulls included by the sizeof operator.
840      size_t bufsize = sizeof(COMMON_DIR) + sizeof("/lib/") + strlen(cpu_arch);
841      common_path = malloc(bufsize);
842      if (common_path == NULL) {
843        free(info);
844        vm_exit_out_of_memory(bufsize,
845                              "init_system_properties_values common_path");
846      }
847      sprintf(common_path, COMMON_DIR "/lib/%s", cpu_arch);
848
849      // struct size is more than sufficient for the path components obtained
850      // through the dlinfo() call, so only add additional space for the path
851      // components explicitly added here.
852      bufsize = info->dls_size + strlen(common_path);
853      library_path = malloc(bufsize);
854      if (library_path == NULL) {
855        free(info);
856        free(common_path);
857        vm_exit_out_of_memory(bufsize,
858                              "init_system_properties_values library_path");
859      }
860      library_path[0] = '\0';
861
862      // Construct the desired Java library path from the linker's library
863      // search path.
864      //
865      // For compatibility, it is optimal that we insert the additional path
866      // components specific to the Java VM after those components specified
867      // in LD_LIBRARY_PATH (if any) but before those added by the ld.so
868      // infrastructure.
869      if (info->dls_cnt == 0) { // Not sure this can happen, but allow for it
870        strcpy(library_path, common_path);
871      } else {
872        int inserted = 0;
873        for (i = 0; i < info->dls_cnt; i++, path++) {
874          uint_t flags = path->dls_flags & LA_SER_MASK;
875          if (((flags & LA_SER_LIBPATH) == 0) && !inserted) {
876            strcat(library_path, common_path);
877            strcat(library_path, os::path_separator());
878            inserted = 1;
879          }
880          strcat(library_path, path->dls_name);
881          strcat(library_path, os::path_separator());
882        }
883        // eliminate trailing path separator
884        library_path[strlen(library_path)-1] = '\0';
885      }
886
887      // happens before argument parsing - can't use a trace flag
888      // tty->print_raw("init_system_properties_values: native lib path: ");
889      // tty->print_raw_cr(library_path);
890
891      // callee copies into its own buffer
892      Arguments::set_library_path(library_path);
893
894      free(common_path);
895      free(library_path);
896      free(info);
897    }
898
899    /*
900     * Extensions directories.
901     *
902     * Note that the space for the colon and the trailing null are provided
903     * by the nulls included by the sizeof operator (so actually one byte more
904     * than necessary is allocated).
905     */
906    {
907        char *buf = (char *) malloc(strlen(Arguments::get_java_home()) +
908            sizeof(EXTENSIONS_DIR) + sizeof(COMMON_DIR) +
909            sizeof(EXTENSIONS_DIR));
910        sprintf(buf, "%s" EXTENSIONS_DIR ":" COMMON_DIR EXTENSIONS_DIR,
911            Arguments::get_java_home());
912        Arguments::set_ext_dirs(buf);
913    }
914
915    /* Endorsed standards default directory. */
916    {
917        char * buf = malloc(strlen(Arguments::get_java_home()) + sizeof(ENDORSED_DIR));
918        sprintf(buf, "%s" ENDORSED_DIR, Arguments::get_java_home());
919        Arguments::set_endorsed_dirs(buf);
920    }
921  }
922
923#undef malloc
924#undef free
925#undef getenv
926#undef EXTENSIONS_DIR
927#undef ENDORSED_DIR
928#undef COMMON_DIR
929
930}
931
932void os::breakpoint() {
933  BREAKPOINT;
934}
935
936bool os::obsolete_option(const JavaVMOption *option)
937{
938  if (!strncmp(option->optionString, "-Xt", 3)) {
939    return true;
940  } else if (!strncmp(option->optionString, "-Xtm", 4)) {
941    return true;
942  } else if (!strncmp(option->optionString, "-Xverifyheap", 12)) {
943    return true;
944  } else if (!strncmp(option->optionString, "-Xmaxjitcodesize", 16)) {
945    return true;
946  }
947  return false;
948}
949
950bool os::Solaris::valid_stack_address(Thread* thread, address sp) {
951  address  stackStart  = (address)thread->stack_base();
952  address  stackEnd    = (address)(stackStart - (address)thread->stack_size());
953  if (sp < stackStart && sp >= stackEnd ) return true;
954  return false;
955}
956
957extern "C" void breakpoint() {
958  // use debugger to set breakpoint here
959}
960
961// Returns an estimate of the current stack pointer. Result must be guaranteed to
962// point into the calling threads stack, and be no lower than the current stack
963// pointer.
964address os::current_stack_pointer() {
965  volatile int dummy;
966  address sp = (address)&dummy + 8;     // %%%% need to confirm if this is right
967  return sp;
968}
969
970static thread_t main_thread;
971
972// Thread start routine for all new Java threads
973extern "C" void* java_start(void* thread_addr) {
974  // Try to randomize the cache line index of hot stack frames.
975  // This helps when threads of the same stack traces evict each other's
976  // cache lines. The threads can be either from the same JVM instance, or
977  // from different JVM instances. The benefit is especially true for
978  // processors with hyperthreading technology.
979  static int counter = 0;
980  int pid = os::current_process_id();
981  alloca(((pid ^ counter++) & 7) * 128);
982
983  int prio;
984  Thread* thread = (Thread*)thread_addr;
985  OSThread* osthr = thread->osthread();
986
987  osthr->set_lwp_id( _lwp_self() );  // Store lwp in case we are bound
988  thread->_schedctl = (void *) schedctl_init () ;
989
990  if (UseNUMA) {
991    int lgrp_id = os::numa_get_group_id();
992    if (lgrp_id != -1) {
993      thread->set_lgrp_id(lgrp_id);
994    }
995  }
996
997  // If the creator called set priority before we started,
998  // we need to call set priority now that we have an lwp.
999  // Get the priority from libthread and set the priority
1000  // for the new Solaris lwp.
1001  if ( osthr->thread_id() != -1 ) {
1002    if ( UseThreadPriorities ) {
1003      thr_getprio(osthr->thread_id(), &prio);
1004      if (ThreadPriorityVerbose) {
1005        tty->print_cr("Starting Thread " INTPTR_FORMAT ", LWP is " INTPTR_FORMAT ", setting priority: %d\n",
1006                      osthr->thread_id(), osthr->lwp_id(), prio );
1007      }
1008      os::set_native_priority(thread, prio);
1009    }
1010  } else if (ThreadPriorityVerbose) {
1011    warning("Can't set priority in _start routine, thread id hasn't been set\n");
1012  }
1013
1014  assert(osthr->get_state() == RUNNABLE, "invalid os thread state");
1015
1016  // initialize signal mask for this thread
1017  os::Solaris::hotspot_sigmask(thread);
1018
1019  thread->run();
1020
1021  // One less thread is executing
1022  // When the VMThread gets here, the main thread may have already exited
1023  // which frees the CodeHeap containing the Atomic::dec code
1024  if (thread != VMThread::vm_thread() && VMThread::vm_thread() != NULL) {
1025    Atomic::dec(&os::Solaris::_os_thread_count);
1026  }
1027
1028  if (UseDetachedThreads) {
1029    thr_exit(NULL);
1030    ShouldNotReachHere();
1031  }
1032  return NULL;
1033}
1034
1035static OSThread* create_os_thread(Thread* thread, thread_t thread_id) {
1036  // Allocate the OSThread object
1037  OSThread* osthread = new OSThread(NULL, NULL);
1038  if (osthread == NULL) return NULL;
1039
1040  // Store info on the Solaris thread into the OSThread
1041  osthread->set_thread_id(thread_id);
1042  osthread->set_lwp_id(_lwp_self());
1043  thread->_schedctl = (void *) schedctl_init () ;
1044
1045  if (UseNUMA) {
1046    int lgrp_id = os::numa_get_group_id();
1047    if (lgrp_id != -1) {
1048      thread->set_lgrp_id(lgrp_id);
1049    }
1050  }
1051
1052  if ( ThreadPriorityVerbose ) {
1053    tty->print_cr("In create_os_thread, Thread " INTPTR_FORMAT ", LWP is " INTPTR_FORMAT "\n",
1054                  osthread->thread_id(), osthread->lwp_id() );
1055  }
1056
1057  // Initial thread state is INITIALIZED, not SUSPENDED
1058  osthread->set_state(INITIALIZED);
1059
1060  return osthread;
1061}
1062
1063void os::Solaris::hotspot_sigmask(Thread* thread) {
1064
1065  //Save caller's signal mask
1066  sigset_t sigmask;
1067  thr_sigsetmask(SIG_SETMASK, NULL, &sigmask);
1068  OSThread *osthread = thread->osthread();
1069  osthread->set_caller_sigmask(sigmask);
1070
1071  thr_sigsetmask(SIG_UNBLOCK, os::Solaris::unblocked_signals(), NULL);
1072  if (!ReduceSignalUsage) {
1073    if (thread->is_VM_thread()) {
1074      // Only the VM thread handles BREAK_SIGNAL ...
1075      thr_sigsetmask(SIG_UNBLOCK, vm_signals(), NULL);
1076    } else {
1077      // ... all other threads block BREAK_SIGNAL
1078      assert(!sigismember(vm_signals(), SIGINT), "SIGINT should not be blocked");
1079      thr_sigsetmask(SIG_BLOCK, vm_signals(), NULL);
1080    }
1081  }
1082}
1083
1084bool os::create_attached_thread(JavaThread* thread) {
1085#ifdef ASSERT
1086  thread->verify_not_published();
1087#endif
1088  OSThread* osthread = create_os_thread(thread, thr_self());
1089  if (osthread == NULL) {
1090     return false;
1091  }
1092
1093  // Initial thread state is RUNNABLE
1094  osthread->set_state(RUNNABLE);
1095  thread->set_osthread(osthread);
1096
1097  // initialize signal mask for this thread
1098  // and save the caller's signal mask
1099  os::Solaris::hotspot_sigmask(thread);
1100
1101  return true;
1102}
1103
1104bool os::create_main_thread(JavaThread* thread) {
1105#ifdef ASSERT
1106  thread->verify_not_published();
1107#endif
1108  if (_starting_thread == NULL) {
1109    _starting_thread = create_os_thread(thread, main_thread);
1110     if (_starting_thread == NULL) {
1111        return false;
1112     }
1113  }
1114
1115  // The primodial thread is runnable from the start
1116  _starting_thread->set_state(RUNNABLE);
1117
1118  thread->set_osthread(_starting_thread);
1119
1120  // initialize signal mask for this thread
1121  // and save the caller's signal mask
1122  os::Solaris::hotspot_sigmask(thread);
1123
1124  return true;
1125}
1126
1127// _T2_libthread is true if we believe we are running with the newer
1128// SunSoft lwp/libthread.so (2.8 patch, 2.9 default)
1129bool os::Solaris::_T2_libthread = false;
1130
1131bool os::create_thread(Thread* thread, ThreadType thr_type, size_t stack_size) {
1132  // Allocate the OSThread object
1133  OSThread* osthread = new OSThread(NULL, NULL);
1134  if (osthread == NULL) {
1135    return false;
1136  }
1137
1138  if ( ThreadPriorityVerbose ) {
1139    char *thrtyp;
1140    switch ( thr_type ) {
1141      case vm_thread:
1142        thrtyp = (char *)"vm";
1143        break;
1144      case cgc_thread:
1145        thrtyp = (char *)"cgc";
1146        break;
1147      case pgc_thread:
1148        thrtyp = (char *)"pgc";
1149        break;
1150      case java_thread:
1151        thrtyp = (char *)"java";
1152        break;
1153      case compiler_thread:
1154        thrtyp = (char *)"compiler";
1155        break;
1156      case watcher_thread:
1157        thrtyp = (char *)"watcher";
1158        break;
1159      default:
1160        thrtyp = (char *)"unknown";
1161        break;
1162    }
1163    tty->print_cr("In create_thread, creating a %s thread\n", thrtyp);
1164  }
1165
1166  // Calculate stack size if it's not specified by caller.
1167  if (stack_size == 0) {
1168    // The default stack size 1M (2M for LP64).
1169    stack_size = (BytesPerWord >> 2) * K * K;
1170
1171    switch (thr_type) {
1172    case os::java_thread:
1173      // Java threads use ThreadStackSize which default value can be changed with the flag -Xss
1174      if (JavaThread::stack_size_at_create() > 0) stack_size = JavaThread::stack_size_at_create();
1175      break;
1176    case os::compiler_thread:
1177      if (CompilerThreadStackSize > 0) {
1178        stack_size = (size_t)(CompilerThreadStackSize * K);
1179        break;
1180      } // else fall through:
1181        // use VMThreadStackSize if CompilerThreadStackSize is not defined
1182    case os::vm_thread:
1183    case os::pgc_thread:
1184    case os::cgc_thread:
1185    case os::watcher_thread:
1186      if (VMThreadStackSize > 0) stack_size = (size_t)(VMThreadStackSize * K);
1187      break;
1188    }
1189  }
1190  stack_size = MAX2(stack_size, os::Solaris::min_stack_allowed);
1191
1192  // Initial state is ALLOCATED but not INITIALIZED
1193  osthread->set_state(ALLOCATED);
1194
1195  if (os::Solaris::_os_thread_count > os::Solaris::_os_thread_limit) {
1196    // We got lots of threads. Check if we still have some address space left.
1197    // Need to be at least 5Mb of unreserved address space. We do check by
1198    // trying to reserve some.
1199    const size_t VirtualMemoryBangSize = 20*K*K;
1200    char* mem = os::reserve_memory(VirtualMemoryBangSize);
1201    if (mem == NULL) {
1202      delete osthread;
1203      return false;
1204    } else {
1205      // Release the memory again
1206      os::release_memory(mem, VirtualMemoryBangSize);
1207    }
1208  }
1209
1210  // Setup osthread because the child thread may need it.
1211  thread->set_osthread(osthread);
1212
1213  // Create the Solaris thread
1214  // explicit THR_BOUND for T2_libthread case in case
1215  // that assumption is not accurate, but our alternate signal stack
1216  // handling is based on it which must have bound threads
1217  thread_t tid = 0;
1218  long     flags = (UseDetachedThreads ? THR_DETACHED : 0) | THR_SUSPENDED
1219                   | ((UseBoundThreads || os::Solaris::T2_libthread() ||
1220                       (thr_type == vm_thread) ||
1221                       (thr_type == cgc_thread) ||
1222                       (thr_type == pgc_thread) ||
1223                       (thr_type == compiler_thread && BackgroundCompilation)) ?
1224                      THR_BOUND : 0);
1225  int      status;
1226
1227  // 4376845 -- libthread/kernel don't provide enough LWPs to utilize all CPUs.
1228  //
1229  // On multiprocessors systems, libthread sometimes under-provisions our
1230  // process with LWPs.  On a 30-way systems, for instance, we could have
1231  // 50 user-level threads in ready state and only 2 or 3 LWPs assigned
1232  // to our process.  This can result in under utilization of PEs.
1233  // I suspect the problem is related to libthread's LWP
1234  // pool management and to the kernel's SIGBLOCKING "last LWP parked"
1235  // upcall policy.
1236  //
1237  // The following code is palliative -- it attempts to ensure that our
1238  // process has sufficient LWPs to take advantage of multiple PEs.
1239  // Proper long-term cures include using user-level threads bound to LWPs
1240  // (THR_BOUND) or using LWP-based synchronization.  Note that there is a
1241  // slight timing window with respect to sampling _os_thread_count, but
1242  // the race is benign.  Also, we should periodically recompute
1243  // _processors_online as the min of SC_NPROCESSORS_ONLN and the
1244  // the number of PEs in our partition.  You might be tempted to use
1245  // THR_NEW_LWP here, but I'd recommend against it as that could
1246  // result in undesirable growth of the libthread's LWP pool.
1247  // The fix below isn't sufficient; for instance, it doesn't take into count
1248  // LWPs parked on IO.  It does, however, help certain CPU-bound benchmarks.
1249  //
1250  // Some pathologies this scheme doesn't handle:
1251  // *  Threads can block, releasing the LWPs.  The LWPs can age out.
1252  //    When a large number of threads become ready again there aren't
1253  //    enough LWPs available to service them.  This can occur when the
1254  //    number of ready threads oscillates.
1255  // *  LWPs/Threads park on IO, thus taking the LWP out of circulation.
1256  //
1257  // Finally, we should call thr_setconcurrency() periodically to refresh
1258  // the LWP pool and thwart the LWP age-out mechanism.
1259  // The "+3" term provides a little slop -- we want to slightly overprovision.
1260
1261  if (AdjustConcurrency && os::Solaris::_os_thread_count < (_processors_online+3)) {
1262    if (!(flags & THR_BOUND)) {
1263      thr_setconcurrency (os::Solaris::_os_thread_count);       // avoid starvation
1264    }
1265  }
1266  // Although this doesn't hurt, we should warn of undefined behavior
1267  // when using unbound T1 threads with schedctl().  This should never
1268  // happen, as the compiler and VM threads are always created bound
1269  DEBUG_ONLY(
1270      if ((VMThreadHintNoPreempt || CompilerThreadHintNoPreempt) &&
1271          (!os::Solaris::T2_libthread() && (!(flags & THR_BOUND))) &&
1272          ((thr_type == vm_thread) || (thr_type == cgc_thread) ||
1273           (thr_type == pgc_thread) || (thr_type == compiler_thread && BackgroundCompilation))) {
1274         warning("schedctl behavior undefined when Compiler/VM/GC Threads are Unbound");
1275      }
1276  );
1277
1278
1279  // Mark that we don't have an lwp or thread id yet.
1280  // In case we attempt to set the priority before the thread starts.
1281  osthread->set_lwp_id(-1);
1282  osthread->set_thread_id(-1);
1283
1284  status = thr_create(NULL, stack_size, java_start, thread, flags, &tid);
1285  if (status != 0) {
1286    if (PrintMiscellaneous && (Verbose || WizardMode)) {
1287      perror("os::create_thread");
1288    }
1289    thread->set_osthread(NULL);
1290    // Need to clean up stuff we've allocated so far
1291    delete osthread;
1292    return false;
1293  }
1294
1295  Atomic::inc(&os::Solaris::_os_thread_count);
1296
1297  // Store info on the Solaris thread into the OSThread
1298  osthread->set_thread_id(tid);
1299
1300  // Remember that we created this thread so we can set priority on it
1301  osthread->set_vm_created();
1302
1303  // Set the default thread priority otherwise use NormalPriority
1304
1305  if ( UseThreadPriorities ) {
1306     thr_setprio(tid, (DefaultThreadPriority == -1) ?
1307                        java_to_os_priority[NormPriority] :
1308                        DefaultThreadPriority);
1309  }
1310
1311  // Initial thread state is INITIALIZED, not SUSPENDED
1312  osthread->set_state(INITIALIZED);
1313
1314  // The thread is returned suspended (in state INITIALIZED), and is started higher up in the call chain
1315  return true;
1316}
1317
1318/* defined for >= Solaris 10. This allows builds on earlier versions
1319 *  of Solaris to take advantage of the newly reserved Solaris JVM signals
1320 *  With SIGJVM1, SIGJVM2, INTERRUPT_SIGNAL is SIGJVM1, ASYNC_SIGNAL is SIGJVM2
1321 *  and -XX:+UseAltSigs does nothing since these should have no conflict
1322 */
1323#if !defined(SIGJVM1)
1324#define SIGJVM1 39
1325#define SIGJVM2 40
1326#endif
1327
1328debug_only(static bool signal_sets_initialized = false);
1329static sigset_t unblocked_sigs, vm_sigs, allowdebug_blocked_sigs;
1330int os::Solaris::_SIGinterrupt = INTERRUPT_SIGNAL;
1331int os::Solaris::_SIGasync = ASYNC_SIGNAL;
1332
1333bool os::Solaris::is_sig_ignored(int sig) {
1334      struct sigaction oact;
1335      sigaction(sig, (struct sigaction*)NULL, &oact);
1336      void* ohlr = oact.sa_sigaction ? CAST_FROM_FN_PTR(void*,  oact.sa_sigaction)
1337                                     : CAST_FROM_FN_PTR(void*,  oact.sa_handler);
1338      if (ohlr == CAST_FROM_FN_PTR(void*, SIG_IGN))
1339           return true;
1340      else
1341           return false;
1342}
1343
1344// Note: SIGRTMIN is a macro that calls sysconf() so it will
1345// dynamically detect SIGRTMIN value for the system at runtime, not buildtime
1346static bool isJVM1available() {
1347  return SIGJVM1 < SIGRTMIN;
1348}
1349
1350void os::Solaris::signal_sets_init() {
1351  // Should also have an assertion stating we are still single-threaded.
1352  assert(!signal_sets_initialized, "Already initialized");
1353  // Fill in signals that are necessarily unblocked for all threads in
1354  // the VM. Currently, we unblock the following signals:
1355  // SHUTDOWN{1,2,3}_SIGNAL: for shutdown hooks support (unless over-ridden
1356  //                         by -Xrs (=ReduceSignalUsage));
1357  // BREAK_SIGNAL which is unblocked only by the VM thread and blocked by all
1358  // other threads. The "ReduceSignalUsage" boolean tells us not to alter
1359  // the dispositions or masks wrt these signals.
1360  // Programs embedding the VM that want to use the above signals for their
1361  // own purposes must, at this time, use the "-Xrs" option to prevent
1362  // interference with shutdown hooks and BREAK_SIGNAL thread dumping.
1363  // (See bug 4345157, and other related bugs).
1364  // In reality, though, unblocking these signals is really a nop, since
1365  // these signals are not blocked by default.
1366  sigemptyset(&unblocked_sigs);
1367  sigemptyset(&allowdebug_blocked_sigs);
1368  sigaddset(&unblocked_sigs, SIGILL);
1369  sigaddset(&unblocked_sigs, SIGSEGV);
1370  sigaddset(&unblocked_sigs, SIGBUS);
1371  sigaddset(&unblocked_sigs, SIGFPE);
1372
1373  if (isJVM1available) {
1374    os::Solaris::set_SIGinterrupt(SIGJVM1);
1375    os::Solaris::set_SIGasync(SIGJVM2);
1376  } else if (UseAltSigs) {
1377    os::Solaris::set_SIGinterrupt(ALT_INTERRUPT_SIGNAL);
1378    os::Solaris::set_SIGasync(ALT_ASYNC_SIGNAL);
1379  } else {
1380    os::Solaris::set_SIGinterrupt(INTERRUPT_SIGNAL);
1381    os::Solaris::set_SIGasync(ASYNC_SIGNAL);
1382  }
1383
1384  sigaddset(&unblocked_sigs, os::Solaris::SIGinterrupt());
1385  sigaddset(&unblocked_sigs, os::Solaris::SIGasync());
1386
1387  if (!ReduceSignalUsage) {
1388   if (!os::Solaris::is_sig_ignored(SHUTDOWN1_SIGNAL)) {
1389      sigaddset(&unblocked_sigs, SHUTDOWN1_SIGNAL);
1390      sigaddset(&allowdebug_blocked_sigs, SHUTDOWN1_SIGNAL);
1391   }
1392   if (!os::Solaris::is_sig_ignored(SHUTDOWN2_SIGNAL)) {
1393      sigaddset(&unblocked_sigs, SHUTDOWN2_SIGNAL);
1394      sigaddset(&allowdebug_blocked_sigs, SHUTDOWN2_SIGNAL);
1395   }
1396   if (!os::Solaris::is_sig_ignored(SHUTDOWN3_SIGNAL)) {
1397      sigaddset(&unblocked_sigs, SHUTDOWN3_SIGNAL);
1398      sigaddset(&allowdebug_blocked_sigs, SHUTDOWN3_SIGNAL);
1399   }
1400  }
1401  // Fill in signals that are blocked by all but the VM thread.
1402  sigemptyset(&vm_sigs);
1403  if (!ReduceSignalUsage)
1404    sigaddset(&vm_sigs, BREAK_SIGNAL);
1405  debug_only(signal_sets_initialized = true);
1406
1407  // For diagnostics only used in run_periodic_checks
1408  sigemptyset(&check_signal_done);
1409}
1410
1411// These are signals that are unblocked while a thread is running Java.
1412// (For some reason, they get blocked by default.)
1413sigset_t* os::Solaris::unblocked_signals() {
1414  assert(signal_sets_initialized, "Not initialized");
1415  return &unblocked_sigs;
1416}
1417
1418// These are the signals that are blocked while a (non-VM) thread is
1419// running Java. Only the VM thread handles these signals.
1420sigset_t* os::Solaris::vm_signals() {
1421  assert(signal_sets_initialized, "Not initialized");
1422  return &vm_sigs;
1423}
1424
1425// These are signals that are blocked during cond_wait to allow debugger in
1426sigset_t* os::Solaris::allowdebug_blocked_signals() {
1427  assert(signal_sets_initialized, "Not initialized");
1428  return &allowdebug_blocked_sigs;
1429}
1430
1431// First crack at OS-specific initialization, from inside the new thread.
1432void os::initialize_thread() {
1433  int r = thr_main() ;
1434  guarantee (r == 0 || r == 1, "CR6501650 or CR6493689") ;
1435  if (r) {
1436    JavaThread* jt = (JavaThread *)Thread::current();
1437    assert(jt != NULL,"Sanity check");
1438    size_t stack_size;
1439    address base = jt->stack_base();
1440    if (Arguments::created_by_java_launcher()) {
1441      // Use 2MB to allow for Solaris 7 64 bit mode.
1442      stack_size = JavaThread::stack_size_at_create() == 0
1443        ? 2048*K : JavaThread::stack_size_at_create();
1444
1445      // There are rare cases when we may have already used more than
1446      // the basic stack size allotment before this method is invoked.
1447      // Attempt to allow for a normally sized java_stack.
1448      size_t current_stack_offset = (size_t)(base - (address)&stack_size);
1449      stack_size += ReservedSpace::page_align_size_down(current_stack_offset);
1450    } else {
1451      // 6269555: If we were not created by a Java launcher, i.e. if we are
1452      // running embedded in a native application, treat the primordial thread
1453      // as much like a native attached thread as possible.  This means using
1454      // the current stack size from thr_stksegment(), unless it is too large
1455      // to reliably setup guard pages.  A reasonable max size is 8MB.
1456      size_t current_size = current_stack_size();
1457      // This should never happen, but just in case....
1458      if (current_size == 0) current_size = 2 * K * K;
1459      stack_size = current_size > (8 * K * K) ? (8 * K * K) : current_size;
1460    }
1461    address bottom = (address)align_size_up((intptr_t)(base - stack_size), os::vm_page_size());;
1462    stack_size = (size_t)(base - bottom);
1463
1464    assert(stack_size > 0, "Stack size calculation problem");
1465
1466    if (stack_size > jt->stack_size()) {
1467      NOT_PRODUCT(
1468        struct rlimit limits;
1469        getrlimit(RLIMIT_STACK, &limits);
1470        size_t size = adjust_stack_size(base, (size_t)limits.rlim_cur);
1471        assert(size >= jt->stack_size(), "Stack size problem in main thread");
1472      )
1473      tty->print_cr(
1474        "Stack size of %d Kb exceeds current limit of %d Kb.\n"
1475        "(Stack sizes are rounded up to a multiple of the system page size.)\n"
1476        "See limit(1) to increase the stack size limit.",
1477        stack_size / K, jt->stack_size() / K);
1478      vm_exit(1);
1479    }
1480    assert(jt->stack_size() >= stack_size,
1481          "Attempt to map more stack than was allocated");
1482    jt->set_stack_size(stack_size);
1483  }
1484
1485   // 5/22/01: Right now alternate signal stacks do not handle
1486   // throwing stack overflow exceptions, see bug 4463178
1487   // Until a fix is found for this, T2 will NOT imply alternate signal
1488   // stacks.
1489   // If using T2 libthread threads, install an alternate signal stack.
1490   // Because alternate stacks associate with LWPs on Solaris,
1491   // see sigaltstack(2), if using UNBOUND threads, or if UseBoundThreads
1492   // we prefer to explicitly stack bang.
1493   // If not using T2 libthread, but using UseBoundThreads any threads
1494   // (primordial thread, jni_attachCurrentThread) we do not create,
1495   // probably are not bound, therefore they can not have an alternate
1496   // signal stack. Since our stack banging code is generated and
1497   // is shared across threads, all threads must be bound to allow
1498   // using alternate signal stacks.  The alternative is to interpose
1499   // on _lwp_create to associate an alt sig stack with each LWP,
1500   // and this could be a problem when the JVM is embedded.
1501   // We would prefer to use alternate signal stacks with T2
1502   // Since there is currently no accurate way to detect T2
1503   // we do not. Assuming T2 when running T1 causes sig 11s or assertions
1504   // on installing alternate signal stacks
1505
1506
1507   // 05/09/03: removed alternate signal stack support for Solaris
1508   // The alternate signal stack mechanism is no longer needed to
1509   // handle stack overflow. This is now handled by allocating
1510   // guard pages (red zone) and stackbanging.
1511   // Initially the alternate signal stack mechanism was removed because
1512   // it did not work with T1 llibthread. Alternate
1513   // signal stacks MUST have all threads bound to lwps. Applications
1514   // can create their own threads and attach them without their being
1515   // bound under T1. This is frequently the case for the primordial thread.
1516   // If we were ever to reenable this mechanism we would need to
1517   // use the dynamic check for T2 libthread.
1518
1519  os::Solaris::init_thread_fpu_state();
1520}
1521
1522
1523
1524// Free Solaris resources related to the OSThread
1525void os::free_thread(OSThread* osthread) {
1526  assert(osthread != NULL, "os::free_thread but osthread not set");
1527
1528
1529  // We are told to free resources of the argument thread,
1530  // but we can only really operate on the current thread.
1531  // The main thread must take the VMThread down synchronously
1532  // before the main thread exits and frees up CodeHeap
1533  guarantee((Thread::current()->osthread() == osthread
1534     || (osthread == VMThread::vm_thread()->osthread())), "os::free_thread but not current thread");
1535  if (Thread::current()->osthread() == osthread) {
1536    // Restore caller's signal mask
1537    sigset_t sigmask = osthread->caller_sigmask();
1538    thr_sigsetmask(SIG_SETMASK, &sigmask, NULL);
1539  }
1540  delete osthread;
1541}
1542
1543void os::pd_start_thread(Thread* thread) {
1544  int status = thr_continue(thread->osthread()->thread_id());
1545  assert_status(status == 0, status, "thr_continue failed");
1546}
1547
1548
1549intx os::current_thread_id() {
1550  return (intx)thr_self();
1551}
1552
1553static pid_t _initial_pid = 0;
1554
1555int os::current_process_id() {
1556  return (int)(_initial_pid ? _initial_pid : getpid());
1557}
1558
1559int os::allocate_thread_local_storage() {
1560  // %%%       in Win32 this allocates a memory segment pointed to by a
1561  //           register.  Dan Stein can implement a similar feature in
1562  //           Solaris.  Alternatively, the VM can do the same thing
1563  //           explicitly: malloc some storage and keep the pointer in a
1564  //           register (which is part of the thread's context) (or keep it
1565  //           in TLS).
1566  // %%%       In current versions of Solaris, thr_self and TSD can
1567  //           be accessed via short sequences of displaced indirections.
1568  //           The value of thr_self is available as %g7(36).
1569  //           The value of thr_getspecific(k) is stored in %g7(12)(4)(k*4-4),
1570  //           assuming that the current thread already has a value bound to k.
1571  //           It may be worth experimenting with such access patterns,
1572  //           and later having the parameters formally exported from a Solaris
1573  //           interface.  I think, however, that it will be faster to
1574  //           maintain the invariant that %g2 always contains the
1575  //           JavaThread in Java code, and have stubs simply
1576  //           treat %g2 as a caller-save register, preserving it in a %lN.
1577  thread_key_t tk;
1578  if (thr_keycreate( &tk, NULL ) )
1579    fatal1("os::allocate_thread_local_storage: thr_keycreate failed (%s)", strerror(errno));
1580  return int(tk);
1581}
1582
1583void os::free_thread_local_storage(int index) {
1584  // %%% don't think we need anything here
1585  // if ( pthread_key_delete((pthread_key_t) tk) )
1586  //   fatal("os::free_thread_local_storage: pthread_key_delete failed");
1587}
1588
1589#define SMALLINT 32   // libthread allocate for tsd_common is a version specific
1590                      // small number - point is NO swap space available
1591void os::thread_local_storage_at_put(int index, void* value) {
1592  // %%% this is used only in threadLocalStorage.cpp
1593  if (thr_setspecific((thread_key_t)index, value)) {
1594    if (errno == ENOMEM) {
1595       vm_exit_out_of_memory(SMALLINT, "thr_setspecific: out of swap space");
1596    } else {
1597      fatal1("os::thread_local_storage_at_put: thr_setspecific failed (%s)", strerror(errno));
1598    }
1599  } else {
1600      ThreadLocalStorage::set_thread_in_slot ((Thread *) value) ;
1601  }
1602}
1603
1604// This function could be called before TLS is initialized, for example, when
1605// VM receives an async signal or when VM causes a fatal error during
1606// initialization. Return NULL if thr_getspecific() fails.
1607void* os::thread_local_storage_at(int index) {
1608  // %%% this is used only in threadLocalStorage.cpp
1609  void* r = NULL;
1610  return thr_getspecific((thread_key_t)index, &r) != 0 ? NULL : r;
1611}
1612
1613
1614const int NANOSECS_PER_MILLISECS = 1000000;
1615// gethrtime can move backwards if read from one cpu and then a different cpu
1616// getTimeNanos is guaranteed to not move backward on Solaris
1617// local spinloop created as faster for a CAS on an int than
1618// a CAS on a 64bit jlong. Also Atomic::cmpxchg for jlong is not
1619// supported on sparc v8 or pre supports_cx8 intel boxes.
1620// oldgetTimeNanos for systems which do not support CAS on 64bit jlong
1621// i.e. sparc v8 and pre supports_cx8 (i486) intel boxes
1622inline hrtime_t oldgetTimeNanos() {
1623  int gotlock = LOCK_INVALID;
1624  hrtime_t newtime = gethrtime();
1625
1626  for (;;) {
1627// grab lock for max_hrtime
1628    int curlock = max_hrtime_lock;
1629    if (curlock & LOCK_BUSY)  continue;
1630    if (gotlock = Atomic::cmpxchg(LOCK_BUSY, &max_hrtime_lock, LOCK_FREE) != LOCK_FREE) continue;
1631    if (newtime > max_hrtime) {
1632      max_hrtime = newtime;
1633    } else {
1634      newtime = max_hrtime;
1635    }
1636    // release lock
1637    max_hrtime_lock = LOCK_FREE;
1638    return newtime;
1639  }
1640}
1641// gethrtime can move backwards if read from one cpu and then a different cpu
1642// getTimeNanos is guaranteed to not move backward on Solaris
1643inline hrtime_t getTimeNanos() {
1644  if (VM_Version::supports_cx8()) {
1645    const hrtime_t now = gethrtime();
1646    // Use atomic long load since 32-bit x86 uses 2 registers to keep long.
1647    const hrtime_t prev = Atomic::load((volatile jlong*)&max_hrtime);
1648    if (now <= prev)  return prev;   // same or retrograde time;
1649    const hrtime_t obsv = Atomic::cmpxchg(now, (volatile jlong*)&max_hrtime, prev);
1650    assert(obsv >= prev, "invariant");   // Monotonicity
1651    // If the CAS succeeded then we're done and return "now".
1652    // If the CAS failed and the observed value "obs" is >= now then
1653    // we should return "obs".  If the CAS failed and now > obs > prv then
1654    // some other thread raced this thread and installed a new value, in which case
1655    // we could either (a) retry the entire operation, (b) retry trying to install now
1656    // or (c) just return obs.  We use (c).   No loop is required although in some cases
1657    // we might discard a higher "now" value in deference to a slightly lower but freshly
1658    // installed obs value.   That's entirely benign -- it admits no new orderings compared
1659    // to (a) or (b) -- and greatly reduces coherence traffic.
1660    // We might also condition (c) on the magnitude of the delta between obs and now.
1661    // Avoiding excessive CAS operations to hot RW locations is critical.
1662    // See http://blogs.sun.com/dave/entry/cas_and_cache_trivia_invalidate
1663    return (prev == obsv) ? now : obsv ;
1664  } else {
1665    return oldgetTimeNanos();
1666  }
1667}
1668
1669// Time since start-up in seconds to a fine granularity.
1670// Used by VMSelfDestructTimer and the MemProfiler.
1671double os::elapsedTime() {
1672  return (double)(getTimeNanos() - first_hrtime) / (double)hrtime_hz;
1673}
1674
1675jlong os::elapsed_counter() {
1676  return (jlong)(getTimeNanos() - first_hrtime);
1677}
1678
1679jlong os::elapsed_frequency() {
1680   return hrtime_hz;
1681}
1682
1683// Return the real, user, and system times in seconds from an
1684// arbitrary fixed point in the past.
1685bool os::getTimesSecs(double* process_real_time,
1686                  double* process_user_time,
1687                  double* process_system_time) {
1688  struct tms ticks;
1689  clock_t real_ticks = times(&ticks);
1690
1691  if (real_ticks == (clock_t) (-1)) {
1692    return false;
1693  } else {
1694    double ticks_per_second = (double) clock_tics_per_sec;
1695    *process_user_time = ((double) ticks.tms_utime) / ticks_per_second;
1696    *process_system_time = ((double) ticks.tms_stime) / ticks_per_second;
1697    // For consistency return the real time from getTimeNanos()
1698    // converted to seconds.
1699    *process_real_time = ((double) getTimeNanos()) / ((double) NANOUNITS);
1700
1701    return true;
1702  }
1703}
1704
1705bool os::supports_vtime() { return true; }
1706
1707bool os::enable_vtime() {
1708  int fd = open("/proc/self/ctl", O_WRONLY);
1709  if (fd == -1)
1710    return false;
1711
1712  long cmd[] = { PCSET, PR_MSACCT };
1713  int res = write(fd, cmd, sizeof(long) * 2);
1714  close(fd);
1715  if (res != sizeof(long) * 2)
1716    return false;
1717
1718  return true;
1719}
1720
1721bool os::vtime_enabled() {
1722  int fd = open("/proc/self/status", O_RDONLY);
1723  if (fd == -1)
1724    return false;
1725
1726  pstatus_t status;
1727  int res = read(fd, (void*) &status, sizeof(pstatus_t));
1728  close(fd);
1729  if (res != sizeof(pstatus_t))
1730    return false;
1731
1732  return status.pr_flags & PR_MSACCT;
1733}
1734
1735double os::elapsedVTime() {
1736  return (double)gethrvtime() / (double)hrtime_hz;
1737}
1738
1739// Used internally for comparisons only
1740// getTimeMillis guaranteed to not move backwards on Solaris
1741jlong getTimeMillis() {
1742  jlong nanotime = getTimeNanos();
1743  return (jlong)(nanotime / NANOSECS_PER_MILLISECS);
1744}
1745
1746// Must return millis since Jan 1 1970 for JVM_CurrentTimeMillis
1747jlong os::javaTimeMillis() {
1748  timeval t;
1749  if (gettimeofday( &t, NULL) == -1)
1750    fatal1("os::javaTimeMillis: gettimeofday (%s)", strerror(errno));
1751  return jlong(t.tv_sec) * 1000  +  jlong(t.tv_usec) / 1000;
1752}
1753
1754jlong os::javaTimeNanos() {
1755  return (jlong)getTimeNanos();
1756}
1757
1758void os::javaTimeNanos_info(jvmtiTimerInfo *info_ptr) {
1759  info_ptr->max_value = ALL_64_BITS;      // gethrtime() uses all 64 bits
1760  info_ptr->may_skip_backward = false;    // not subject to resetting or drifting
1761  info_ptr->may_skip_forward = false;     // not subject to resetting or drifting
1762  info_ptr->kind = JVMTI_TIMER_ELAPSED;   // elapsed not CPU time
1763}
1764
1765char * os::local_time_string(char *buf, size_t buflen) {
1766  struct tm t;
1767  time_t long_time;
1768  time(&long_time);
1769  localtime_r(&long_time, &t);
1770  jio_snprintf(buf, buflen, "%d-%02d-%02d %02d:%02d:%02d",
1771               t.tm_year + 1900, t.tm_mon + 1, t.tm_mday,
1772               t.tm_hour, t.tm_min, t.tm_sec);
1773  return buf;
1774}
1775
1776// Note: os::shutdown() might be called very early during initialization, or
1777// called from signal handler. Before adding something to os::shutdown(), make
1778// sure it is async-safe and can handle partially initialized VM.
1779void os::shutdown() {
1780
1781  // allow PerfMemory to attempt cleanup of any persistent resources
1782  perfMemory_exit();
1783
1784  // needs to remove object in file system
1785  AttachListener::abort();
1786
1787  // flush buffered output, finish log files
1788  ostream_abort();
1789
1790  // Check for abort hook
1791  abort_hook_t abort_hook = Arguments::abort_hook();
1792  if (abort_hook != NULL) {
1793    abort_hook();
1794  }
1795}
1796
1797// Note: os::abort() might be called very early during initialization, or
1798// called from signal handler. Before adding something to os::abort(), make
1799// sure it is async-safe and can handle partially initialized VM.
1800void os::abort(bool dump_core) {
1801  os::shutdown();
1802  if (dump_core) {
1803#ifndef PRODUCT
1804    fdStream out(defaultStream::output_fd());
1805    out.print_raw("Current thread is ");
1806    char buf[16];
1807    jio_snprintf(buf, sizeof(buf), UINTX_FORMAT, os::current_thread_id());
1808    out.print_raw_cr(buf);
1809    out.print_raw_cr("Dumping core ...");
1810#endif
1811    ::abort(); // dump core (for debugging)
1812  }
1813
1814  ::exit(1);
1815}
1816
1817// Die immediately, no exit hook, no abort hook, no cleanup.
1818void os::die() {
1819  _exit(-1);
1820}
1821
1822// unused
1823void os::set_error_file(const char *logfile) {}
1824
1825// DLL functions
1826
1827const char* os::dll_file_extension() { return ".so"; }
1828
1829const char* os::get_temp_directory() { return "/tmp/"; }
1830
1831static bool file_exists(const char* filename) {
1832  struct stat statbuf;
1833  if (filename == NULL || strlen(filename) == 0) {
1834    return false;
1835  }
1836  return os::stat(filename, &statbuf) == 0;
1837}
1838
1839void os::dll_build_name(char* buffer, size_t buflen,
1840                        const char* pname, const char* fname) {
1841  // Copied from libhpi
1842  const size_t pnamelen = pname ? strlen(pname) : 0;
1843
1844  // Quietly truncate on buffer overflow.  Should be an error.
1845  if (pnamelen + strlen(fname) + 10 > (size_t) buflen) {
1846      *buffer = '\0';
1847      return;
1848  }
1849
1850  if (pnamelen == 0) {
1851    snprintf(buffer, buflen, "lib%s.so", fname);
1852  } else if (strchr(pname, *os::path_separator()) != NULL) {
1853    int n;
1854    char** pelements = split_path(pname, &n);
1855    for (int i = 0 ; i < n ; i++) {
1856      // really shouldn't be NULL but what the heck, check can't hurt
1857      if (pelements[i] == NULL || strlen(pelements[i]) == 0) {
1858        continue; // skip the empty path values
1859      }
1860      snprintf(buffer, buflen, "%s/lib%s.so", pelements[i], fname);
1861      if (file_exists(buffer)) {
1862        break;
1863      }
1864    }
1865    // release the storage
1866    for (int i = 0 ; i < n ; i++) {
1867      if (pelements[i] != NULL) {
1868        FREE_C_HEAP_ARRAY(char, pelements[i]);
1869      }
1870    }
1871    if (pelements != NULL) {
1872      FREE_C_HEAP_ARRAY(char*, pelements);
1873    }
1874  } else {
1875    snprintf(buffer, buflen, "%s/lib%s.so", pname, fname);
1876  }
1877}
1878
1879const char* os::get_current_directory(char *buf, int buflen) {
1880  return getcwd(buf, buflen);
1881}
1882
1883// check if addr is inside libjvm[_g].so
1884bool os::address_is_in_vm(address addr) {
1885  static address libjvm_base_addr;
1886  Dl_info dlinfo;
1887
1888  if (libjvm_base_addr == NULL) {
1889    dladdr(CAST_FROM_FN_PTR(void *, os::address_is_in_vm), &dlinfo);
1890    libjvm_base_addr = (address)dlinfo.dli_fbase;
1891    assert(libjvm_base_addr !=NULL, "Cannot obtain base address for libjvm");
1892  }
1893
1894  if (dladdr((void *)addr, &dlinfo)) {
1895    if (libjvm_base_addr == (address)dlinfo.dli_fbase) return true;
1896  }
1897
1898  return false;
1899}
1900
1901typedef int (*dladdr1_func_type) (void *, Dl_info *, void **, int);
1902static dladdr1_func_type dladdr1_func = NULL;
1903
1904bool os::dll_address_to_function_name(address addr, char *buf,
1905                                      int buflen, int * offset) {
1906  Dl_info dlinfo;
1907
1908  // dladdr1_func was initialized in os::init()
1909  if (dladdr1_func){
1910      // yes, we have dladdr1
1911
1912      // Support for dladdr1 is checked at runtime; it may be
1913      // available even if the vm is built on a machine that does
1914      // not have dladdr1 support.  Make sure there is a value for
1915      // RTLD_DL_SYMENT.
1916      #ifndef RTLD_DL_SYMENT
1917      #define RTLD_DL_SYMENT 1
1918      #endif
1919      Sym * info;
1920      if (dladdr1_func((void *)addr, &dlinfo, (void **)&info,
1921                       RTLD_DL_SYMENT)) {
1922          if (buf) jio_snprintf(buf, buflen, "%s", dlinfo.dli_sname);
1923          if (offset) *offset = addr - (address)dlinfo.dli_saddr;
1924
1925          // check if the returned symbol really covers addr
1926          return ((char *)dlinfo.dli_saddr + info->st_size > (char *)addr);
1927      } else {
1928          if (buf) buf[0] = '\0';
1929          if (offset) *offset  = -1;
1930          return false;
1931      }
1932  } else {
1933      // no, only dladdr is available
1934      if(dladdr((void *)addr, &dlinfo)) {
1935          if (buf) jio_snprintf(buf, buflen, dlinfo.dli_sname);
1936          if (offset) *offset = addr - (address)dlinfo.dli_saddr;
1937          return true;
1938      } else {
1939          if (buf) buf[0] = '\0';
1940          if (offset) *offset  = -1;
1941          return false;
1942      }
1943  }
1944}
1945
1946bool os::dll_address_to_library_name(address addr, char* buf,
1947                                     int buflen, int* offset) {
1948  Dl_info dlinfo;
1949
1950  if (dladdr((void*)addr, &dlinfo)){
1951     if (buf) jio_snprintf(buf, buflen, "%s", dlinfo.dli_fname);
1952     if (offset) *offset = addr - (address)dlinfo.dli_fbase;
1953     return true;
1954  } else {
1955     if (buf) buf[0] = '\0';
1956     if (offset) *offset = -1;
1957     return false;
1958  }
1959}
1960
1961// Prints the names and full paths of all opened dynamic libraries
1962// for current process
1963void os::print_dll_info(outputStream * st) {
1964    Dl_info dli;
1965    void *handle;
1966    Link_map *map;
1967    Link_map *p;
1968
1969    st->print_cr("Dynamic libraries:"); st->flush();
1970
1971    if (!dladdr(CAST_FROM_FN_PTR(void *, os::print_dll_info), &dli)) {
1972        st->print_cr("Error: Cannot print dynamic libraries.");
1973        return;
1974    }
1975    handle = dlopen(dli.dli_fname, RTLD_LAZY);
1976    if (handle == NULL) {
1977        st->print_cr("Error: Cannot print dynamic libraries.");
1978        return;
1979    }
1980    dlinfo(handle, RTLD_DI_LINKMAP, &map);
1981    if (map == NULL) {
1982        st->print_cr("Error: Cannot print dynamic libraries.");
1983        return;
1984    }
1985
1986    while (map->l_prev != NULL)
1987        map = map->l_prev;
1988
1989    while (map != NULL) {
1990        st->print_cr(PTR_FORMAT " \t%s", map->l_addr, map->l_name);
1991        map = map->l_next;
1992    }
1993
1994    dlclose(handle);
1995}
1996
1997  // Loads .dll/.so and
1998  // in case of error it checks if .dll/.so was built for the
1999  // same architecture as Hotspot is running on
2000
2001void * os::dll_load(const char *filename, char *ebuf, int ebuflen)
2002{
2003  void * result= ::dlopen(filename, RTLD_LAZY);
2004  if (result != NULL) {
2005    // Successful loading
2006    return result;
2007  }
2008
2009  Elf32_Ehdr elf_head;
2010
2011  // Read system error message into ebuf
2012  // It may or may not be overwritten below
2013  ::strncpy(ebuf, ::dlerror(), ebuflen-1);
2014  ebuf[ebuflen-1]='\0';
2015  int diag_msg_max_length=ebuflen-strlen(ebuf);
2016  char* diag_msg_buf=ebuf+strlen(ebuf);
2017
2018  if (diag_msg_max_length==0) {
2019    // No more space in ebuf for additional diagnostics message
2020    return NULL;
2021  }
2022
2023
2024  int file_descriptor= ::open(filename, O_RDONLY | O_NONBLOCK);
2025
2026  if (file_descriptor < 0) {
2027    // Can't open library, report dlerror() message
2028    return NULL;
2029  }
2030
2031  bool failed_to_read_elf_head=
2032    (sizeof(elf_head)!=
2033        (::read(file_descriptor, &elf_head,sizeof(elf_head)))) ;
2034
2035  ::close(file_descriptor);
2036  if (failed_to_read_elf_head) {
2037    // file i/o error - report dlerror() msg
2038    return NULL;
2039  }
2040
2041  typedef struct {
2042    Elf32_Half  code;         // Actual value as defined in elf.h
2043    Elf32_Half  compat_class; // Compatibility of archs at VM's sense
2044    char        elf_class;    // 32 or 64 bit
2045    char        endianess;    // MSB or LSB
2046    char*       name;         // String representation
2047  } arch_t;
2048
2049  static const arch_t arch_array[]={
2050    {EM_386,         EM_386,     ELFCLASS32, ELFDATA2LSB, (char*)"IA 32"},
2051    {EM_486,         EM_386,     ELFCLASS32, ELFDATA2LSB, (char*)"IA 32"},
2052    {EM_IA_64,       EM_IA_64,   ELFCLASS64, ELFDATA2LSB, (char*)"IA 64"},
2053    {EM_X86_64,      EM_X86_64,  ELFCLASS64, ELFDATA2LSB, (char*)"AMD 64"},
2054    {EM_SPARC,       EM_SPARC,   ELFCLASS32, ELFDATA2MSB, (char*)"Sparc 32"},
2055    {EM_SPARC32PLUS, EM_SPARC,   ELFCLASS32, ELFDATA2MSB, (char*)"Sparc 32"},
2056    {EM_SPARCV9,     EM_SPARCV9, ELFCLASS64, ELFDATA2MSB, (char*)"Sparc v9 64"},
2057    {EM_PPC,         EM_PPC,     ELFCLASS32, ELFDATA2MSB, (char*)"Power PC 32"},
2058    {EM_PPC64,       EM_PPC64,   ELFCLASS64, ELFDATA2MSB, (char*)"Power PC 64"}
2059  };
2060
2061  #if  (defined IA32)
2062    static  Elf32_Half running_arch_code=EM_386;
2063  #elif   (defined AMD64)
2064    static  Elf32_Half running_arch_code=EM_X86_64;
2065  #elif  (defined IA64)
2066    static  Elf32_Half running_arch_code=EM_IA_64;
2067  #elif  (defined __sparc) && (defined _LP64)
2068    static  Elf32_Half running_arch_code=EM_SPARCV9;
2069  #elif  (defined __sparc) && (!defined _LP64)
2070    static  Elf32_Half running_arch_code=EM_SPARC;
2071  #elif  (defined __powerpc64__)
2072    static  Elf32_Half running_arch_code=EM_PPC64;
2073  #elif  (defined __powerpc__)
2074    static  Elf32_Half running_arch_code=EM_PPC;
2075  #else
2076    #error Method os::dll_load requires that one of following is defined:\
2077         IA32, AMD64, IA64, __sparc, __powerpc__
2078  #endif
2079
2080  // Identify compatability class for VM's architecture and library's architecture
2081  // Obtain string descriptions for architectures
2082
2083  arch_t lib_arch={elf_head.e_machine,0,elf_head.e_ident[EI_CLASS], elf_head.e_ident[EI_DATA], NULL};
2084  int running_arch_index=-1;
2085
2086  for (unsigned int i=0 ; i < ARRAY_SIZE(arch_array) ; i++ ) {
2087    if (running_arch_code == arch_array[i].code) {
2088      running_arch_index    = i;
2089    }
2090    if (lib_arch.code == arch_array[i].code) {
2091      lib_arch.compat_class = arch_array[i].compat_class;
2092      lib_arch.name         = arch_array[i].name;
2093    }
2094  }
2095
2096  assert(running_arch_index != -1,
2097    "Didn't find running architecture code (running_arch_code) in arch_array");
2098  if (running_arch_index == -1) {
2099    // Even though running architecture detection failed
2100    // we may still continue with reporting dlerror() message
2101    return NULL;
2102  }
2103
2104  if (lib_arch.endianess != arch_array[running_arch_index].endianess) {
2105    ::snprintf(diag_msg_buf, diag_msg_max_length-1," (Possible cause: endianness mismatch)");
2106    return NULL;
2107  }
2108
2109  if (lib_arch.elf_class != arch_array[running_arch_index].elf_class) {
2110    ::snprintf(diag_msg_buf, diag_msg_max_length-1," (Possible cause: architecture word width mismatch)");
2111    return NULL;
2112  }
2113
2114  if (lib_arch.compat_class != arch_array[running_arch_index].compat_class) {
2115    if ( lib_arch.name!=NULL ) {
2116      ::snprintf(diag_msg_buf, diag_msg_max_length-1,
2117        " (Possible cause: can't load %s-bit .so on a %s-bit platform)",
2118        lib_arch.name, arch_array[running_arch_index].name);
2119    } else {
2120      ::snprintf(diag_msg_buf, diag_msg_max_length-1,
2121      " (Possible cause: can't load this .so (machine code=0x%x) on a %s-bit platform)",
2122        lib_arch.code,
2123        arch_array[running_arch_index].name);
2124    }
2125  }
2126
2127  return NULL;
2128}
2129
2130void* os::dll_lookup(void* handle, const char* name) {
2131  return dlsym(handle, name);
2132}
2133
2134
2135bool _print_ascii_file(const char* filename, outputStream* st) {
2136  int fd = open(filename, O_RDONLY);
2137  if (fd == -1) {
2138     return false;
2139  }
2140
2141  char buf[32];
2142  int bytes;
2143  while ((bytes = read(fd, buf, sizeof(buf))) > 0) {
2144    st->print_raw(buf, bytes);
2145  }
2146
2147  close(fd);
2148
2149  return true;
2150}
2151
2152void os::print_os_info(outputStream* st) {
2153  st->print("OS:");
2154
2155  if (!_print_ascii_file("/etc/release", st)) {
2156    st->print("Solaris");
2157  }
2158  st->cr();
2159
2160  // kernel
2161  st->print("uname:");
2162  struct utsname name;
2163  uname(&name);
2164  st->print(name.sysname); st->print(" ");
2165  st->print(name.release); st->print(" ");
2166  st->print(name.version); st->print(" ");
2167  st->print(name.machine);
2168
2169  // libthread
2170  if (os::Solaris::T2_libthread()) st->print("  (T2 libthread)");
2171  else st->print("  (T1 libthread)");
2172  st->cr();
2173
2174  // rlimit
2175  st->print("rlimit:");
2176  struct rlimit rlim;
2177
2178  st->print(" STACK ");
2179  getrlimit(RLIMIT_STACK, &rlim);
2180  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2181  else st->print("%uk", rlim.rlim_cur >> 10);
2182
2183  st->print(", CORE ");
2184  getrlimit(RLIMIT_CORE, &rlim);
2185  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2186  else st->print("%uk", rlim.rlim_cur >> 10);
2187
2188  st->print(", NOFILE ");
2189  getrlimit(RLIMIT_NOFILE, &rlim);
2190  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2191  else st->print("%d", rlim.rlim_cur);
2192
2193  st->print(", AS ");
2194  getrlimit(RLIMIT_AS, &rlim);
2195  if (rlim.rlim_cur == RLIM_INFINITY) st->print("infinity");
2196  else st->print("%uk", rlim.rlim_cur >> 10);
2197  st->cr();
2198
2199  // load average
2200  st->print("load average:");
2201  double loadavg[3];
2202  os::loadavg(loadavg, 3);
2203  st->print("%0.02f %0.02f %0.02f", loadavg[0], loadavg[1], loadavg[2]);
2204  st->cr();
2205}
2206
2207
2208static bool check_addr0(outputStream* st) {
2209  jboolean status = false;
2210  int fd = open("/proc/self/map",O_RDONLY);
2211  if (fd >= 0) {
2212    prmap_t p;
2213    while(read(fd, &p, sizeof(p)) > 0) {
2214      if (p.pr_vaddr == 0x0) {
2215        st->print("Warning: Address: 0x%x, Size: %dK, ",p.pr_vaddr, p.pr_size/1024, p.pr_mapname);
2216        st->print("Mapped file: %s, ", p.pr_mapname[0] == '\0' ? "None" : p.pr_mapname);
2217        st->print("Access:");
2218        st->print("%s",(p.pr_mflags & MA_READ)  ? "r" : "-");
2219        st->print("%s",(p.pr_mflags & MA_WRITE) ? "w" : "-");
2220        st->print("%s",(p.pr_mflags & MA_EXEC)  ? "x" : "-");
2221        st->cr();
2222        status = true;
2223      }
2224      close(fd);
2225    }
2226  }
2227  return status;
2228}
2229
2230void os::print_memory_info(outputStream* st) {
2231  st->print("Memory:");
2232  st->print(" %dk page", os::vm_page_size()>>10);
2233  st->print(", physical " UINT64_FORMAT "k", os::physical_memory()>>10);
2234  st->print("(" UINT64_FORMAT "k free)", os::available_memory() >> 10);
2235  st->cr();
2236  (void) check_addr0(st);
2237}
2238
2239// Taken from /usr/include/sys/machsig.h  Supposed to be architecture specific
2240// but they're the same for all the solaris architectures that we support.
2241const char *ill_names[] = { "ILL0", "ILL_ILLOPC", "ILL_ILLOPN", "ILL_ILLADR",
2242                          "ILL_ILLTRP", "ILL_PRVOPC", "ILL_PRVREG",
2243                          "ILL_COPROC", "ILL_BADSTK" };
2244
2245const char *fpe_names[] = { "FPE0", "FPE_INTDIV", "FPE_INTOVF", "FPE_FLTDIV",
2246                          "FPE_FLTOVF", "FPE_FLTUND", "FPE_FLTRES",
2247                          "FPE_FLTINV", "FPE_FLTSUB" };
2248
2249const char *segv_names[] = { "SEGV0", "SEGV_MAPERR", "SEGV_ACCERR" };
2250
2251const char *bus_names[] = { "BUS0", "BUS_ADRALN", "BUS_ADRERR", "BUS_OBJERR" };
2252
2253void os::print_siginfo(outputStream* st, void* siginfo) {
2254  st->print("siginfo:");
2255
2256  const int buflen = 100;
2257  char buf[buflen];
2258  siginfo_t *si = (siginfo_t*)siginfo;
2259  st->print("si_signo=%s: ", os::exception_name(si->si_signo, buf, buflen));
2260  char *err = strerror(si->si_errno);
2261  if (si->si_errno != 0 && err != NULL) {
2262    st->print("si_errno=%s", err);
2263  } else {
2264    st->print("si_errno=%d", si->si_errno);
2265  }
2266  const int c = si->si_code;
2267  assert(c > 0, "unexpected si_code");
2268  switch (si->si_signo) {
2269  case SIGILL:
2270    st->print(", si_code=%d (%s)", c, c > 8 ? "" : ill_names[c]);
2271    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2272    break;
2273  case SIGFPE:
2274    st->print(", si_code=%d (%s)", c, c > 9 ? "" : fpe_names[c]);
2275    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2276    break;
2277  case SIGSEGV:
2278    st->print(", si_code=%d (%s)", c, c > 2 ? "" : segv_names[c]);
2279    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2280    break;
2281  case SIGBUS:
2282    st->print(", si_code=%d (%s)", c, c > 3 ? "" : bus_names[c]);
2283    st->print(", si_addr=" PTR_FORMAT, si->si_addr);
2284    break;
2285  default:
2286    st->print(", si_code=%d", si->si_code);
2287    // no si_addr
2288  }
2289
2290  if ((si->si_signo == SIGBUS || si->si_signo == SIGSEGV) &&
2291      UseSharedSpaces) {
2292    FileMapInfo* mapinfo = FileMapInfo::current_info();
2293    if (mapinfo->is_in_shared_space(si->si_addr)) {
2294      st->print("\n\nError accessing class data sharing archive."   \
2295                " Mapped file inaccessible during execution, "      \
2296                " possible disk/network problem.");
2297    }
2298  }
2299  st->cr();
2300}
2301
2302// Moved from whole group, because we need them here for diagnostic
2303// prints.
2304#define OLDMAXSIGNUM 32
2305static int Maxsignum = 0;
2306static int *ourSigFlags = NULL;
2307
2308extern "C" void sigINTRHandler(int, siginfo_t*, void*);
2309
2310int os::Solaris::get_our_sigflags(int sig) {
2311  assert(ourSigFlags!=NULL, "signal data structure not initialized");
2312  assert(sig > 0 && sig < Maxsignum, "vm signal out of expected range");
2313  return ourSigFlags[sig];
2314}
2315
2316void os::Solaris::set_our_sigflags(int sig, int flags) {
2317  assert(ourSigFlags!=NULL, "signal data structure not initialized");
2318  assert(sig > 0 && sig < Maxsignum, "vm signal out of expected range");
2319  ourSigFlags[sig] = flags;
2320}
2321
2322
2323static const char* get_signal_handler_name(address handler,
2324                                           char* buf, int buflen) {
2325  int offset;
2326  bool found = os::dll_address_to_library_name(handler, buf, buflen, &offset);
2327  if (found) {
2328    // skip directory names
2329    const char *p1, *p2;
2330    p1 = buf;
2331    size_t len = strlen(os::file_separator());
2332    while ((p2 = strstr(p1, os::file_separator())) != NULL) p1 = p2 + len;
2333    jio_snprintf(buf, buflen, "%s+0x%x", p1, offset);
2334  } else {
2335    jio_snprintf(buf, buflen, PTR_FORMAT, handler);
2336  }
2337  return buf;
2338}
2339
2340static void print_signal_handler(outputStream* st, int sig,
2341                                  char* buf, size_t buflen) {
2342  struct sigaction sa;
2343
2344  sigaction(sig, NULL, &sa);
2345
2346  st->print("%s: ", os::exception_name(sig, buf, buflen));
2347
2348  address handler = (sa.sa_flags & SA_SIGINFO)
2349                  ? CAST_FROM_FN_PTR(address, sa.sa_sigaction)
2350                  : CAST_FROM_FN_PTR(address, sa.sa_handler);
2351
2352  if (handler == CAST_FROM_FN_PTR(address, SIG_DFL)) {
2353    st->print("SIG_DFL");
2354  } else if (handler == CAST_FROM_FN_PTR(address, SIG_IGN)) {
2355    st->print("SIG_IGN");
2356  } else {
2357    st->print("[%s]", get_signal_handler_name(handler, buf, buflen));
2358  }
2359
2360  st->print(", sa_mask[0]=" PTR32_FORMAT, *(uint32_t*)&sa.sa_mask);
2361
2362  address rh = VMError::get_resetted_sighandler(sig);
2363  // May be, handler was resetted by VMError?
2364  if(rh != NULL) {
2365    handler = rh;
2366    sa.sa_flags = VMError::get_resetted_sigflags(sig);
2367  }
2368
2369  st->print(", sa_flags="   PTR32_FORMAT, sa.sa_flags);
2370
2371  // Check: is it our handler?
2372  if(handler == CAST_FROM_FN_PTR(address, signalHandler) ||
2373     handler == CAST_FROM_FN_PTR(address, sigINTRHandler)) {
2374    // It is our signal handler
2375    // check for flags
2376    if(sa.sa_flags != os::Solaris::get_our_sigflags(sig)) {
2377      st->print(
2378        ", flags was changed from " PTR32_FORMAT ", consider using jsig library",
2379        os::Solaris::get_our_sigflags(sig));
2380    }
2381  }
2382  st->cr();
2383}
2384
2385void os::print_signal_handlers(outputStream* st, char* buf, size_t buflen) {
2386  st->print_cr("Signal Handlers:");
2387  print_signal_handler(st, SIGSEGV, buf, buflen);
2388  print_signal_handler(st, SIGBUS , buf, buflen);
2389  print_signal_handler(st, SIGFPE , buf, buflen);
2390  print_signal_handler(st, SIGPIPE, buf, buflen);
2391  print_signal_handler(st, SIGXFSZ, buf, buflen);
2392  print_signal_handler(st, SIGILL , buf, buflen);
2393  print_signal_handler(st, INTERRUPT_SIGNAL, buf, buflen);
2394  print_signal_handler(st, ASYNC_SIGNAL, buf, buflen);
2395  print_signal_handler(st, BREAK_SIGNAL, buf, buflen);
2396  print_signal_handler(st, SHUTDOWN1_SIGNAL , buf, buflen);
2397  print_signal_handler(st, SHUTDOWN2_SIGNAL , buf, buflen);
2398  print_signal_handler(st, SHUTDOWN3_SIGNAL, buf, buflen);
2399  print_signal_handler(st, os::Solaris::SIGinterrupt(), buf, buflen);
2400  print_signal_handler(st, os::Solaris::SIGasync(), buf, buflen);
2401}
2402
2403static char saved_jvm_path[MAXPATHLEN] = { 0 };
2404
2405// Find the full path to the current module, libjvm.so or libjvm_g.so
2406void os::jvm_path(char *buf, jint buflen) {
2407  // Error checking.
2408  if (buflen < MAXPATHLEN) {
2409    assert(false, "must use a large-enough buffer");
2410    buf[0] = '\0';
2411    return;
2412  }
2413  // Lazy resolve the path to current module.
2414  if (saved_jvm_path[0] != 0) {
2415    strcpy(buf, saved_jvm_path);
2416    return;
2417  }
2418
2419  Dl_info dlinfo;
2420  int ret = dladdr(CAST_FROM_FN_PTR(void *, os::jvm_path), &dlinfo);
2421  assert(ret != 0, "cannot locate libjvm");
2422  realpath((char *)dlinfo.dli_fname, buf);
2423
2424  if (strcmp(Arguments::sun_java_launcher(), "gamma") == 0) {
2425    // Support for the gamma launcher.  Typical value for buf is
2426    // "<JAVA_HOME>/jre/lib/<arch>/<vmtype>/libjvm.so".  If "/jre/lib/" appears at
2427    // the right place in the string, then assume we are installed in a JDK and
2428    // we're done.  Otherwise, check for a JAVA_HOME environment variable and fix
2429    // up the path so it looks like libjvm.so is installed there (append a
2430    // fake suffix hotspot/libjvm.so).
2431    const char *p = buf + strlen(buf) - 1;
2432    for (int count = 0; p > buf && count < 5; ++count) {
2433      for (--p; p > buf && *p != '/'; --p)
2434        /* empty */ ;
2435    }
2436
2437    if (strncmp(p, "/jre/lib/", 9) != 0) {
2438      // Look for JAVA_HOME in the environment.
2439      char* java_home_var = ::getenv("JAVA_HOME");
2440      if (java_home_var != NULL && java_home_var[0] != 0) {
2441        char cpu_arch[12];
2442        sysinfo(SI_ARCHITECTURE, cpu_arch, sizeof(cpu_arch));
2443#ifdef _LP64
2444        // If we are on sparc running a 64-bit vm, look in jre/lib/sparcv9.
2445        if (strcmp(cpu_arch, "sparc") == 0) {
2446          strcat(cpu_arch, "v9");
2447        } else if (strcmp(cpu_arch, "i386") == 0) {
2448          strcpy(cpu_arch, "amd64");
2449        }
2450#endif
2451        // Check the current module name "libjvm.so" or "libjvm_g.so".
2452        p = strrchr(buf, '/');
2453        assert(strstr(p, "/libjvm") == p, "invalid library name");
2454        p = strstr(p, "_g") ? "_g" : "";
2455
2456        realpath(java_home_var, buf);
2457        sprintf(buf + strlen(buf), "/jre/lib/%s", cpu_arch);
2458        if (0 == access(buf, F_OK)) {
2459          // Use current module name "libjvm[_g].so" instead of
2460          // "libjvm"debug_only("_g")".so" since for fastdebug version
2461          // we should have "libjvm.so" but debug_only("_g") adds "_g"!
2462          // It is used when we are choosing the HPI library's name
2463          // "libhpi[_g].so" in hpi::initialize_get_interface().
2464          sprintf(buf + strlen(buf), "/hotspot/libjvm%s.so", p);
2465        } else {
2466          // Go back to path of .so
2467          realpath((char *)dlinfo.dli_fname, buf);
2468        }
2469      }
2470    }
2471  }
2472
2473  strcpy(saved_jvm_path, buf);
2474}
2475
2476
2477void os::print_jni_name_prefix_on(outputStream* st, int args_size) {
2478  // no prefix required, not even "_"
2479}
2480
2481
2482void os::print_jni_name_suffix_on(outputStream* st, int args_size) {
2483  // no suffix required
2484}
2485
2486
2487// sun.misc.Signal
2488
2489extern "C" {
2490  static void UserHandler(int sig, void *siginfo, void *context) {
2491    // Ctrl-C is pressed during error reporting, likely because the error
2492    // handler fails to abort. Let VM die immediately.
2493    if (sig == SIGINT && is_error_reported()) {
2494       os::die();
2495    }
2496
2497    os::signal_notify(sig);
2498    // We do not need to reinstate the signal handler each time...
2499  }
2500}
2501
2502void* os::user_handler() {
2503  return CAST_FROM_FN_PTR(void*, UserHandler);
2504}
2505
2506extern "C" {
2507  typedef void (*sa_handler_t)(int);
2508  typedef void (*sa_sigaction_t)(int, siginfo_t *, void *);
2509}
2510
2511void* os::signal(int signal_number, void* handler) {
2512  struct sigaction sigAct, oldSigAct;
2513  sigfillset(&(sigAct.sa_mask));
2514  sigAct.sa_flags = SA_RESTART & ~SA_RESETHAND;
2515  sigAct.sa_handler = CAST_TO_FN_PTR(sa_handler_t, handler);
2516
2517  if (sigaction(signal_number, &sigAct, &oldSigAct))
2518    // -1 means registration failed
2519    return (void *)-1;
2520
2521  return CAST_FROM_FN_PTR(void*, oldSigAct.sa_handler);
2522}
2523
2524void os::signal_raise(int signal_number) {
2525  raise(signal_number);
2526}
2527
2528/*
2529 * The following code is moved from os.cpp for making this
2530 * code platform specific, which it is by its very nature.
2531 */
2532
2533// a counter for each possible signal value
2534static int Sigexit = 0;
2535static int Maxlibjsigsigs;
2536static jint *pending_signals = NULL;
2537static int *preinstalled_sigs = NULL;
2538static struct sigaction *chainedsigactions = NULL;
2539static sema_t sig_sem;
2540typedef int (*version_getting_t)();
2541version_getting_t os::Solaris::get_libjsig_version = NULL;
2542static int libjsigversion = NULL;
2543
2544int os::sigexitnum_pd() {
2545  assert(Sigexit > 0, "signal memory not yet initialized");
2546  return Sigexit;
2547}
2548
2549void os::Solaris::init_signal_mem() {
2550  // Initialize signal structures
2551  Maxsignum = SIGRTMAX;
2552  Sigexit = Maxsignum+1;
2553  assert(Maxsignum >0, "Unable to obtain max signal number");
2554
2555  Maxlibjsigsigs = Maxsignum;
2556
2557  // pending_signals has one int per signal
2558  // The additional signal is for SIGEXIT - exit signal to signal_thread
2559  pending_signals = (jint *)os::malloc(sizeof(jint) * (Sigexit+1));
2560  memset(pending_signals, 0, (sizeof(jint) * (Sigexit+1)));
2561
2562  if (UseSignalChaining) {
2563     chainedsigactions = (struct sigaction *)malloc(sizeof(struct sigaction)
2564       * (Maxsignum + 1));
2565     memset(chainedsigactions, 0, (sizeof(struct sigaction) * (Maxsignum + 1)));
2566     preinstalled_sigs = (int *)os::malloc(sizeof(int) * (Maxsignum + 1));
2567     memset(preinstalled_sigs, 0, (sizeof(int) * (Maxsignum + 1)));
2568  }
2569  ourSigFlags = (int*)malloc(sizeof(int) * (Maxsignum + 1 ));
2570  memset(ourSigFlags, 0, sizeof(int) * (Maxsignum + 1));
2571}
2572
2573void os::signal_init_pd() {
2574  int ret;
2575
2576  ret = ::sema_init(&sig_sem, 0, NULL, NULL);
2577  assert(ret == 0, "sema_init() failed");
2578}
2579
2580void os::signal_notify(int signal_number) {
2581  int ret;
2582
2583  Atomic::inc(&pending_signals[signal_number]);
2584  ret = ::sema_post(&sig_sem);
2585  assert(ret == 0, "sema_post() failed");
2586}
2587
2588static int check_pending_signals(bool wait_for_signal) {
2589  int ret;
2590  while (true) {
2591    for (int i = 0; i < Sigexit + 1; i++) {
2592      jint n = pending_signals[i];
2593      if (n > 0 && n == Atomic::cmpxchg(n - 1, &pending_signals[i], n)) {
2594        return i;
2595      }
2596    }
2597    if (!wait_for_signal) {
2598      return -1;
2599    }
2600    JavaThread *thread = JavaThread::current();
2601    ThreadBlockInVM tbivm(thread);
2602
2603    bool threadIsSuspended;
2604    do {
2605      thread->set_suspend_equivalent();
2606      // cleared by handle_special_suspend_equivalent_condition() or java_suspend_self()
2607      while((ret = ::sema_wait(&sig_sem)) == EINTR)
2608          ;
2609      assert(ret == 0, "sema_wait() failed");
2610
2611      // were we externally suspended while we were waiting?
2612      threadIsSuspended = thread->handle_special_suspend_equivalent_condition();
2613      if (threadIsSuspended) {
2614        //
2615        // The semaphore has been incremented, but while we were waiting
2616        // another thread suspended us. We don't want to continue running
2617        // while suspended because that would surprise the thread that
2618        // suspended us.
2619        //
2620        ret = ::sema_post(&sig_sem);
2621        assert(ret == 0, "sema_post() failed");
2622
2623        thread->java_suspend_self();
2624      }
2625    } while (threadIsSuspended);
2626  }
2627}
2628
2629int os::signal_lookup() {
2630  return check_pending_signals(false);
2631}
2632
2633int os::signal_wait() {
2634  return check_pending_signals(true);
2635}
2636
2637////////////////////////////////////////////////////////////////////////////////
2638// Virtual Memory
2639
2640static int page_size = -1;
2641
2642// The mmap MAP_ALIGN flag is supported on Solaris 9 and later.  init_2() will
2643// clear this var if support is not available.
2644static bool has_map_align = true;
2645
2646int os::vm_page_size() {
2647  assert(page_size != -1, "must call os::init");
2648  return page_size;
2649}
2650
2651// Solaris allocates memory by pages.
2652int os::vm_allocation_granularity() {
2653  assert(page_size != -1, "must call os::init");
2654  return page_size;
2655}
2656
2657bool os::commit_memory(char* addr, size_t bytes, bool exec) {
2658  int prot = exec ? PROT_READ|PROT_WRITE|PROT_EXEC : PROT_READ|PROT_WRITE;
2659  size_t size = bytes;
2660  return
2661     NULL != Solaris::mmap_chunk(addr, size, MAP_PRIVATE|MAP_FIXED, prot);
2662}
2663
2664bool os::commit_memory(char* addr, size_t bytes, size_t alignment_hint,
2665                       bool exec) {
2666  if (commit_memory(addr, bytes, exec)) {
2667    if (UseMPSS && alignment_hint > (size_t)vm_page_size()) {
2668      // If the large page size has been set and the VM
2669      // is using large pages, use the large page size
2670      // if it is smaller than the alignment hint. This is
2671      // a case where the VM wants to use a larger alignment size
2672      // for its own reasons but still want to use large pages
2673      // (which is what matters to setting the mpss range.
2674      size_t page_size = 0;
2675      if (large_page_size() < alignment_hint) {
2676        assert(UseLargePages, "Expected to be here for large page use only");
2677        page_size = large_page_size();
2678      } else {
2679        // If the alignment hint is less than the large page
2680        // size, the VM wants a particular alignment (thus the hint)
2681        // for internal reasons.  Try to set the mpss range using
2682        // the alignment_hint.
2683        page_size = alignment_hint;
2684      }
2685      // Since this is a hint, ignore any failures.
2686      (void)Solaris::set_mpss_range(addr, bytes, page_size);
2687    }
2688    return true;
2689  }
2690  return false;
2691}
2692
2693// Uncommit the pages in a specified region.
2694void os::free_memory(char* addr, size_t bytes) {
2695  if (madvise(addr, bytes, MADV_FREE) < 0) {
2696    debug_only(warning("MADV_FREE failed."));
2697    return;
2698  }
2699}
2700
2701// Change the page size in a given range.
2702void os::realign_memory(char *addr, size_t bytes, size_t alignment_hint) {
2703  assert((intptr_t)addr % alignment_hint == 0, "Address should be aligned.");
2704  assert((intptr_t)(addr + bytes) % alignment_hint == 0, "End should be aligned.");
2705  Solaris::set_mpss_range(addr, bytes, alignment_hint);
2706}
2707
2708// Tell the OS to make the range local to the first-touching LWP
2709void os::numa_make_local(char *addr, size_t bytes, int lgrp_hint) {
2710  assert((intptr_t)addr % os::vm_page_size() == 0, "Address should be page-aligned.");
2711  if (madvise(addr, bytes, MADV_ACCESS_LWP) < 0) {
2712    debug_only(warning("MADV_ACCESS_LWP failed."));
2713  }
2714}
2715
2716// Tell the OS that this range would be accessed from different LWPs.
2717void os::numa_make_global(char *addr, size_t bytes) {
2718  assert((intptr_t)addr % os::vm_page_size() == 0, "Address should be page-aligned.");
2719  if (madvise(addr, bytes, MADV_ACCESS_MANY) < 0) {
2720    debug_only(warning("MADV_ACCESS_MANY failed."));
2721  }
2722}
2723
2724// Get the number of the locality groups.
2725size_t os::numa_get_groups_num() {
2726  size_t n = Solaris::lgrp_nlgrps(Solaris::lgrp_cookie());
2727  return n != -1 ? n : 1;
2728}
2729
2730// Get a list of leaf locality groups. A leaf lgroup is group that
2731// doesn't have any children. Typical leaf group is a CPU or a CPU/memory
2732// board. An LWP is assigned to one of these groups upon creation.
2733size_t os::numa_get_leaf_groups(int *ids, size_t size) {
2734   if ((ids[0] = Solaris::lgrp_root(Solaris::lgrp_cookie())) == -1) {
2735     ids[0] = 0;
2736     return 1;
2737   }
2738   int result_size = 0, top = 1, bottom = 0, cur = 0;
2739   for (int k = 0; k < size; k++) {
2740     int r = Solaris::lgrp_children(Solaris::lgrp_cookie(), ids[cur],
2741                                    (Solaris::lgrp_id_t*)&ids[top], size - top);
2742     if (r == -1) {
2743       ids[0] = 0;
2744       return 1;
2745     }
2746     if (!r) {
2747       // That's a leaf node.
2748       assert (bottom <= cur, "Sanity check");
2749       // Check if the node has memory
2750       if (Solaris::lgrp_resources(Solaris::lgrp_cookie(), ids[cur],
2751                                   NULL, 0, LGRP_RSRC_MEM) > 0) {
2752         ids[bottom++] = ids[cur];
2753       }
2754     }
2755     top += r;
2756     cur++;
2757   }
2758   if (bottom == 0) {
2759     // Handle a situation, when the OS reports no memory available.
2760     // Assume UMA architecture.
2761     ids[0] = 0;
2762     return 1;
2763   }
2764   return bottom;
2765}
2766
2767// Detect the topology change. Typically happens during CPU plugging-unplugging.
2768bool os::numa_topology_changed() {
2769  int is_stale = Solaris::lgrp_cookie_stale(Solaris::lgrp_cookie());
2770  if (is_stale != -1 && is_stale) {
2771    Solaris::lgrp_fini(Solaris::lgrp_cookie());
2772    Solaris::lgrp_cookie_t c = Solaris::lgrp_init(Solaris::LGRP_VIEW_CALLER);
2773    assert(c != 0, "Failure to initialize LGRP API");
2774    Solaris::set_lgrp_cookie(c);
2775    return true;
2776  }
2777  return false;
2778}
2779
2780// Get the group id of the current LWP.
2781int os::numa_get_group_id() {
2782  int lgrp_id = Solaris::lgrp_home(P_LWPID, P_MYID);
2783  if (lgrp_id == -1) {
2784    return 0;
2785  }
2786  const int size = os::numa_get_groups_num();
2787  int *ids = (int*)alloca(size * sizeof(int));
2788
2789  // Get the ids of all lgroups with memory; r is the count.
2790  int r = Solaris::lgrp_resources(Solaris::lgrp_cookie(), lgrp_id,
2791                                  (Solaris::lgrp_id_t*)ids, size, LGRP_RSRC_MEM);
2792  if (r <= 0) {
2793    return 0;
2794  }
2795  return ids[os::random() % r];
2796}
2797
2798// Request information about the page.
2799bool os::get_page_info(char *start, page_info* info) {
2800  const uint_t info_types[] = { MEMINFO_VLGRP, MEMINFO_VPAGESIZE };
2801  uint64_t addr = (uintptr_t)start;
2802  uint64_t outdata[2];
2803  uint_t validity = 0;
2804
2805  if (os::Solaris::meminfo(&addr, 1, info_types, 2, outdata, &validity) < 0) {
2806    return false;
2807  }
2808
2809  info->size = 0;
2810  info->lgrp_id = -1;
2811
2812  if ((validity & 1) != 0) {
2813    if ((validity & 2) != 0) {
2814      info->lgrp_id = outdata[0];
2815    }
2816    if ((validity & 4) != 0) {
2817      info->size = outdata[1];
2818    }
2819    return true;
2820  }
2821  return false;
2822}
2823
2824// Scan the pages from start to end until a page different than
2825// the one described in the info parameter is encountered.
2826char *os::scan_pages(char *start, char* end, page_info* page_expected, page_info* page_found) {
2827  const uint_t info_types[] = { MEMINFO_VLGRP, MEMINFO_VPAGESIZE };
2828  const size_t types = sizeof(info_types) / sizeof(info_types[0]);
2829  uint64_t addrs[MAX_MEMINFO_CNT], outdata[types * MAX_MEMINFO_CNT];
2830  uint_t validity[MAX_MEMINFO_CNT];
2831
2832  size_t page_size = MAX2((size_t)os::vm_page_size(), page_expected->size);
2833  uint64_t p = (uint64_t)start;
2834  while (p < (uint64_t)end) {
2835    addrs[0] = p;
2836    size_t addrs_count = 1;
2837    while (addrs_count < MAX_MEMINFO_CNT && addrs[addrs_count - 1] < (uint64_t)end) {
2838      addrs[addrs_count] = addrs[addrs_count - 1] + page_size;
2839      addrs_count++;
2840    }
2841
2842    if (os::Solaris::meminfo(addrs, addrs_count, info_types, types, outdata, validity) < 0) {
2843      return NULL;
2844    }
2845
2846    size_t i = 0;
2847    for (; i < addrs_count; i++) {
2848      if ((validity[i] & 1) != 0) {
2849        if ((validity[i] & 4) != 0) {
2850          if (outdata[types * i + 1] != page_expected->size) {
2851            break;
2852          }
2853        } else
2854          if (page_expected->size != 0) {
2855            break;
2856          }
2857
2858        if ((validity[i] & 2) != 0 && page_expected->lgrp_id > 0) {
2859          if (outdata[types * i] != page_expected->lgrp_id) {
2860            break;
2861          }
2862        }
2863      } else {
2864        return NULL;
2865      }
2866    }
2867
2868    if (i != addrs_count) {
2869      if ((validity[i] & 2) != 0) {
2870        page_found->lgrp_id = outdata[types * i];
2871      } else {
2872        page_found->lgrp_id = -1;
2873      }
2874      if ((validity[i] & 4) != 0) {
2875        page_found->size = outdata[types * i + 1];
2876      } else {
2877        page_found->size = 0;
2878      }
2879      return (char*)addrs[i];
2880    }
2881
2882    p = addrs[addrs_count - 1] + page_size;
2883  }
2884  return end;
2885}
2886
2887bool os::uncommit_memory(char* addr, size_t bytes) {
2888  size_t size = bytes;
2889  // Map uncommitted pages PROT_NONE so we fail early if we touch an
2890  // uncommitted page. Otherwise, the read/write might succeed if we
2891  // have enough swap space to back the physical page.
2892  return
2893    NULL != Solaris::mmap_chunk(addr, size,
2894                                MAP_PRIVATE|MAP_FIXED|MAP_NORESERVE,
2895                                PROT_NONE);
2896}
2897
2898char* os::Solaris::mmap_chunk(char *addr, size_t size, int flags, int prot) {
2899  char *b = (char *)mmap(addr, size, prot, flags, os::Solaris::_dev_zero_fd, 0);
2900
2901  if (b == MAP_FAILED) {
2902    return NULL;
2903  }
2904  return b;
2905}
2906
2907char* os::Solaris::anon_mmap(char* requested_addr, size_t bytes, size_t alignment_hint, bool fixed) {
2908  char* addr = requested_addr;
2909  int flags = MAP_PRIVATE | MAP_NORESERVE;
2910
2911  assert(!(fixed && (alignment_hint > 0)), "alignment hint meaningless with fixed mmap");
2912
2913  if (fixed) {
2914    flags |= MAP_FIXED;
2915  } else if (has_map_align && (alignment_hint > (size_t) vm_page_size())) {
2916    flags |= MAP_ALIGN;
2917    addr = (char*) alignment_hint;
2918  }
2919
2920  // Map uncommitted pages PROT_NONE so we fail early if we touch an
2921  // uncommitted page. Otherwise, the read/write might succeed if we
2922  // have enough swap space to back the physical page.
2923  return mmap_chunk(addr, bytes, flags, PROT_NONE);
2924}
2925
2926char* os::reserve_memory(size_t bytes, char* requested_addr, size_t alignment_hint) {
2927  char* addr = Solaris::anon_mmap(requested_addr, bytes, alignment_hint, (requested_addr != NULL));
2928
2929  guarantee(requested_addr == NULL || requested_addr == addr,
2930            "OS failed to return requested mmap address.");
2931  return addr;
2932}
2933
2934// Reserve memory at an arbitrary address, only if that area is
2935// available (and not reserved for something else).
2936
2937char* os::attempt_reserve_memory_at(size_t bytes, char* requested_addr) {
2938  const int max_tries = 10;
2939  char* base[max_tries];
2940  size_t size[max_tries];
2941
2942  // Solaris adds a gap between mmap'ed regions.  The size of the gap
2943  // is dependent on the requested size and the MMU.  Our initial gap
2944  // value here is just a guess and will be corrected later.
2945  bool had_top_overlap = false;
2946  bool have_adjusted_gap = false;
2947  size_t gap = 0x400000;
2948
2949  // Assert only that the size is a multiple of the page size, since
2950  // that's all that mmap requires, and since that's all we really know
2951  // about at this low abstraction level.  If we need higher alignment,
2952  // we can either pass an alignment to this method or verify alignment
2953  // in one of the methods further up the call chain.  See bug 5044738.
2954  assert(bytes % os::vm_page_size() == 0, "reserving unexpected size block");
2955
2956  // Since snv_84, Solaris attempts to honor the address hint - see 5003415.
2957  // Give it a try, if the kernel honors the hint we can return immediately.
2958  char* addr = Solaris::anon_mmap(requested_addr, bytes, 0, false);
2959  volatile int err = errno;
2960  if (addr == requested_addr) {
2961    return addr;
2962  } else if (addr != NULL) {
2963    unmap_memory(addr, bytes);
2964  }
2965
2966  if (PrintMiscellaneous && Verbose) {
2967    char buf[256];
2968    buf[0] = '\0';
2969    if (addr == NULL) {
2970      jio_snprintf(buf, sizeof(buf), ": %s", strerror(err));
2971    }
2972    warning("attempt_reserve_memory_at: couldn't reserve %d bytes at "
2973            PTR_FORMAT ": reserve_memory_helper returned " PTR_FORMAT
2974            "%s", bytes, requested_addr, addr, buf);
2975  }
2976
2977  // Address hint method didn't work.  Fall back to the old method.
2978  // In theory, once SNV becomes our oldest supported platform, this
2979  // code will no longer be needed.
2980  //
2981  // Repeatedly allocate blocks until the block is allocated at the
2982  // right spot. Give up after max_tries.
2983  int i;
2984  for (i = 0; i < max_tries; ++i) {
2985    base[i] = reserve_memory(bytes);
2986
2987    if (base[i] != NULL) {
2988      // Is this the block we wanted?
2989      if (base[i] == requested_addr) {
2990        size[i] = bytes;
2991        break;
2992      }
2993
2994      // check that the gap value is right
2995      if (had_top_overlap && !have_adjusted_gap) {
2996        size_t actual_gap = base[i-1] - base[i] - bytes;
2997        if (gap != actual_gap) {
2998          // adjust the gap value and retry the last 2 allocations
2999          assert(i > 0, "gap adjustment code problem");
3000          have_adjusted_gap = true;  // adjust the gap only once, just in case
3001          gap = actual_gap;
3002          if (PrintMiscellaneous && Verbose) {
3003            warning("attempt_reserve_memory_at: adjusted gap to 0x%lx", gap);
3004          }
3005          unmap_memory(base[i], bytes);
3006          unmap_memory(base[i-1], size[i-1]);
3007          i-=2;
3008          continue;
3009        }
3010      }
3011
3012      // Does this overlap the block we wanted? Give back the overlapped
3013      // parts and try again.
3014      //
3015      // There is still a bug in this code: if top_overlap == bytes,
3016      // the overlap is offset from requested region by the value of gap.
3017      // In this case giving back the overlapped part will not work,
3018      // because we'll give back the entire block at base[i] and
3019      // therefore the subsequent allocation will not generate a new gap.
3020      // This could be fixed with a new algorithm that used larger
3021      // or variable size chunks to find the requested region -
3022      // but such a change would introduce additional complications.
3023      // It's rare enough that the planets align for this bug,
3024      // so we'll just wait for a fix for 6204603/5003415 which
3025      // will provide a mmap flag to allow us to avoid this business.
3026
3027      size_t top_overlap = requested_addr + (bytes + gap) - base[i];
3028      if (top_overlap >= 0 && top_overlap < bytes) {
3029        had_top_overlap = true;
3030        unmap_memory(base[i], top_overlap);
3031        base[i] += top_overlap;
3032        size[i] = bytes - top_overlap;
3033      } else {
3034        size_t bottom_overlap = base[i] + bytes - requested_addr;
3035        if (bottom_overlap >= 0 && bottom_overlap < bytes) {
3036          if (PrintMiscellaneous && Verbose && bottom_overlap == 0) {
3037            warning("attempt_reserve_memory_at: possible alignment bug");
3038          }
3039          unmap_memory(requested_addr, bottom_overlap);
3040          size[i] = bytes - bottom_overlap;
3041        } else {
3042          size[i] = bytes;
3043        }
3044      }
3045    }
3046  }
3047
3048  // Give back the unused reserved pieces.
3049
3050  for (int j = 0; j < i; ++j) {
3051    if (base[j] != NULL) {
3052      unmap_memory(base[j], size[j]);
3053    }
3054  }
3055
3056  return (i < max_tries) ? requested_addr : NULL;
3057}
3058
3059bool os::release_memory(char* addr, size_t bytes) {
3060  size_t size = bytes;
3061  return munmap(addr, size) == 0;
3062}
3063
3064static bool solaris_mprotect(char* addr, size_t bytes, int prot) {
3065  assert(addr == (char*)align_size_down((uintptr_t)addr, os::vm_page_size()),
3066         "addr must be page aligned");
3067  int retVal = mprotect(addr, bytes, prot);
3068  return retVal == 0;
3069}
3070
3071// Protect memory (Used to pass readonly pages through
3072// JNI GetArray<type>Elements with empty arrays.)
3073// Also, used for serialization page and for compressed oops null pointer
3074// checking.
3075bool os::protect_memory(char* addr, size_t bytes, ProtType prot,
3076                        bool is_committed) {
3077  unsigned int p = 0;
3078  switch (prot) {
3079  case MEM_PROT_NONE: p = PROT_NONE; break;
3080  case MEM_PROT_READ: p = PROT_READ; break;
3081  case MEM_PROT_RW:   p = PROT_READ|PROT_WRITE; break;
3082  case MEM_PROT_RWX:  p = PROT_READ|PROT_WRITE|PROT_EXEC; break;
3083  default:
3084    ShouldNotReachHere();
3085  }
3086  // is_committed is unused.
3087  return solaris_mprotect(addr, bytes, p);
3088}
3089
3090// guard_memory and unguard_memory only happens within stack guard pages.
3091// Since ISM pertains only to the heap, guard and unguard memory should not
3092/// happen with an ISM region.
3093bool os::guard_memory(char* addr, size_t bytes) {
3094  return solaris_mprotect(addr, bytes, PROT_NONE);
3095}
3096
3097bool os::unguard_memory(char* addr, size_t bytes) {
3098  return solaris_mprotect(addr, bytes, PROT_READ|PROT_WRITE);
3099}
3100
3101// Large page support
3102
3103// UseLargePages is the master flag to enable/disable large page memory.
3104// UseMPSS and UseISM are supported for compatibility reasons. Their combined
3105// effects can be described in the following table:
3106//
3107// UseLargePages UseMPSS UseISM
3108//    false         *       *   => UseLargePages is the master switch, turning
3109//                                 it off will turn off both UseMPSS and
3110//                                 UseISM. VM will not use large page memory
3111//                                 regardless the settings of UseMPSS/UseISM.
3112//     true      false    false => Unless future Solaris provides other
3113//                                 mechanism to use large page memory, this
3114//                                 combination is equivalent to -UseLargePages,
3115//                                 VM will not use large page memory
3116//     true      true     false => JVM will use MPSS for large page memory.
3117//                                 This is the default behavior.
3118//     true      false    true  => JVM will use ISM for large page memory.
3119//     true      true     true  => JVM will use ISM if it is available.
3120//                                 Otherwise, JVM will fall back to MPSS.
3121//                                 Becaues ISM is now available on all
3122//                                 supported Solaris versions, this combination
3123//                                 is equivalent to +UseISM -UseMPSS.
3124
3125typedef int (*getpagesizes_func_type) (size_t[], int);
3126static size_t _large_page_size = 0;
3127
3128bool os::Solaris::ism_sanity_check(bool warn, size_t * page_size) {
3129  // x86 uses either 2M or 4M page, depending on whether PAE (Physical Address
3130  // Extensions) mode is enabled. AMD64/EM64T uses 2M page in 64bit mode. Sparc
3131  // can support multiple page sizes.
3132
3133  // Don't bother to probe page size because getpagesizes() comes with MPSS.
3134  // ISM is only recommended on old Solaris where there is no MPSS support.
3135  // Simply choose a conservative value as default.
3136  *page_size = LargePageSizeInBytes ? LargePageSizeInBytes :
3137               SPARC_ONLY(4 * M) IA32_ONLY(4 * M) AMD64_ONLY(2 * M);
3138
3139  // ISM is available on all supported Solaris versions
3140  return true;
3141}
3142
3143// Insertion sort for small arrays (descending order).
3144static void insertion_sort_descending(size_t* array, int len) {
3145  for (int i = 0; i < len; i++) {
3146    size_t val = array[i];
3147    for (size_t key = i; key > 0 && array[key - 1] < val; --key) {
3148      size_t tmp = array[key];
3149      array[key] = array[key - 1];
3150      array[key - 1] = tmp;
3151    }
3152  }
3153}
3154
3155bool os::Solaris::mpss_sanity_check(bool warn, size_t * page_size) {
3156  getpagesizes_func_type getpagesizes_func =
3157    CAST_TO_FN_PTR(getpagesizes_func_type, dlsym(RTLD_DEFAULT, "getpagesizes"));
3158  if (getpagesizes_func == NULL) {
3159    if (warn) {
3160      warning("MPSS is not supported by the operating system.");
3161    }
3162    return false;
3163  }
3164
3165  const unsigned int usable_count = VM_Version::page_size_count();
3166  if (usable_count == 1) {
3167    return false;
3168  }
3169
3170  // Fill the array of page sizes.
3171  int n = getpagesizes_func(_page_sizes, page_sizes_max);
3172  assert(n > 0, "Solaris bug?");
3173  if (n == page_sizes_max) {
3174    // Add a sentinel value (necessary only if the array was completely filled
3175    // since it is static (zeroed at initialization)).
3176    _page_sizes[--n] = 0;
3177    DEBUG_ONLY(warning("increase the size of the os::_page_sizes array.");)
3178  }
3179  assert(_page_sizes[n] == 0, "missing sentinel");
3180
3181  if (n == 1) return false;     // Only one page size available.
3182
3183  // Skip sizes larger than 4M (or LargePageSizeInBytes if it was set) and
3184  // select up to usable_count elements.  First sort the array, find the first
3185  // acceptable value, then copy the usable sizes to the top of the array and
3186  // trim the rest.  Make sure to include the default page size :-).
3187  //
3188  // A better policy could get rid of the 4M limit by taking the sizes of the
3189  // important VM memory regions (java heap and possibly the code cache) into
3190  // account.
3191  insertion_sort_descending(_page_sizes, n);
3192  const size_t size_limit =
3193    FLAG_IS_DEFAULT(LargePageSizeInBytes) ? 4 * M : LargePageSizeInBytes;
3194  int beg;
3195  for (beg = 0; beg < n && _page_sizes[beg] > size_limit; ++beg) /* empty */ ;
3196  const int end = MIN2((int)usable_count, n) - 1;
3197  for (int cur = 0; cur < end; ++cur, ++beg) {
3198    _page_sizes[cur] = _page_sizes[beg];
3199  }
3200  _page_sizes[end] = vm_page_size();
3201  _page_sizes[end + 1] = 0;
3202
3203  if (_page_sizes[end] > _page_sizes[end - 1]) {
3204    // Default page size is not the smallest; sort again.
3205    insertion_sort_descending(_page_sizes, end + 1);
3206  }
3207  *page_size = _page_sizes[0];
3208
3209  return true;
3210}
3211
3212bool os::large_page_init() {
3213  if (!UseLargePages) {
3214    UseISM = false;
3215    UseMPSS = false;
3216    return false;
3217  }
3218
3219  // print a warning if any large page related flag is specified on command line
3220  bool warn_on_failure = !FLAG_IS_DEFAULT(UseLargePages)        ||
3221                         !FLAG_IS_DEFAULT(UseISM)               ||
3222                         !FLAG_IS_DEFAULT(UseMPSS)              ||
3223                         !FLAG_IS_DEFAULT(LargePageSizeInBytes);
3224  UseISM = UseISM &&
3225           Solaris::ism_sanity_check(warn_on_failure, &_large_page_size);
3226  if (UseISM) {
3227    // ISM disables MPSS to be compatible with old JDK behavior
3228    UseMPSS = false;
3229    _page_sizes[0] = _large_page_size;
3230    _page_sizes[1] = vm_page_size();
3231  }
3232
3233  UseMPSS = UseMPSS &&
3234            Solaris::mpss_sanity_check(warn_on_failure, &_large_page_size);
3235
3236  UseLargePages = UseISM || UseMPSS;
3237  return UseLargePages;
3238}
3239
3240bool os::Solaris::set_mpss_range(caddr_t start, size_t bytes, size_t align) {
3241  // Signal to OS that we want large pages for addresses
3242  // from addr, addr + bytes
3243  struct memcntl_mha mpss_struct;
3244  mpss_struct.mha_cmd = MHA_MAPSIZE_VA;
3245  mpss_struct.mha_pagesize = align;
3246  mpss_struct.mha_flags = 0;
3247  if (memcntl(start, bytes, MC_HAT_ADVISE,
3248              (caddr_t) &mpss_struct, 0, 0) < 0) {
3249    debug_only(warning("Attempt to use MPSS failed."));
3250    return false;
3251  }
3252  return true;
3253}
3254
3255char* os::reserve_memory_special(size_t bytes, char* addr, bool exec) {
3256  // "exec" is passed in but not used.  Creating the shared image for
3257  // the code cache doesn't have an SHM_X executable permission to check.
3258  assert(UseLargePages && UseISM, "only for ISM large pages");
3259
3260  size_t size = bytes;
3261  char* retAddr = NULL;
3262  int shmid;
3263  key_t ismKey;
3264
3265  bool warn_on_failure = UseISM &&
3266                        (!FLAG_IS_DEFAULT(UseLargePages)         ||
3267                         !FLAG_IS_DEFAULT(UseISM)                ||
3268                         !FLAG_IS_DEFAULT(LargePageSizeInBytes)
3269                        );
3270  char msg[128];
3271
3272  ismKey = IPC_PRIVATE;
3273
3274  // Create a large shared memory region to attach to based on size.
3275  // Currently, size is the total size of the heap
3276  shmid = shmget(ismKey, size, SHM_R | SHM_W | IPC_CREAT);
3277  if (shmid == -1){
3278     if (warn_on_failure) {
3279       jio_snprintf(msg, sizeof(msg), "Failed to reserve shared memory (errno = %d).", errno);
3280       warning(msg);
3281     }
3282     return NULL;
3283  }
3284
3285  // Attach to the region
3286  retAddr = (char *) shmat(shmid, 0, SHM_SHARE_MMU | SHM_R | SHM_W);
3287  int err = errno;
3288
3289  // Remove shmid. If shmat() is successful, the actual shared memory segment
3290  // will be deleted when it's detached by shmdt() or when the process
3291  // terminates. If shmat() is not successful this will remove the shared
3292  // segment immediately.
3293  shmctl(shmid, IPC_RMID, NULL);
3294
3295  if (retAddr == (char *) -1) {
3296    if (warn_on_failure) {
3297      jio_snprintf(msg, sizeof(msg), "Failed to attach shared memory (errno = %d).", err);
3298      warning(msg);
3299    }
3300    return NULL;
3301  }
3302
3303  return retAddr;
3304}
3305
3306bool os::release_memory_special(char* base, size_t bytes) {
3307  // detaching the SHM segment will also delete it, see reserve_memory_special()
3308  int rslt = shmdt(base);
3309  return rslt == 0;
3310}
3311
3312size_t os::large_page_size() {
3313  return _large_page_size;
3314}
3315
3316// MPSS allows application to commit large page memory on demand; with ISM
3317// the entire memory region must be allocated as shared memory.
3318bool os::can_commit_large_page_memory() {
3319  return UseISM ? false : true;
3320}
3321
3322bool os::can_execute_large_page_memory() {
3323  return UseISM ? false : true;
3324}
3325
3326static int os_sleep(jlong millis, bool interruptible) {
3327  const jlong limit = INT_MAX;
3328  jlong prevtime;
3329  int res;
3330
3331  while (millis > limit) {
3332    if ((res = os_sleep(limit, interruptible)) != OS_OK)
3333      return res;
3334    millis -= limit;
3335  }
3336
3337  // Restart interrupted polls with new parameters until the proper delay
3338  // has been completed.
3339
3340  prevtime = getTimeMillis();
3341
3342  while (millis > 0) {
3343    jlong newtime;
3344
3345    if (!interruptible) {
3346      // Following assert fails for os::yield_all:
3347      // assert(!thread->is_Java_thread(), "must not be java thread");
3348      res = poll(NULL, 0, millis);
3349    } else {
3350      JavaThread *jt = JavaThread::current();
3351
3352      INTERRUPTIBLE_NORESTART_VM_ALWAYS(poll(NULL, 0, millis), res, jt,
3353        os::Solaris::clear_interrupted);
3354    }
3355
3356    // INTERRUPTIBLE_NORESTART_VM_ALWAYS returns res == OS_INTRPT for
3357    // thread.Interrupt.
3358
3359    if((res == OS_ERR) && (errno == EINTR)) {
3360      newtime = getTimeMillis();
3361      assert(newtime >= prevtime, "time moving backwards");
3362    /* Doing prevtime and newtime in microseconds doesn't help precision,
3363       and trying to round up to avoid lost milliseconds can result in a
3364       too-short delay. */
3365      millis -= newtime - prevtime;
3366      if(millis <= 0)
3367        return OS_OK;
3368      prevtime = newtime;
3369    } else
3370      return res;
3371  }
3372
3373  return OS_OK;
3374}
3375
3376// Read calls from inside the vm need to perform state transitions
3377size_t os::read(int fd, void *buf, unsigned int nBytes) {
3378  INTERRUPTIBLE_RETURN_INT_VM(::read(fd, buf, nBytes), os::Solaris::clear_interrupted);
3379}
3380
3381int os::sleep(Thread* thread, jlong millis, bool interruptible) {
3382  assert(thread == Thread::current(),  "thread consistency check");
3383
3384  // TODO-FIXME: this should be removed.
3385  // On Solaris machines (especially 2.5.1) we found that sometimes the VM gets into a live lock
3386  // situation with a JavaThread being starved out of a lwp. The kernel doesn't seem to generate
3387  // a SIGWAITING signal which would enable the threads library to create a new lwp for the starving
3388  // thread. We suspect that because the Watcher thread keeps waking up at periodic intervals the kernel
3389  // is fooled into believing that the system is making progress. In the code below we block the
3390  // the watcher thread while safepoint is in progress so that it would not appear as though the
3391  // system is making progress.
3392  if (!Solaris::T2_libthread() &&
3393      thread->is_Watcher_thread() && SafepointSynchronize::is_synchronizing() && !Arguments::has_profile()) {
3394    // We now try to acquire the threads lock. Since this lock is held by the VM thread during
3395    // the entire safepoint, the watcher thread will  line up here during the safepoint.
3396    Threads_lock->lock_without_safepoint_check();
3397    Threads_lock->unlock();
3398  }
3399
3400  if (thread->is_Java_thread()) {
3401    // This is a JavaThread so we honor the _thread_blocked protocol
3402    // even for sleeps of 0 milliseconds. This was originally done
3403    // as a workaround for bug 4338139. However, now we also do it
3404    // to honor the suspend-equivalent protocol.
3405
3406    JavaThread *jt = (JavaThread *) thread;
3407    ThreadBlockInVM tbivm(jt);
3408
3409    jt->set_suspend_equivalent();
3410    // cleared by handle_special_suspend_equivalent_condition() or
3411    // java_suspend_self() via check_and_wait_while_suspended()
3412
3413    int ret_code;
3414    if (millis <= 0) {
3415      thr_yield();
3416      ret_code = 0;
3417    } else {
3418      // The original sleep() implementation did not create an
3419      // OSThreadWaitState helper for sleeps of 0 milliseconds.
3420      // I'm preserving that decision for now.
3421      OSThreadWaitState osts(jt->osthread(), false /* not Object.wait() */);
3422
3423      ret_code = os_sleep(millis, interruptible);
3424    }
3425
3426    // were we externally suspended while we were waiting?
3427    jt->check_and_wait_while_suspended();
3428
3429    return ret_code;
3430  }
3431
3432  // non-JavaThread from this point on:
3433
3434  if (millis <= 0) {
3435    thr_yield();
3436    return 0;
3437  }
3438
3439  OSThreadWaitState osts(thread->osthread(), false /* not Object.wait() */);
3440
3441  return os_sleep(millis, interruptible);
3442}
3443
3444int os::naked_sleep() {
3445  // %% make the sleep time an integer flag. for now use 1 millisec.
3446  return os_sleep(1, false);
3447}
3448
3449// Sleep forever; naked call to OS-specific sleep; use with CAUTION
3450void os::infinite_sleep() {
3451  while (true) {    // sleep forever ...
3452    ::sleep(100);   // ... 100 seconds at a time
3453  }
3454}
3455
3456// Used to convert frequent JVM_Yield() to nops
3457bool os::dont_yield() {
3458  if (DontYieldALot) {
3459    static hrtime_t last_time = 0;
3460    hrtime_t diff = getTimeNanos() - last_time;
3461
3462    if (diff < DontYieldALotInterval * 1000000)
3463      return true;
3464
3465    last_time += diff;
3466
3467    return false;
3468  }
3469  else {
3470    return false;
3471  }
3472}
3473
3474// Caveat: Solaris os::yield() causes a thread-state transition whereas
3475// the linux and win32 implementations do not.  This should be checked.
3476
3477void os::yield() {
3478  // Yields to all threads with same or greater priority
3479  os::sleep(Thread::current(), 0, false);
3480}
3481
3482// Note that yield semantics are defined by the scheduling class to which
3483// the thread currently belongs.  Typically, yield will _not yield to
3484// other equal or higher priority threads that reside on the dispatch queues
3485// of other CPUs.
3486
3487os::YieldResult os::NakedYield() { thr_yield(); return os::YIELD_UNKNOWN; }
3488
3489
3490// On Solaris we found that yield_all doesn't always yield to all other threads.
3491// There have been cases where there is a thread ready to execute but it doesn't
3492// get an lwp as the VM thread continues to spin with sleeps of 1 millisecond.
3493// The 1 millisecond wait doesn't seem long enough for the kernel to issue a
3494// SIGWAITING signal which will cause a new lwp to be created. So we count the
3495// number of times yield_all is called in the one loop and increase the sleep
3496// time after 8 attempts. If this fails too we increase the concurrency level
3497// so that the starving thread would get an lwp
3498
3499void os::yield_all(int attempts) {
3500  // Yields to all threads, including threads with lower priorities
3501  if (attempts == 0) {
3502    os::sleep(Thread::current(), 1, false);
3503  } else {
3504    int iterations = attempts % 30;
3505    if (iterations == 0 && !os::Solaris::T2_libthread()) {
3506      // thr_setconcurrency and _getconcurrency make sense only under T1.
3507      int noofLWPS = thr_getconcurrency();
3508      if (noofLWPS < (Threads::number_of_threads() + 2)) {
3509        thr_setconcurrency(thr_getconcurrency() + 1);
3510      }
3511    } else if (iterations < 25) {
3512      os::sleep(Thread::current(), 1, false);
3513    } else {
3514      os::sleep(Thread::current(), 10, false);
3515    }
3516  }
3517}
3518
3519// Called from the tight loops to possibly influence time-sharing heuristics
3520void os::loop_breaker(int attempts) {
3521  os::yield_all(attempts);
3522}
3523
3524
3525// Interface for setting lwp priorities.  If we are using T2 libthread,
3526// which forces the use of BoundThreads or we manually set UseBoundThreads,
3527// all of our threads will be assigned to real lwp's.  Using the thr_setprio
3528// function is meaningless in this mode so we must adjust the real lwp's priority
3529// The routines below implement the getting and setting of lwp priorities.
3530//
3531// Note: There are three priority scales used on Solaris.  Java priotities
3532//       which range from 1 to 10, libthread "thr_setprio" scale which range
3533//       from 0 to 127, and the current scheduling class of the process we
3534//       are running in.  This is typically from -60 to +60.
3535//       The setting of the lwp priorities in done after a call to thr_setprio
3536//       so Java priorities are mapped to libthread priorities and we map from
3537//       the latter to lwp priorities.  We don't keep priorities stored in
3538//       Java priorities since some of our worker threads want to set priorities
3539//       higher than all Java threads.
3540//
3541// For related information:
3542// (1)  man -s 2 priocntl
3543// (2)  man -s 4 priocntl
3544// (3)  man dispadmin
3545// =    librt.so
3546// =    libthread/common/rtsched.c - thrp_setlwpprio().
3547// =    ps -cL <pid> ... to validate priority.
3548// =    sched_get_priority_min and _max
3549//              pthread_create
3550//              sched_setparam
3551//              pthread_setschedparam
3552//
3553// Assumptions:
3554// +    We assume that all threads in the process belong to the same
3555//              scheduling class.   IE. an homogenous process.
3556// +    Must be root or in IA group to change change "interactive" attribute.
3557//              Priocntl() will fail silently.  The only indication of failure is when
3558//              we read-back the value and notice that it hasn't changed.
3559// +    Interactive threads enter the runq at the head, non-interactive at the tail.
3560// +    For RT, change timeslice as well.  Invariant:
3561//              constant "priority integral"
3562//              Konst == TimeSlice * (60-Priority)
3563//              Given a priority, compute appropriate timeslice.
3564// +    Higher numerical values have higher priority.
3565
3566// sched class attributes
3567typedef struct {
3568        int   schedPolicy;              // classID
3569        int   maxPrio;
3570        int   minPrio;
3571} SchedInfo;
3572
3573
3574static SchedInfo tsLimits, iaLimits, rtLimits;
3575
3576#ifdef ASSERT
3577static int  ReadBackValidate = 1;
3578#endif
3579static int  myClass     = 0;
3580static int  myMin       = 0;
3581static int  myMax       = 0;
3582static int  myCur       = 0;
3583static bool priocntl_enable = false;
3584
3585
3586// Call the version of priocntl suitable for all supported versions
3587// of Solaris. We need to call through this wrapper so that we can
3588// build on Solaris 9 and run on Solaris 8, 9 and 10.
3589//
3590// This code should be removed if we ever stop supporting Solaris 8
3591// and earlier releases.
3592
3593static long priocntl_stub(int pcver, idtype_t idtype, id_t id, int cmd, caddr_t arg);
3594typedef long (*priocntl_type)(int pcver, idtype_t idtype, id_t id, int cmd, caddr_t arg);
3595static priocntl_type priocntl_ptr = priocntl_stub;
3596
3597// Stub to set the value of the real pointer, and then call the real
3598// function.
3599
3600static long priocntl_stub(int pcver, idtype_t idtype, id_t id, int cmd, caddr_t arg) {
3601  // Try Solaris 8- name only.
3602  priocntl_type tmp = (priocntl_type)dlsym(RTLD_DEFAULT, "__priocntl");
3603  guarantee(tmp != NULL, "priocntl function not found.");
3604  priocntl_ptr = tmp;
3605  return (*priocntl_ptr)(PC_VERSION, idtype, id, cmd, arg);
3606}
3607
3608
3609// lwp_priocntl_init
3610//
3611// Try to determine the priority scale for our process.
3612//
3613// Return errno or 0 if OK.
3614//
3615static
3616int     lwp_priocntl_init ()
3617{
3618  int rslt;
3619  pcinfo_t ClassInfo;
3620  pcparms_t ParmInfo;
3621  int i;
3622
3623  if (!UseThreadPriorities) return 0;
3624
3625  // We are using Bound threads, we need to determine our priority ranges
3626  if (os::Solaris::T2_libthread() || UseBoundThreads) {
3627    // If ThreadPriorityPolicy is 1, switch tables
3628    if (ThreadPriorityPolicy == 1) {
3629      for (i = 0 ; i < MaxPriority+1; i++)
3630        os::java_to_os_priority[i] = prio_policy1[i];
3631    }
3632  }
3633  // Not using Bound Threads, set to ThreadPolicy 1
3634  else {
3635    for ( i = 0 ; i < MaxPriority+1; i++ ) {
3636      os::java_to_os_priority[i] = prio_policy1[i];
3637    }
3638    return 0;
3639  }
3640
3641
3642  // Get IDs for a set of well-known scheduling classes.
3643  // TODO-FIXME: GETCLINFO returns the current # of classes in the
3644  // the system.  We should have a loop that iterates over the
3645  // classID values, which are known to be "small" integers.
3646
3647  strcpy(ClassInfo.pc_clname, "TS");
3648  ClassInfo.pc_cid = -1;
3649  rslt = (*priocntl_ptr)(PC_VERSION, P_ALL, 0, PC_GETCID, (caddr_t)&ClassInfo);
3650  if (rslt < 0) return errno;
3651  assert(ClassInfo.pc_cid != -1, "cid for TS class is -1");
3652  tsLimits.schedPolicy = ClassInfo.pc_cid;
3653  tsLimits.maxPrio = ((tsinfo_t*)ClassInfo.pc_clinfo)->ts_maxupri;
3654  tsLimits.minPrio = -tsLimits.maxPrio;
3655
3656  strcpy(ClassInfo.pc_clname, "IA");
3657  ClassInfo.pc_cid = -1;
3658  rslt = (*priocntl_ptr)(PC_VERSION, P_ALL, 0, PC_GETCID, (caddr_t)&ClassInfo);
3659  if (rslt < 0) return errno;
3660  assert(ClassInfo.pc_cid != -1, "cid for IA class is -1");
3661  iaLimits.schedPolicy = ClassInfo.pc_cid;
3662  iaLimits.maxPrio = ((iainfo_t*)ClassInfo.pc_clinfo)->ia_maxupri;
3663  iaLimits.minPrio = -iaLimits.maxPrio;
3664
3665  strcpy(ClassInfo.pc_clname, "RT");
3666  ClassInfo.pc_cid = -1;
3667  rslt = (*priocntl_ptr)(PC_VERSION, P_ALL, 0, PC_GETCID, (caddr_t)&ClassInfo);
3668  if (rslt < 0) return errno;
3669  assert(ClassInfo.pc_cid != -1, "cid for RT class is -1");
3670  rtLimits.schedPolicy = ClassInfo.pc_cid;
3671  rtLimits.maxPrio = ((rtinfo_t*)ClassInfo.pc_clinfo)->rt_maxpri;
3672  rtLimits.minPrio = 0;
3673
3674
3675  // Query our "current" scheduling class.
3676  // This will normally be IA,TS or, rarely, RT.
3677  memset (&ParmInfo, 0, sizeof(ParmInfo));
3678  ParmInfo.pc_cid = PC_CLNULL;
3679  rslt = (*priocntl_ptr) (PC_VERSION, P_PID, P_MYID, PC_GETPARMS, (caddr_t)&ParmInfo );
3680  if ( rslt < 0 ) return errno;
3681  myClass = ParmInfo.pc_cid;
3682
3683  // We now know our scheduling classId, get specific information
3684  // the class.
3685  ClassInfo.pc_cid = myClass;
3686  ClassInfo.pc_clname[0] = 0;
3687  rslt = (*priocntl_ptr) (PC_VERSION, (idtype)0, 0, PC_GETCLINFO, (caddr_t)&ClassInfo );
3688  if ( rslt < 0 ) return errno;
3689
3690  if (ThreadPriorityVerbose)
3691    tty->print_cr ("lwp_priocntl_init: Class=%d(%s)...", myClass, ClassInfo.pc_clname);
3692
3693  memset(&ParmInfo, 0, sizeof(pcparms_t));
3694  ParmInfo.pc_cid = PC_CLNULL;
3695  rslt = (*priocntl_ptr)(PC_VERSION, P_PID, P_MYID, PC_GETPARMS, (caddr_t)&ParmInfo);
3696  if (rslt < 0) return errno;
3697
3698  if (ParmInfo.pc_cid == rtLimits.schedPolicy) {
3699    myMin = rtLimits.minPrio;
3700    myMax = rtLimits.maxPrio;
3701  } else if (ParmInfo.pc_cid == iaLimits.schedPolicy) {
3702    iaparms_t *iaInfo  = (iaparms_t*)ParmInfo.pc_clparms;
3703    myMin = iaLimits.minPrio;
3704    myMax = iaLimits.maxPrio;
3705    myMax = MIN2(myMax, (int)iaInfo->ia_uprilim);       // clamp - restrict
3706  } else if (ParmInfo.pc_cid == tsLimits.schedPolicy) {
3707    tsparms_t *tsInfo  = (tsparms_t*)ParmInfo.pc_clparms;
3708    myMin = tsLimits.minPrio;
3709    myMax = tsLimits.maxPrio;
3710    myMax = MIN2(myMax, (int)tsInfo->ts_uprilim);       // clamp - restrict
3711  } else {
3712    // No clue - punt
3713    if (ThreadPriorityVerbose)
3714      tty->print_cr ("Unknown scheduling class: %s ... \n", ClassInfo.pc_clname);
3715    return EINVAL;      // no clue, punt
3716  }
3717
3718  if (ThreadPriorityVerbose)
3719        tty->print_cr ("Thread priority Range: [%d..%d]\n", myMin, myMax);
3720
3721  priocntl_enable = true;  // Enable changing priorities
3722  return 0;
3723}
3724
3725#define IAPRI(x)        ((iaparms_t *)((x).pc_clparms))
3726#define RTPRI(x)        ((rtparms_t *)((x).pc_clparms))
3727#define TSPRI(x)        ((tsparms_t *)((x).pc_clparms))
3728
3729
3730// scale_to_lwp_priority
3731//
3732// Convert from the libthread "thr_setprio" scale to our current
3733// lwp scheduling class scale.
3734//
3735static
3736int     scale_to_lwp_priority (int rMin, int rMax, int x)
3737{
3738  int v;
3739
3740  if (x == 127) return rMax;            // avoid round-down
3741    v = (((x*(rMax-rMin)))/128)+rMin;
3742  return v;
3743}
3744
3745
3746// set_lwp_priority
3747//
3748// Set the priority of the lwp.  This call should only be made
3749// when using bound threads (T2 threads are bound by default).
3750//
3751int     set_lwp_priority (int ThreadID, int lwpid, int newPrio )
3752{
3753  int rslt;
3754  int Actual, Expected, prv;
3755  pcparms_t ParmInfo;                   // for GET-SET
3756#ifdef ASSERT
3757  pcparms_t ReadBack;                   // for readback
3758#endif
3759
3760  // Set priority via PC_GETPARMS, update, PC_SETPARMS
3761  // Query current values.
3762  // TODO: accelerate this by eliminating the PC_GETPARMS call.
3763  // Cache "pcparms_t" in global ParmCache.
3764  // TODO: elide set-to-same-value
3765
3766  // If something went wrong on init, don't change priorities.
3767  if ( !priocntl_enable ) {
3768    if (ThreadPriorityVerbose)
3769      tty->print_cr("Trying to set priority but init failed, ignoring");
3770    return EINVAL;
3771  }
3772
3773
3774  // If lwp hasn't started yet, just return
3775  // the _start routine will call us again.
3776  if ( lwpid <= 0 ) {
3777    if (ThreadPriorityVerbose) {
3778      tty->print_cr ("deferring the set_lwp_priority of thread " INTPTR_FORMAT " to %d, lwpid not set",
3779                     ThreadID, newPrio);
3780    }
3781    return 0;
3782  }
3783
3784  if (ThreadPriorityVerbose) {
3785    tty->print_cr ("set_lwp_priority(" INTPTR_FORMAT "@" INTPTR_FORMAT " %d) ",
3786                   ThreadID, lwpid, newPrio);
3787  }
3788
3789  memset(&ParmInfo, 0, sizeof(pcparms_t));
3790  ParmInfo.pc_cid = PC_CLNULL;
3791  rslt = (*priocntl_ptr)(PC_VERSION, P_LWPID, lwpid, PC_GETPARMS, (caddr_t)&ParmInfo);
3792  if (rslt < 0) return errno;
3793
3794  if (ParmInfo.pc_cid == rtLimits.schedPolicy) {
3795    rtparms_t *rtInfo  = (rtparms_t*)ParmInfo.pc_clparms;
3796    rtInfo->rt_pri     = scale_to_lwp_priority (rtLimits.minPrio, rtLimits.maxPrio, newPrio);
3797    rtInfo->rt_tqsecs  = RT_NOCHANGE;
3798    rtInfo->rt_tqnsecs = RT_NOCHANGE;
3799    if (ThreadPriorityVerbose) {
3800      tty->print_cr("RT: %d->%d\n", newPrio, rtInfo->rt_pri);
3801    }
3802  } else if (ParmInfo.pc_cid == iaLimits.schedPolicy) {
3803    iaparms_t *iaInfo  = (iaparms_t*)ParmInfo.pc_clparms;
3804    int maxClamped     = MIN2(iaLimits.maxPrio, (int)iaInfo->ia_uprilim);
3805    iaInfo->ia_upri    = scale_to_lwp_priority(iaLimits.minPrio, maxClamped, newPrio);
3806    iaInfo->ia_uprilim = IA_NOCHANGE;
3807    iaInfo->ia_mode    = IA_NOCHANGE;
3808    if (ThreadPriorityVerbose) {
3809      tty->print_cr ("IA: [%d...%d] %d->%d\n",
3810               iaLimits.minPrio, maxClamped, newPrio, iaInfo->ia_upri);
3811    }
3812  } else if (ParmInfo.pc_cid == tsLimits.schedPolicy) {
3813    tsparms_t *tsInfo  = (tsparms_t*)ParmInfo.pc_clparms;
3814    int maxClamped     = MIN2(tsLimits.maxPrio, (int)tsInfo->ts_uprilim);
3815    prv                = tsInfo->ts_upri;
3816    tsInfo->ts_upri    = scale_to_lwp_priority(tsLimits.minPrio, maxClamped, newPrio);
3817    tsInfo->ts_uprilim = IA_NOCHANGE;
3818    if (ThreadPriorityVerbose) {
3819      tty->print_cr ("TS: %d [%d...%d] %d->%d\n",
3820               prv, tsLimits.minPrio, maxClamped, newPrio, tsInfo->ts_upri);
3821    }
3822    if (prv == tsInfo->ts_upri) return 0;
3823  } else {
3824    if ( ThreadPriorityVerbose ) {
3825      tty->print_cr ("Unknown scheduling class\n");
3826    }
3827      return EINVAL;    // no clue, punt
3828  }
3829
3830  rslt = (*priocntl_ptr)(PC_VERSION, P_LWPID, lwpid, PC_SETPARMS, (caddr_t)&ParmInfo);
3831  if (ThreadPriorityVerbose && rslt) {
3832    tty->print_cr ("PC_SETPARMS ->%d %d\n", rslt, errno);
3833  }
3834  if (rslt < 0) return errno;
3835
3836#ifdef ASSERT
3837  // Sanity check: read back what we just attempted to set.
3838  // In theory it could have changed in the interim ...
3839  //
3840  // The priocntl system call is tricky.
3841  // Sometimes it'll validate the priority value argument and
3842  // return EINVAL if unhappy.  At other times it fails silently.
3843  // Readbacks are prudent.
3844
3845  if (!ReadBackValidate) return 0;
3846
3847  memset(&ReadBack, 0, sizeof(pcparms_t));
3848  ReadBack.pc_cid = PC_CLNULL;
3849  rslt = (*priocntl_ptr)(PC_VERSION, P_LWPID, lwpid, PC_GETPARMS, (caddr_t)&ReadBack);
3850  assert(rslt >= 0, "priocntl failed");
3851  Actual = Expected = 0xBAD;
3852  assert(ParmInfo.pc_cid == ReadBack.pc_cid, "cid's don't match");
3853  if (ParmInfo.pc_cid == rtLimits.schedPolicy) {
3854    Actual   = RTPRI(ReadBack)->rt_pri;
3855    Expected = RTPRI(ParmInfo)->rt_pri;
3856  } else if (ParmInfo.pc_cid == iaLimits.schedPolicy) {
3857    Actual   = IAPRI(ReadBack)->ia_upri;
3858    Expected = IAPRI(ParmInfo)->ia_upri;
3859  } else if (ParmInfo.pc_cid == tsLimits.schedPolicy) {
3860    Actual   = TSPRI(ReadBack)->ts_upri;
3861    Expected = TSPRI(ParmInfo)->ts_upri;
3862  } else {
3863    if ( ThreadPriorityVerbose ) {
3864      tty->print_cr("set_lwp_priority: unexpected class in readback: %d\n", ParmInfo.pc_cid);
3865    }
3866  }
3867
3868  if (Actual != Expected) {
3869    if ( ThreadPriorityVerbose ) {
3870      tty->print_cr ("set_lwp_priority(%d %d) Class=%d: actual=%d vs expected=%d\n",
3871             lwpid, newPrio, ReadBack.pc_cid, Actual, Expected);
3872    }
3873  }
3874#endif
3875
3876  return 0;
3877}
3878
3879
3880
3881// Solaris only gives access to 128 real priorities at a time,
3882// so we expand Java's ten to fill this range.  This would be better
3883// if we dynamically adjusted relative priorities.
3884//
3885// The ThreadPriorityPolicy option allows us to select 2 different
3886// priority scales.
3887//
3888// ThreadPriorityPolicy=0
3889// Since the Solaris' default priority is MaximumPriority, we do not
3890// set a priority lower than Max unless a priority lower than
3891// NormPriority is requested.
3892//
3893// ThreadPriorityPolicy=1
3894// This mode causes the priority table to get filled with
3895// linear values.  NormPriority get's mapped to 50% of the
3896// Maximum priority an so on.  This will cause VM threads
3897// to get unfair treatment against other Solaris processes
3898// which do not explicitly alter their thread priorities.
3899//
3900
3901
3902int os::java_to_os_priority[MaxPriority + 1] = {
3903  -99999,         // 0 Entry should never be used
3904
3905  0,              // 1 MinPriority
3906  32,             // 2
3907  64,             // 3
3908
3909  96,             // 4
3910  127,            // 5 NormPriority
3911  127,            // 6
3912
3913  127,            // 7
3914  127,            // 8
3915  127,            // 9 NearMaxPriority
3916
3917  127             // 10 MaxPriority
3918};
3919
3920
3921OSReturn os::set_native_priority(Thread* thread, int newpri) {
3922  assert(newpri >= MinimumPriority && newpri <= MaximumPriority, "bad priority mapping");
3923  if ( !UseThreadPriorities ) return OS_OK;
3924  int status = thr_setprio(thread->osthread()->thread_id(), newpri);
3925  if ( os::Solaris::T2_libthread() || (UseBoundThreads && thread->osthread()->is_vm_created()) )
3926    status |= (set_lwp_priority (thread->osthread()->thread_id(),
3927                    thread->osthread()->lwp_id(), newpri ));
3928  return (status == 0) ? OS_OK : OS_ERR;
3929}
3930
3931
3932OSReturn os::get_native_priority(const Thread* const thread, int *priority_ptr) {
3933  int p;
3934  if ( !UseThreadPriorities ) {
3935    *priority_ptr = NormalPriority;
3936    return OS_OK;
3937  }
3938  int status = thr_getprio(thread->osthread()->thread_id(), &p);
3939  if (status != 0) {
3940    return OS_ERR;
3941  }
3942  *priority_ptr = p;
3943  return OS_OK;
3944}
3945
3946
3947// Hint to the underlying OS that a task switch would not be good.
3948// Void return because it's a hint and can fail.
3949void os::hint_no_preempt() {
3950  schedctl_start(schedctl_init());
3951}
3952
3953void os::interrupt(Thread* thread) {
3954  assert(Thread::current() == thread || Threads_lock->owned_by_self(), "possibility of dangling Thread pointer");
3955
3956  OSThread* osthread = thread->osthread();
3957
3958  int isInterrupted = osthread->interrupted();
3959  if (!isInterrupted) {
3960      osthread->set_interrupted(true);
3961      OrderAccess::fence();
3962      // os::sleep() is implemented with either poll (NULL,0,timeout) or
3963      // by parking on _SleepEvent.  If the former, thr_kill will unwedge
3964      // the sleeper by SIGINTR, otherwise the unpark() will wake the sleeper.
3965      ParkEvent * const slp = thread->_SleepEvent ;
3966      if (slp != NULL) slp->unpark() ;
3967  }
3968
3969  // For JSR166:  unpark after setting status but before thr_kill -dl
3970  if (thread->is_Java_thread()) {
3971    ((JavaThread*)thread)->parker()->unpark();
3972  }
3973
3974  // Handle interruptible wait() ...
3975  ParkEvent * const ev = thread->_ParkEvent ;
3976  if (ev != NULL) ev->unpark() ;
3977
3978  // When events are used everywhere for os::sleep, then this thr_kill
3979  // will only be needed if UseVMInterruptibleIO is true.
3980
3981  if (!isInterrupted) {
3982    int status = thr_kill(osthread->thread_id(), os::Solaris::SIGinterrupt());
3983    assert_status(status == 0, status, "thr_kill");
3984
3985    // Bump thread interruption counter
3986    RuntimeService::record_thread_interrupt_signaled_count();
3987  }
3988}
3989
3990
3991bool os::is_interrupted(Thread* thread, bool clear_interrupted) {
3992  assert(Thread::current() == thread || Threads_lock->owned_by_self(), "possibility of dangling Thread pointer");
3993
3994  OSThread* osthread = thread->osthread();
3995
3996  bool res = osthread->interrupted();
3997
3998  // NOTE that since there is no "lock" around these two operations,
3999  // there is the possibility that the interrupted flag will be
4000  // "false" but that the interrupt event will be set. This is
4001  // intentional. The effect of this is that Object.wait() will appear
4002  // to have a spurious wakeup, which is not harmful, and the
4003  // possibility is so rare that it is not worth the added complexity
4004  // to add yet another lock. It has also been recommended not to put
4005  // the interrupted flag into the os::Solaris::Event structure,
4006  // because it hides the issue.
4007  if (res && clear_interrupted) {
4008    osthread->set_interrupted(false);
4009  }
4010  return res;
4011}
4012
4013
4014void os::print_statistics() {
4015}
4016
4017int os::message_box(const char* title, const char* message) {
4018  int i;
4019  fdStream err(defaultStream::error_fd());
4020  for (i = 0; i < 78; i++) err.print_raw("=");
4021  err.cr();
4022  err.print_raw_cr(title);
4023  for (i = 0; i < 78; i++) err.print_raw("-");
4024  err.cr();
4025  err.print_raw_cr(message);
4026  for (i = 0; i < 78; i++) err.print_raw("=");
4027  err.cr();
4028
4029  char buf[16];
4030  // Prevent process from exiting upon "read error" without consuming all CPU
4031  while (::read(0, buf, sizeof(buf)) <= 0) { ::sleep(100); }
4032
4033  return buf[0] == 'y' || buf[0] == 'Y';
4034}
4035
4036// A lightweight implementation that does not suspend the target thread and
4037// thus returns only a hint. Used for profiling only!
4038ExtendedPC os::get_thread_pc(Thread* thread) {
4039  // Make sure that it is called by the watcher and the Threads lock is owned.
4040  assert(Thread::current()->is_Watcher_thread(), "Must be watcher and own Threads_lock");
4041  // For now, is only used to profile the VM Thread
4042  assert(thread->is_VM_thread(), "Can only be called for VMThread");
4043  ExtendedPC epc;
4044
4045  GetThreadPC_Callback  cb(ProfileVM_lock);
4046  OSThread *osthread = thread->osthread();
4047  const int time_to_wait = 400; // 400ms wait for initial response
4048  int status = cb.interrupt(thread, time_to_wait);
4049
4050  if (cb.is_done() ) {
4051    epc = cb.addr();
4052  } else {
4053    DEBUG_ONLY(tty->print_cr("Failed to get pc for thread: %d got %d status",
4054                              osthread->thread_id(), status););
4055    // epc is already NULL
4056  }
4057  return epc;
4058}
4059
4060
4061// This does not do anything on Solaris. This is basically a hook for being
4062// able to use structured exception handling (thread-local exception filters) on, e.g., Win32.
4063void os::os_exception_wrapper(java_call_t f, JavaValue* value, methodHandle* method, JavaCallArguments* args, Thread* thread) {
4064  f(value, method, args, thread);
4065}
4066
4067// This routine may be used by user applications as a "hook" to catch signals.
4068// The user-defined signal handler must pass unrecognized signals to this
4069// routine, and if it returns true (non-zero), then the signal handler must
4070// return immediately.  If the flag "abort_if_unrecognized" is true, then this
4071// routine will never retun false (zero), but instead will execute a VM panic
4072// routine kill the process.
4073//
4074// If this routine returns false, it is OK to call it again.  This allows
4075// the user-defined signal handler to perform checks either before or after
4076// the VM performs its own checks.  Naturally, the user code would be making
4077// a serious error if it tried to handle an exception (such as a null check
4078// or breakpoint) that the VM was generating for its own correct operation.
4079//
4080// This routine may recognize any of the following kinds of signals:
4081// SIGBUS, SIGSEGV, SIGILL, SIGFPE, BREAK_SIGNAL, SIGPIPE, SIGXFSZ,
4082// os::Solaris::SIGasync
4083// It should be consulted by handlers for any of those signals.
4084// It explicitly does not recognize os::Solaris::SIGinterrupt
4085//
4086// The caller of this routine must pass in the three arguments supplied
4087// to the function referred to in the "sa_sigaction" (not the "sa_handler")
4088// field of the structure passed to sigaction().  This routine assumes that
4089// the sa_flags field passed to sigaction() includes SA_SIGINFO and SA_RESTART.
4090//
4091// Note that the VM will print warnings if it detects conflicting signal
4092// handlers, unless invoked with the option "-XX:+AllowUserSignalHandlers".
4093//
4094extern "C" int JVM_handle_solaris_signal(int signo, siginfo_t* siginfo, void* ucontext, int abort_if_unrecognized);
4095
4096
4097void signalHandler(int sig, siginfo_t* info, void* ucVoid) {
4098  JVM_handle_solaris_signal(sig, info, ucVoid, true);
4099}
4100
4101/* Do not delete - if guarantee is ever removed,  a signal handler (even empty)
4102   is needed to provoke threads blocked on IO to return an EINTR
4103   Note: this explicitly does NOT call JVM_handle_solaris_signal and
4104   does NOT participate in signal chaining due to requirement for
4105   NOT setting SA_RESTART to make EINTR work. */
4106extern "C" void sigINTRHandler(int sig, siginfo_t* info, void* ucVoid) {
4107   if (UseSignalChaining) {
4108      struct sigaction *actp = os::Solaris::get_chained_signal_action(sig);
4109      if (actp && actp->sa_handler) {
4110        vm_exit_during_initialization("Signal chaining detected for VM interrupt signal, try -XX:+UseAltSigs");
4111      }
4112   }
4113}
4114
4115// This boolean allows users to forward their own non-matching signals
4116// to JVM_handle_solaris_signal, harmlessly.
4117bool os::Solaris::signal_handlers_are_installed = false;
4118
4119// For signal-chaining
4120bool os::Solaris::libjsig_is_loaded = false;
4121typedef struct sigaction *(*get_signal_t)(int);
4122get_signal_t os::Solaris::get_signal_action = NULL;
4123
4124struct sigaction* os::Solaris::get_chained_signal_action(int sig) {
4125  struct sigaction *actp = NULL;
4126
4127  if ((libjsig_is_loaded)  && (sig <= Maxlibjsigsigs)) {
4128    // Retrieve the old signal handler from libjsig
4129    actp = (*get_signal_action)(sig);
4130  }
4131  if (actp == NULL) {
4132    // Retrieve the preinstalled signal handler from jvm
4133    actp = get_preinstalled_handler(sig);
4134  }
4135
4136  return actp;
4137}
4138
4139static bool call_chained_handler(struct sigaction *actp, int sig,
4140                                 siginfo_t *siginfo, void *context) {
4141  // Call the old signal handler
4142  if (actp->sa_handler == SIG_DFL) {
4143    // It's more reasonable to let jvm treat it as an unexpected exception
4144    // instead of taking the default action.
4145    return false;
4146  } else if (actp->sa_handler != SIG_IGN) {
4147    if ((actp->sa_flags & SA_NODEFER) == 0) {
4148      // automaticlly block the signal
4149      sigaddset(&(actp->sa_mask), sig);
4150    }
4151
4152    sa_handler_t hand;
4153    sa_sigaction_t sa;
4154    bool siginfo_flag_set = (actp->sa_flags & SA_SIGINFO) != 0;
4155    // retrieve the chained handler
4156    if (siginfo_flag_set) {
4157      sa = actp->sa_sigaction;
4158    } else {
4159      hand = actp->sa_handler;
4160    }
4161
4162    if ((actp->sa_flags & SA_RESETHAND) != 0) {
4163      actp->sa_handler = SIG_DFL;
4164    }
4165
4166    // try to honor the signal mask
4167    sigset_t oset;
4168    thr_sigsetmask(SIG_SETMASK, &(actp->sa_mask), &oset);
4169
4170    // call into the chained handler
4171    if (siginfo_flag_set) {
4172      (*sa)(sig, siginfo, context);
4173    } else {
4174      (*hand)(sig);
4175    }
4176
4177    // restore the signal mask
4178    thr_sigsetmask(SIG_SETMASK, &oset, 0);
4179  }
4180  // Tell jvm's signal handler the signal is taken care of.
4181  return true;
4182}
4183
4184bool os::Solaris::chained_handler(int sig, siginfo_t* siginfo, void* context) {
4185  bool chained = false;
4186  // signal-chaining
4187  if (UseSignalChaining) {
4188    struct sigaction *actp = get_chained_signal_action(sig);
4189    if (actp != NULL) {
4190      chained = call_chained_handler(actp, sig, siginfo, context);
4191    }
4192  }
4193  return chained;
4194}
4195
4196struct sigaction* os::Solaris::get_preinstalled_handler(int sig) {
4197  assert((chainedsigactions != (struct sigaction *)NULL) && (preinstalled_sigs != (int *)NULL) , "signals not yet initialized");
4198  if (preinstalled_sigs[sig] != 0) {
4199    return &chainedsigactions[sig];
4200  }
4201  return NULL;
4202}
4203
4204void os::Solaris::save_preinstalled_handler(int sig, struct sigaction& oldAct) {
4205
4206  assert(sig > 0 && sig <= Maxsignum, "vm signal out of expected range");
4207  assert((chainedsigactions != (struct sigaction *)NULL) && (preinstalled_sigs != (int *)NULL) , "signals not yet initialized");
4208  chainedsigactions[sig] = oldAct;
4209  preinstalled_sigs[sig] = 1;
4210}
4211
4212void os::Solaris::set_signal_handler(int sig, bool set_installed, bool oktochain) {
4213  // Check for overwrite.
4214  struct sigaction oldAct;
4215  sigaction(sig, (struct sigaction*)NULL, &oldAct);
4216  void* oldhand = oldAct.sa_sigaction ? CAST_FROM_FN_PTR(void*,  oldAct.sa_sigaction)
4217                                      : CAST_FROM_FN_PTR(void*,  oldAct.sa_handler);
4218  if (oldhand != CAST_FROM_FN_PTR(void*, SIG_DFL) &&
4219      oldhand != CAST_FROM_FN_PTR(void*, SIG_IGN) &&
4220      oldhand != CAST_FROM_FN_PTR(void*, signalHandler)) {
4221    if (AllowUserSignalHandlers || !set_installed) {
4222      // Do not overwrite; user takes responsibility to forward to us.
4223      return;
4224    } else if (UseSignalChaining) {
4225      if (oktochain) {
4226        // save the old handler in jvm
4227        save_preinstalled_handler(sig, oldAct);
4228      } else {
4229        vm_exit_during_initialization("Signal chaining not allowed for VM interrupt signal, try -XX:+UseAltSigs.");
4230      }
4231      // libjsig also interposes the sigaction() call below and saves the
4232      // old sigaction on it own.
4233    } else {
4234      fatal2("Encountered unexpected pre-existing sigaction handler %#lx for signal %d.", (long)oldhand, sig);
4235    }
4236  }
4237
4238  struct sigaction sigAct;
4239  sigfillset(&(sigAct.sa_mask));
4240  sigAct.sa_handler = SIG_DFL;
4241
4242  sigAct.sa_sigaction = signalHandler;
4243  // Handle SIGSEGV on alternate signal stack if
4244  // not using stack banging
4245  if (!UseStackBanging && sig == SIGSEGV) {
4246    sigAct.sa_flags = SA_SIGINFO | SA_RESTART | SA_ONSTACK;
4247  // Interruptible i/o requires SA_RESTART cleared so EINTR
4248  // is returned instead of restarting system calls
4249  } else if (sig == os::Solaris::SIGinterrupt()) {
4250    sigemptyset(&sigAct.sa_mask);
4251    sigAct.sa_handler = NULL;
4252    sigAct.sa_flags = SA_SIGINFO;
4253    sigAct.sa_sigaction = sigINTRHandler;
4254  } else {
4255    sigAct.sa_flags = SA_SIGINFO | SA_RESTART;
4256  }
4257  os::Solaris::set_our_sigflags(sig, sigAct.sa_flags);
4258
4259  sigaction(sig, &sigAct, &oldAct);
4260
4261  void* oldhand2 = oldAct.sa_sigaction ? CAST_FROM_FN_PTR(void*, oldAct.sa_sigaction)
4262                                       : CAST_FROM_FN_PTR(void*, oldAct.sa_handler);
4263  assert(oldhand2 == oldhand, "no concurrent signal handler installation");
4264}
4265
4266
4267#define DO_SIGNAL_CHECK(sig) \
4268  if (!sigismember(&check_signal_done, sig)) \
4269    os::Solaris::check_signal_handler(sig)
4270
4271// This method is a periodic task to check for misbehaving JNI applications
4272// under CheckJNI, we can add any periodic checks here
4273
4274void os::run_periodic_checks() {
4275  // A big source of grief is hijacking virt. addr 0x0 on Solaris,
4276  // thereby preventing a NULL checks.
4277  if(!check_addr0_done) check_addr0_done = check_addr0(tty);
4278
4279  if (check_signals == false) return;
4280
4281  // SEGV and BUS if overridden could potentially prevent
4282  // generation of hs*.log in the event of a crash, debugging
4283  // such a case can be very challenging, so we absolutely
4284  // check for the following for a good measure:
4285  DO_SIGNAL_CHECK(SIGSEGV);
4286  DO_SIGNAL_CHECK(SIGILL);
4287  DO_SIGNAL_CHECK(SIGFPE);
4288  DO_SIGNAL_CHECK(SIGBUS);
4289  DO_SIGNAL_CHECK(SIGPIPE);
4290  DO_SIGNAL_CHECK(SIGXFSZ);
4291
4292  // ReduceSignalUsage allows the user to override these handlers
4293  // see comments at the very top and jvm_solaris.h
4294  if (!ReduceSignalUsage) {
4295    DO_SIGNAL_CHECK(SHUTDOWN1_SIGNAL);
4296    DO_SIGNAL_CHECK(SHUTDOWN2_SIGNAL);
4297    DO_SIGNAL_CHECK(SHUTDOWN3_SIGNAL);
4298    DO_SIGNAL_CHECK(BREAK_SIGNAL);
4299  }
4300
4301  // See comments above for using JVM1/JVM2 and UseAltSigs
4302  DO_SIGNAL_CHECK(os::Solaris::SIGinterrupt());
4303  DO_SIGNAL_CHECK(os::Solaris::SIGasync());
4304
4305}
4306
4307typedef int (*os_sigaction_t)(int, const struct sigaction *, struct sigaction *);
4308
4309static os_sigaction_t os_sigaction = NULL;
4310
4311void os::Solaris::check_signal_handler(int sig) {
4312  char buf[O_BUFLEN];
4313  address jvmHandler = NULL;
4314
4315  struct sigaction act;
4316  if (os_sigaction == NULL) {
4317    // only trust the default sigaction, in case it has been interposed
4318    os_sigaction = (os_sigaction_t)dlsym(RTLD_DEFAULT, "sigaction");
4319    if (os_sigaction == NULL) return;
4320  }
4321
4322  os_sigaction(sig, (struct sigaction*)NULL, &act);
4323
4324  address thisHandler = (act.sa_flags & SA_SIGINFO)
4325    ? CAST_FROM_FN_PTR(address, act.sa_sigaction)
4326    : CAST_FROM_FN_PTR(address, act.sa_handler) ;
4327
4328
4329  switch(sig) {
4330    case SIGSEGV:
4331    case SIGBUS:
4332    case SIGFPE:
4333    case SIGPIPE:
4334    case SIGXFSZ:
4335    case SIGILL:
4336      jvmHandler = CAST_FROM_FN_PTR(address, signalHandler);
4337      break;
4338
4339    case SHUTDOWN1_SIGNAL:
4340    case SHUTDOWN2_SIGNAL:
4341    case SHUTDOWN3_SIGNAL:
4342    case BREAK_SIGNAL:
4343      jvmHandler = (address)user_handler();
4344      break;
4345
4346    default:
4347      int intrsig = os::Solaris::SIGinterrupt();
4348      int asynsig = os::Solaris::SIGasync();
4349
4350      if (sig == intrsig) {
4351        jvmHandler = CAST_FROM_FN_PTR(address, sigINTRHandler);
4352      } else if (sig == asynsig) {
4353        jvmHandler = CAST_FROM_FN_PTR(address, signalHandler);
4354      } else {
4355        return;
4356      }
4357      break;
4358  }
4359
4360
4361  if (thisHandler != jvmHandler) {
4362    tty->print("Warning: %s handler ", exception_name(sig, buf, O_BUFLEN));
4363    tty->print("expected:%s", get_signal_handler_name(jvmHandler, buf, O_BUFLEN));
4364    tty->print_cr("  found:%s", get_signal_handler_name(thisHandler, buf, O_BUFLEN));
4365    // No need to check this sig any longer
4366    sigaddset(&check_signal_done, sig);
4367  } else if(os::Solaris::get_our_sigflags(sig) != 0 && act.sa_flags != os::Solaris::get_our_sigflags(sig)) {
4368    tty->print("Warning: %s handler flags ", exception_name(sig, buf, O_BUFLEN));
4369    tty->print("expected:" PTR32_FORMAT, os::Solaris::get_our_sigflags(sig));
4370    tty->print_cr("  found:" PTR32_FORMAT, act.sa_flags);
4371    // No need to check this sig any longer
4372    sigaddset(&check_signal_done, sig);
4373  }
4374
4375  // Print all the signal handler state
4376  if (sigismember(&check_signal_done, sig)) {
4377    print_signal_handlers(tty, buf, O_BUFLEN);
4378  }
4379
4380}
4381
4382void os::Solaris::install_signal_handlers() {
4383  bool libjsigdone = false;
4384  signal_handlers_are_installed = true;
4385
4386  // signal-chaining
4387  typedef void (*signal_setting_t)();
4388  signal_setting_t begin_signal_setting = NULL;
4389  signal_setting_t end_signal_setting = NULL;
4390  begin_signal_setting = CAST_TO_FN_PTR(signal_setting_t,
4391                                        dlsym(RTLD_DEFAULT, "JVM_begin_signal_setting"));
4392  if (begin_signal_setting != NULL) {
4393    end_signal_setting = CAST_TO_FN_PTR(signal_setting_t,
4394                                        dlsym(RTLD_DEFAULT, "JVM_end_signal_setting"));
4395    get_signal_action = CAST_TO_FN_PTR(get_signal_t,
4396                                       dlsym(RTLD_DEFAULT, "JVM_get_signal_action"));
4397    get_libjsig_version = CAST_TO_FN_PTR(version_getting_t,
4398                                         dlsym(RTLD_DEFAULT, "JVM_get_libjsig_version"));
4399    libjsig_is_loaded = true;
4400    if (os::Solaris::get_libjsig_version != NULL) {
4401      libjsigversion =  (*os::Solaris::get_libjsig_version)();
4402    }
4403    assert(UseSignalChaining, "should enable signal-chaining");
4404  }
4405  if (libjsig_is_loaded) {
4406    // Tell libjsig jvm is setting signal handlers
4407    (*begin_signal_setting)();
4408  }
4409
4410  set_signal_handler(SIGSEGV, true, true);
4411  set_signal_handler(SIGPIPE, true, true);
4412  set_signal_handler(SIGXFSZ, true, true);
4413  set_signal_handler(SIGBUS, true, true);
4414  set_signal_handler(SIGILL, true, true);
4415  set_signal_handler(SIGFPE, true, true);
4416
4417
4418  if (os::Solaris::SIGinterrupt() > OLDMAXSIGNUM || os::Solaris::SIGasync() > OLDMAXSIGNUM) {
4419
4420    // Pre-1.4.1 Libjsig limited to signal chaining signals <= 32 so
4421    // can not register overridable signals which might be > 32
4422    if (libjsig_is_loaded && libjsigversion <= JSIG_VERSION_1_4_1) {
4423    // Tell libjsig jvm has finished setting signal handlers
4424      (*end_signal_setting)();
4425      libjsigdone = true;
4426    }
4427  }
4428
4429  // Never ok to chain our SIGinterrupt
4430  set_signal_handler(os::Solaris::SIGinterrupt(), true, false);
4431  set_signal_handler(os::Solaris::SIGasync(), true, true);
4432
4433  if (libjsig_is_loaded && !libjsigdone) {
4434    // Tell libjsig jvm finishes setting signal handlers
4435    (*end_signal_setting)();
4436  }
4437
4438  // We don't activate signal checker if libjsig is in place, we trust ourselves
4439  // and if UserSignalHandler is installed all bets are off
4440  if (CheckJNICalls) {
4441    if (libjsig_is_loaded) {
4442      tty->print_cr("Info: libjsig is activated, all active signal checking is disabled");
4443      check_signals = false;
4444    }
4445    if (AllowUserSignalHandlers) {
4446      tty->print_cr("Info: AllowUserSignalHandlers is activated, all active signal checking is disabled");
4447      check_signals = false;
4448    }
4449  }
4450}
4451
4452
4453void report_error(const char* file_name, int line_no, const char* title, const char* format, ...);
4454
4455const char * signames[] = {
4456  "SIG0",
4457  "SIGHUP", "SIGINT", "SIGQUIT", "SIGILL", "SIGTRAP",
4458  "SIGABRT", "SIGEMT", "SIGFPE", "SIGKILL", "SIGBUS",
4459  "SIGSEGV", "SIGSYS", "SIGPIPE", "SIGALRM", "SIGTERM",
4460  "SIGUSR1", "SIGUSR2", "SIGCLD", "SIGPWR", "SIGWINCH",
4461  "SIGURG", "SIGPOLL", "SIGSTOP", "SIGTSTP", "SIGCONT",
4462  "SIGTTIN", "SIGTTOU", "SIGVTALRM", "SIGPROF", "SIGXCPU",
4463  "SIGXFSZ", "SIGWAITING", "SIGLWP", "SIGFREEZE", "SIGTHAW",
4464  "SIGCANCEL", "SIGLOST"
4465};
4466
4467const char* os::exception_name(int exception_code, char* buf, size_t size) {
4468  if (0 < exception_code && exception_code <= SIGRTMAX) {
4469    // signal
4470    if (exception_code < sizeof(signames)/sizeof(const char*)) {
4471       jio_snprintf(buf, size, "%s", signames[exception_code]);
4472    } else {
4473       jio_snprintf(buf, size, "SIG%d", exception_code);
4474    }
4475    return buf;
4476  } else {
4477    return NULL;
4478  }
4479}
4480
4481// (Static) wrappers for the new libthread API
4482int_fnP_thread_t_iP_uP_stack_tP_gregset_t os::Solaris::_thr_getstate;
4483int_fnP_thread_t_i_gregset_t os::Solaris::_thr_setstate;
4484int_fnP_thread_t_i os::Solaris::_thr_setmutator;
4485int_fnP_thread_t os::Solaris::_thr_suspend_mutator;
4486int_fnP_thread_t os::Solaris::_thr_continue_mutator;
4487
4488// (Static) wrapper for getisax(2) call.
4489os::Solaris::getisax_func_t os::Solaris::_getisax = 0;
4490
4491// (Static) wrappers for the liblgrp API
4492os::Solaris::lgrp_home_func_t os::Solaris::_lgrp_home;
4493os::Solaris::lgrp_init_func_t os::Solaris::_lgrp_init;
4494os::Solaris::lgrp_fini_func_t os::Solaris::_lgrp_fini;
4495os::Solaris::lgrp_root_func_t os::Solaris::_lgrp_root;
4496os::Solaris::lgrp_children_func_t os::Solaris::_lgrp_children;
4497os::Solaris::lgrp_resources_func_t os::Solaris::_lgrp_resources;
4498os::Solaris::lgrp_nlgrps_func_t os::Solaris::_lgrp_nlgrps;
4499os::Solaris::lgrp_cookie_stale_func_t os::Solaris::_lgrp_cookie_stale;
4500os::Solaris::lgrp_cookie_t os::Solaris::_lgrp_cookie = 0;
4501
4502// (Static) wrapper for meminfo() call.
4503os::Solaris::meminfo_func_t os::Solaris::_meminfo = 0;
4504
4505static address resolve_symbol_lazy(const char* name) {
4506  address addr = (address) dlsym(RTLD_DEFAULT, name);
4507  if(addr == NULL) {
4508    // RTLD_DEFAULT was not defined on some early versions of 2.5.1
4509    addr = (address) dlsym(RTLD_NEXT, name);
4510  }
4511  return addr;
4512}
4513
4514static address resolve_symbol(const char* name) {
4515  address addr = resolve_symbol_lazy(name);
4516  if(addr == NULL) {
4517    fatal(dlerror());
4518  }
4519  return addr;
4520}
4521
4522
4523
4524// isT2_libthread()
4525//
4526// Routine to determine if we are currently using the new T2 libthread.
4527//
4528// We determine if we are using T2 by reading /proc/self/lstatus and
4529// looking for a thread with the ASLWP bit set.  If we find this status
4530// bit set, we must assume that we are NOT using T2.  The T2 team
4531// has approved this algorithm.
4532//
4533// We need to determine if we are running with the new T2 libthread
4534// since setting native thread priorities is handled differently
4535// when using this library.  All threads created using T2 are bound
4536// threads. Calling thr_setprio is meaningless in this case.
4537//
4538bool isT2_libthread() {
4539  static prheader_t * lwpArray = NULL;
4540  static int lwpSize = 0;
4541  static int lwpFile = -1;
4542  lwpstatus_t * that;
4543  char lwpName [128];
4544  bool isT2 = false;
4545
4546#define ADR(x)  ((uintptr_t)(x))
4547#define LWPINDEX(ary,ix)   ((lwpstatus_t *)(((ary)->pr_entsize * (ix)) + (ADR((ary) + 1))))
4548
4549  lwpFile = open("/proc/self/lstatus", O_RDONLY, 0);
4550  if (lwpFile < 0) {
4551      if (ThreadPriorityVerbose) warning ("Couldn't open /proc/self/lstatus\n");
4552      return false;
4553  }
4554  lwpSize = 16*1024;
4555  for (;;) {
4556    lseek (lwpFile, 0, SEEK_SET);
4557    lwpArray = (prheader_t *)NEW_C_HEAP_ARRAY(char, lwpSize);
4558    if (read(lwpFile, lwpArray, lwpSize) < 0) {
4559      if (ThreadPriorityVerbose) warning("Error reading /proc/self/lstatus\n");
4560      break;
4561    }
4562    if ((lwpArray->pr_nent * lwpArray->pr_entsize) <= lwpSize) {
4563       // We got a good snapshot - now iterate over the list.
4564      int aslwpcount = 0;
4565      for (int i = 0; i < lwpArray->pr_nent; i++ ) {
4566        that = LWPINDEX(lwpArray,i);
4567        if (that->pr_flags & PR_ASLWP) {
4568          aslwpcount++;
4569        }
4570      }
4571      if (aslwpcount == 0) isT2 = true;
4572      break;
4573    }
4574    lwpSize = lwpArray->pr_nent * lwpArray->pr_entsize;
4575    FREE_C_HEAP_ARRAY(char, lwpArray);  // retry.
4576  }
4577
4578  FREE_C_HEAP_ARRAY(char, lwpArray);
4579  close (lwpFile);
4580  if (ThreadPriorityVerbose) {
4581    if (isT2) tty->print_cr("We are running with a T2 libthread\n");
4582    else tty->print_cr("We are not running with a T2 libthread\n");
4583  }
4584  return isT2;
4585}
4586
4587
4588void os::Solaris::libthread_init() {
4589  address func = (address)dlsym(RTLD_DEFAULT, "_thr_suspend_allmutators");
4590
4591  // Determine if we are running with the new T2 libthread
4592  os::Solaris::set_T2_libthread(isT2_libthread());
4593
4594  lwp_priocntl_init();
4595
4596  // RTLD_DEFAULT was not defined on some early versions of 5.5.1
4597  if(func == NULL) {
4598    func = (address) dlsym(RTLD_NEXT, "_thr_suspend_allmutators");
4599    // Guarantee that this VM is running on an new enough OS (5.6 or
4600    // later) that it will have a new enough libthread.so.
4601    guarantee(func != NULL, "libthread.so is too old.");
4602  }
4603
4604  // Initialize the new libthread getstate API wrappers
4605  func = resolve_symbol("thr_getstate");
4606  os::Solaris::set_thr_getstate(CAST_TO_FN_PTR(int_fnP_thread_t_iP_uP_stack_tP_gregset_t, func));
4607
4608  func = resolve_symbol("thr_setstate");
4609  os::Solaris::set_thr_setstate(CAST_TO_FN_PTR(int_fnP_thread_t_i_gregset_t, func));
4610
4611  func = resolve_symbol("thr_setmutator");
4612  os::Solaris::set_thr_setmutator(CAST_TO_FN_PTR(int_fnP_thread_t_i, func));
4613
4614  func = resolve_symbol("thr_suspend_mutator");
4615  os::Solaris::set_thr_suspend_mutator(CAST_TO_FN_PTR(int_fnP_thread_t, func));
4616
4617  func = resolve_symbol("thr_continue_mutator");
4618  os::Solaris::set_thr_continue_mutator(CAST_TO_FN_PTR(int_fnP_thread_t, func));
4619
4620  int size;
4621  void (*handler_info_func)(address *, int *);
4622  handler_info_func = CAST_TO_FN_PTR(void (*)(address *, int *), resolve_symbol("thr_sighndlrinfo"));
4623  handler_info_func(&handler_start, &size);
4624  handler_end = handler_start + size;
4625}
4626
4627
4628int_fnP_mutex_tP os::Solaris::_mutex_lock;
4629int_fnP_mutex_tP os::Solaris::_mutex_trylock;
4630int_fnP_mutex_tP os::Solaris::_mutex_unlock;
4631int_fnP_mutex_tP_i_vP os::Solaris::_mutex_init;
4632int_fnP_mutex_tP os::Solaris::_mutex_destroy;
4633int os::Solaris::_mutex_scope = USYNC_THREAD;
4634
4635int_fnP_cond_tP_mutex_tP_timestruc_tP os::Solaris::_cond_timedwait;
4636int_fnP_cond_tP_mutex_tP os::Solaris::_cond_wait;
4637int_fnP_cond_tP os::Solaris::_cond_signal;
4638int_fnP_cond_tP os::Solaris::_cond_broadcast;
4639int_fnP_cond_tP_i_vP os::Solaris::_cond_init;
4640int_fnP_cond_tP os::Solaris::_cond_destroy;
4641int os::Solaris::_cond_scope = USYNC_THREAD;
4642
4643void os::Solaris::synchronization_init() {
4644  if(UseLWPSynchronization) {
4645    os::Solaris::set_mutex_lock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("_lwp_mutex_lock")));
4646    os::Solaris::set_mutex_trylock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("_lwp_mutex_trylock")));
4647    os::Solaris::set_mutex_unlock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("_lwp_mutex_unlock")));
4648    os::Solaris::set_mutex_init(lwp_mutex_init);
4649    os::Solaris::set_mutex_destroy(lwp_mutex_destroy);
4650    os::Solaris::set_mutex_scope(USYNC_THREAD);
4651
4652    os::Solaris::set_cond_timedwait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP_timestruc_tP, resolve_symbol("_lwp_cond_timedwait")));
4653    os::Solaris::set_cond_wait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP, resolve_symbol("_lwp_cond_wait")));
4654    os::Solaris::set_cond_signal(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("_lwp_cond_signal")));
4655    os::Solaris::set_cond_broadcast(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("_lwp_cond_broadcast")));
4656    os::Solaris::set_cond_init(lwp_cond_init);
4657    os::Solaris::set_cond_destroy(lwp_cond_destroy);
4658    os::Solaris::set_cond_scope(USYNC_THREAD);
4659  }
4660  else {
4661    os::Solaris::set_mutex_scope(USYNC_THREAD);
4662    os::Solaris::set_cond_scope(USYNC_THREAD);
4663
4664    if(UsePthreads) {
4665      os::Solaris::set_mutex_lock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_lock")));
4666      os::Solaris::set_mutex_trylock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_trylock")));
4667      os::Solaris::set_mutex_unlock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_unlock")));
4668      os::Solaris::set_mutex_init(pthread_mutex_default_init);
4669      os::Solaris::set_mutex_destroy(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("pthread_mutex_destroy")));
4670
4671      os::Solaris::set_cond_timedwait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP_timestruc_tP, resolve_symbol("pthread_cond_timedwait")));
4672      os::Solaris::set_cond_wait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP, resolve_symbol("pthread_cond_wait")));
4673      os::Solaris::set_cond_signal(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("pthread_cond_signal")));
4674      os::Solaris::set_cond_broadcast(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("pthread_cond_broadcast")));
4675      os::Solaris::set_cond_init(pthread_cond_default_init);
4676      os::Solaris::set_cond_destroy(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("pthread_cond_destroy")));
4677    }
4678    else {
4679      os::Solaris::set_mutex_lock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("mutex_lock")));
4680      os::Solaris::set_mutex_trylock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("mutex_trylock")));
4681      os::Solaris::set_mutex_unlock(CAST_TO_FN_PTR(int_fnP_mutex_tP, resolve_symbol("mutex_unlock")));
4682      os::Solaris::set_mutex_init(::mutex_init);
4683      os::Solaris::set_mutex_destroy(::mutex_destroy);
4684
4685      os::Solaris::set_cond_timedwait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP_timestruc_tP, resolve_symbol("cond_timedwait")));
4686      os::Solaris::set_cond_wait(CAST_TO_FN_PTR(int_fnP_cond_tP_mutex_tP, resolve_symbol("cond_wait")));
4687      os::Solaris::set_cond_signal(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("cond_signal")));
4688      os::Solaris::set_cond_broadcast(CAST_TO_FN_PTR(int_fnP_cond_tP, resolve_symbol("cond_broadcast")));
4689      os::Solaris::set_cond_init(::cond_init);
4690      os::Solaris::set_cond_destroy(::cond_destroy);
4691    }
4692  }
4693}
4694
4695bool os::Solaris::liblgrp_init() {
4696  void *handle = dlopen("liblgrp.so.1", RTLD_LAZY);
4697  if (handle != NULL) {
4698    os::Solaris::set_lgrp_home(CAST_TO_FN_PTR(lgrp_home_func_t, dlsym(handle, "lgrp_home")));
4699    os::Solaris::set_lgrp_init(CAST_TO_FN_PTR(lgrp_init_func_t, dlsym(handle, "lgrp_init")));
4700    os::Solaris::set_lgrp_fini(CAST_TO_FN_PTR(lgrp_fini_func_t, dlsym(handle, "lgrp_fini")));
4701    os::Solaris::set_lgrp_root(CAST_TO_FN_PTR(lgrp_root_func_t, dlsym(handle, "lgrp_root")));
4702    os::Solaris::set_lgrp_children(CAST_TO_FN_PTR(lgrp_children_func_t, dlsym(handle, "lgrp_children")));
4703    os::Solaris::set_lgrp_resources(CAST_TO_FN_PTR(lgrp_resources_func_t, dlsym(handle, "lgrp_resources")));
4704    os::Solaris::set_lgrp_nlgrps(CAST_TO_FN_PTR(lgrp_nlgrps_func_t, dlsym(handle, "lgrp_nlgrps")));
4705    os::Solaris::set_lgrp_cookie_stale(CAST_TO_FN_PTR(lgrp_cookie_stale_func_t,
4706                                       dlsym(handle, "lgrp_cookie_stale")));
4707
4708    lgrp_cookie_t c = lgrp_init(LGRP_VIEW_CALLER);
4709    set_lgrp_cookie(c);
4710    return true;
4711  }
4712  return false;
4713}
4714
4715void os::Solaris::misc_sym_init() {
4716  address func;
4717
4718  // getisax
4719  func = resolve_symbol_lazy("getisax");
4720  if (func != NULL) {
4721    os::Solaris::_getisax = CAST_TO_FN_PTR(getisax_func_t, func);
4722  }
4723
4724  // meminfo
4725  func = resolve_symbol_lazy("meminfo");
4726  if (func != NULL) {
4727    os::Solaris::set_meminfo(CAST_TO_FN_PTR(meminfo_func_t, func));
4728  }
4729}
4730
4731uint_t os::Solaris::getisax(uint32_t* array, uint_t n) {
4732  assert(_getisax != NULL, "_getisax not set");
4733  return _getisax(array, n);
4734}
4735
4736// Symbol doesn't exist in Solaris 8 pset.h
4737#ifndef PS_MYID
4738#define PS_MYID -3
4739#endif
4740
4741// int pset_getloadavg(psetid_t pset, double loadavg[], int nelem);
4742typedef long (*pset_getloadavg_type)(psetid_t pset, double loadavg[], int nelem);
4743static pset_getloadavg_type pset_getloadavg_ptr = NULL;
4744
4745void init_pset_getloadavg_ptr(void) {
4746  pset_getloadavg_ptr =
4747    (pset_getloadavg_type)dlsym(RTLD_DEFAULT, "pset_getloadavg");
4748  if (PrintMiscellaneous && Verbose && pset_getloadavg_ptr == NULL) {
4749    warning("pset_getloadavg function not found");
4750  }
4751}
4752
4753int os::Solaris::_dev_zero_fd = -1;
4754
4755// this is called _before_ the global arguments have been parsed
4756void os::init(void) {
4757  _initial_pid = getpid();
4758
4759  max_hrtime = first_hrtime = gethrtime();
4760
4761  init_random(1234567);
4762
4763  page_size = sysconf(_SC_PAGESIZE);
4764  if (page_size == -1)
4765    fatal1("os_solaris.cpp: os::init: sysconf failed (%s)", strerror(errno));
4766  init_page_sizes((size_t) page_size);
4767
4768  Solaris::initialize_system_info();
4769
4770  // Initialize misc. symbols as soon as possible, so we can use them
4771  // if we need them.
4772  Solaris::misc_sym_init();
4773
4774  int fd = open("/dev/zero", O_RDWR);
4775  if (fd < 0) {
4776    fatal1("os::init: cannot open /dev/zero (%s)", strerror(errno));
4777  } else {
4778    Solaris::set_dev_zero_fd(fd);
4779
4780    // Close on exec, child won't inherit.
4781    fcntl(fd, F_SETFD, FD_CLOEXEC);
4782  }
4783
4784  clock_tics_per_sec = CLK_TCK;
4785
4786  // check if dladdr1() exists; dladdr1 can provide more information than
4787  // dladdr for os::dll_address_to_function_name. It comes with SunOS 5.9
4788  // and is available on linker patches for 5.7 and 5.8.
4789  // libdl.so must have been loaded, this call is just an entry lookup
4790  void * hdl = dlopen("libdl.so", RTLD_NOW);
4791  if (hdl)
4792    dladdr1_func = CAST_TO_FN_PTR(dladdr1_func_type, dlsym(hdl, "dladdr1"));
4793
4794  // (Solaris only) this switches to calls that actually do locking.
4795  ThreadCritical::initialize();
4796
4797  main_thread = thr_self();
4798
4799  // Constant minimum stack size allowed. It must be at least
4800  // the minimum of what the OS supports (thr_min_stack()), and
4801  // enough to allow the thread to get to user bytecode execution.
4802  Solaris::min_stack_allowed = MAX2(thr_min_stack(), Solaris::min_stack_allowed);
4803  // If the pagesize of the VM is greater than 8K determine the appropriate
4804  // number of initial guard pages.  The user can change this with the
4805  // command line arguments, if needed.
4806  if (vm_page_size() > 8*K) {
4807    StackYellowPages = 1;
4808    StackRedPages = 1;
4809    StackShadowPages = round_to((StackShadowPages*8*K), vm_page_size()) / vm_page_size();
4810  }
4811}
4812
4813// To install functions for atexit system call
4814extern "C" {
4815  static void perfMemory_exit_helper() {
4816    perfMemory_exit();
4817  }
4818}
4819
4820// this is called _after_ the global arguments have been parsed
4821jint os::init_2(void) {
4822  // try to enable extended file IO ASAP, see 6431278
4823  os::Solaris::try_enable_extended_io();
4824
4825  // Allocate a single page and mark it as readable for safepoint polling.  Also
4826  // use this first mmap call to check support for MAP_ALIGN.
4827  address polling_page = (address)Solaris::mmap_chunk((char*)page_size,
4828                                                      page_size,
4829                                                      MAP_PRIVATE | MAP_ALIGN,
4830                                                      PROT_READ);
4831  if (polling_page == NULL) {
4832    has_map_align = false;
4833    polling_page = (address)Solaris::mmap_chunk(NULL, page_size, MAP_PRIVATE,
4834                                                PROT_READ);
4835  }
4836
4837  os::set_polling_page(polling_page);
4838
4839#ifndef PRODUCT
4840  if( Verbose && PrintMiscellaneous )
4841    tty->print("[SafePoint Polling address: " INTPTR_FORMAT "]\n", (intptr_t)polling_page);
4842#endif
4843
4844  if (!UseMembar) {
4845    address mem_serialize_page = (address)Solaris::mmap_chunk( NULL, page_size, MAP_PRIVATE, PROT_READ | PROT_WRITE );
4846    guarantee( mem_serialize_page != NULL, "mmap Failed for memory serialize page");
4847    os::set_memory_serialize_page( mem_serialize_page );
4848
4849#ifndef PRODUCT
4850    if(Verbose && PrintMiscellaneous)
4851      tty->print("[Memory Serialize  Page address: " INTPTR_FORMAT "]\n", (intptr_t)mem_serialize_page);
4852#endif
4853}
4854
4855  FLAG_SET_DEFAULT(UseLargePages, os::large_page_init());
4856
4857  // Check minimum allowable stack size for thread creation and to initialize
4858  // the java system classes, including StackOverflowError - depends on page
4859  // size.  Add a page for compiler2 recursion in main thread.
4860  // Add in BytesPerWord times page size to account for VM stack during
4861  // class initialization depending on 32 or 64 bit VM.
4862  guarantee((Solaris::min_stack_allowed >=
4863    (StackYellowPages+StackRedPages+StackShadowPages+BytesPerWord
4864     COMPILER2_PRESENT(+1)) * page_size),
4865    "need to increase Solaris::min_stack_allowed on this platform");
4866
4867  size_t threadStackSizeInBytes = ThreadStackSize * K;
4868  if (threadStackSizeInBytes != 0 &&
4869    threadStackSizeInBytes < Solaris::min_stack_allowed) {
4870    tty->print_cr("\nThe stack size specified is too small, Specify at least %dk",
4871                  Solaris::min_stack_allowed/K);
4872    return JNI_ERR;
4873  }
4874
4875  // For 64kbps there will be a 64kb page size, which makes
4876  // the usable default stack size quite a bit less.  Increase the
4877  // stack for 64kb (or any > than 8kb) pages, this increases
4878  // virtual memory fragmentation (since we're not creating the
4879  // stack on a power of 2 boundary.  The real fix for this
4880  // should be to fix the guard page mechanism.
4881
4882  if (vm_page_size() > 8*K) {
4883      threadStackSizeInBytes = (threadStackSizeInBytes != 0)
4884         ? threadStackSizeInBytes +
4885           ((StackYellowPages + StackRedPages) * vm_page_size())
4886         : 0;
4887      ThreadStackSize = threadStackSizeInBytes/K;
4888  }
4889
4890  // Make the stack size a multiple of the page size so that
4891  // the yellow/red zones can be guarded.
4892  JavaThread::set_stack_size_at_create(round_to(threadStackSizeInBytes,
4893        vm_page_size()));
4894
4895  Solaris::libthread_init();
4896
4897  if (UseNUMA) {
4898    if (!Solaris::liblgrp_init()) {
4899      UseNUMA = false;
4900    } else {
4901      size_t lgrp_limit = os::numa_get_groups_num();
4902      int *lgrp_ids = NEW_C_HEAP_ARRAY(int, lgrp_limit);
4903      size_t lgrp_num = os::numa_get_leaf_groups(lgrp_ids, lgrp_limit);
4904      FREE_C_HEAP_ARRAY(int, lgrp_ids);
4905      if (lgrp_num < 2) {
4906        // There's only one locality group, disable NUMA.
4907        UseNUMA = false;
4908      }
4909    }
4910    if (!UseNUMA && ForceNUMA) {
4911      UseNUMA = true;
4912    }
4913  }
4914
4915  Solaris::signal_sets_init();
4916  Solaris::init_signal_mem();
4917  Solaris::install_signal_handlers();
4918
4919  if (libjsigversion < JSIG_VERSION_1_4_1) {
4920    Maxlibjsigsigs = OLDMAXSIGNUM;
4921  }
4922
4923  // initialize synchronization primitives to use either thread or
4924  // lwp synchronization (controlled by UseLWPSynchronization)
4925  Solaris::synchronization_init();
4926
4927  if (MaxFDLimit) {
4928    // set the number of file descriptors to max. print out error
4929    // if getrlimit/setrlimit fails but continue regardless.
4930    struct rlimit nbr_files;
4931    int status = getrlimit(RLIMIT_NOFILE, &nbr_files);
4932    if (status != 0) {
4933      if (PrintMiscellaneous && (Verbose || WizardMode))
4934        perror("os::init_2 getrlimit failed");
4935    } else {
4936      nbr_files.rlim_cur = nbr_files.rlim_max;
4937      status = setrlimit(RLIMIT_NOFILE, &nbr_files);
4938      if (status != 0) {
4939        if (PrintMiscellaneous && (Verbose || WizardMode))
4940          perror("os::init_2 setrlimit failed");
4941      }
4942    }
4943  }
4944
4945  // Initialize HPI.
4946  jint hpi_result = hpi::initialize();
4947  if (hpi_result != JNI_OK) {
4948    tty->print_cr("There was an error trying to initialize the HPI library.");
4949    return hpi_result;
4950  }
4951
4952  // Calculate theoretical max. size of Threads to guard gainst
4953  // artifical out-of-memory situations, where all available address-
4954  // space has been reserved by thread stacks. Default stack size is 1Mb.
4955  size_t pre_thread_stack_size = (JavaThread::stack_size_at_create()) ?
4956    JavaThread::stack_size_at_create() : (1*K*K);
4957  assert(pre_thread_stack_size != 0, "Must have a stack");
4958  // Solaris has a maximum of 4Gb of user programs. Calculate the thread limit when
4959  // we should start doing Virtual Memory banging. Currently when the threads will
4960  // have used all but 200Mb of space.
4961  size_t max_address_space = ((unsigned int)4 * K * K * K) - (200 * K * K);
4962  Solaris::_os_thread_limit = max_address_space / pre_thread_stack_size;
4963
4964  // at-exit methods are called in the reverse order of their registration.
4965  // In Solaris 7 and earlier, atexit functions are called on return from
4966  // main or as a result of a call to exit(3C). There can be only 32 of
4967  // these functions registered and atexit() does not set errno. In Solaris
4968  // 8 and later, there is no limit to the number of functions registered
4969  // and atexit() sets errno. In addition, in Solaris 8 and later, atexit
4970  // functions are called upon dlclose(3DL) in addition to return from main
4971  // and exit(3C).
4972
4973  if (PerfAllowAtExitRegistration) {
4974    // only register atexit functions if PerfAllowAtExitRegistration is set.
4975    // atexit functions can be delayed until process exit time, which
4976    // can be problematic for embedded VM situations. Embedded VMs should
4977    // call DestroyJavaVM() to assure that VM resources are released.
4978
4979    // note: perfMemory_exit_helper atexit function may be removed in
4980    // the future if the appropriate cleanup code can be added to the
4981    // VM_Exit VMOperation's doit method.
4982    if (atexit(perfMemory_exit_helper) != 0) {
4983      warning("os::init2 atexit(perfMemory_exit_helper) failed");
4984    }
4985  }
4986
4987  // Init pset_loadavg function pointer
4988  init_pset_getloadavg_ptr();
4989
4990  return JNI_OK;
4991}
4992
4993
4994// Mark the polling page as unreadable
4995void os::make_polling_page_unreadable(void) {
4996  if( mprotect((char *)_polling_page, page_size, PROT_NONE) != 0 )
4997    fatal("Could not disable polling page");
4998};
4999
5000// Mark the polling page as readable
5001void os::make_polling_page_readable(void) {
5002  if( mprotect((char *)_polling_page, page_size, PROT_READ) != 0 )
5003    fatal("Could not enable polling page");
5004};
5005
5006// OS interface.
5007
5008int os::stat(const char *path, struct stat *sbuf) {
5009  char pathbuf[MAX_PATH];
5010  if (strlen(path) > MAX_PATH - 1) {
5011    errno = ENAMETOOLONG;
5012    return -1;
5013  }
5014  hpi::native_path(strcpy(pathbuf, path));
5015  return ::stat(pathbuf, sbuf);
5016}
5017
5018
5019bool os::check_heap(bool force) { return true; }
5020
5021typedef int (*vsnprintf_t)(char* buf, size_t count, const char* fmt, va_list argptr);
5022static vsnprintf_t sol_vsnprintf = NULL;
5023
5024int local_vsnprintf(char* buf, size_t count, const char* fmt, va_list argptr) {
5025  if (!sol_vsnprintf) {
5026    //search  for the named symbol in the objects that were loaded after libjvm
5027    void* where = RTLD_NEXT;
5028    if ((sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "__vsnprintf"))) == NULL)
5029        sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "vsnprintf"));
5030    if (!sol_vsnprintf){
5031      //search  for the named symbol in the objects that were loaded before libjvm
5032      where = RTLD_DEFAULT;
5033      if ((sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "__vsnprintf"))) == NULL)
5034        sol_vsnprintf = CAST_TO_FN_PTR(vsnprintf_t, dlsym(where, "vsnprintf"));
5035      assert(sol_vsnprintf != NULL, "vsnprintf not found");
5036    }
5037  }
5038  return (*sol_vsnprintf)(buf, count, fmt, argptr);
5039}
5040
5041
5042// Is a (classpath) directory empty?
5043bool os::dir_is_empty(const char* path) {
5044  DIR *dir = NULL;
5045  struct dirent *ptr;
5046
5047  dir = opendir(path);
5048  if (dir == NULL) return true;
5049
5050  /* Scan the directory */
5051  bool result = true;
5052  char buf[sizeof(struct dirent) + MAX_PATH];
5053  struct dirent *dbuf = (struct dirent *) buf;
5054  while (result && (ptr = readdir(dir, dbuf)) != NULL) {
5055    if (strcmp(ptr->d_name, ".") != 0 && strcmp(ptr->d_name, "..") != 0) {
5056      result = false;
5057    }
5058  }
5059  closedir(dir);
5060  return result;
5061}
5062
5063// create binary file, rewriting existing file if required
5064int os::create_binary_file(const char* path, bool rewrite_existing) {
5065  int oflags = O_WRONLY | O_CREAT;
5066  if (!rewrite_existing) {
5067    oflags |= O_EXCL;
5068  }
5069  return ::open64(path, oflags, S_IREAD | S_IWRITE);
5070}
5071
5072// return current position of file pointer
5073jlong os::current_file_offset(int fd) {
5074  return (jlong)::lseek64(fd, (off64_t)0, SEEK_CUR);
5075}
5076
5077// move file pointer to the specified offset
5078jlong os::seek_to_file_offset(int fd, jlong offset) {
5079  return (jlong)::lseek64(fd, (off64_t)offset, SEEK_SET);
5080}
5081
5082// Map a block of memory.
5083char* os::map_memory(int fd, const char* file_name, size_t file_offset,
5084                     char *addr, size_t bytes, bool read_only,
5085                     bool allow_exec) {
5086  int prot;
5087  int flags;
5088
5089  if (read_only) {
5090    prot = PROT_READ;
5091    flags = MAP_SHARED;
5092  } else {
5093    prot = PROT_READ | PROT_WRITE;
5094    flags = MAP_PRIVATE;
5095  }
5096
5097  if (allow_exec) {
5098    prot |= PROT_EXEC;
5099  }
5100
5101  if (addr != NULL) {
5102    flags |= MAP_FIXED;
5103  }
5104
5105  char* mapped_address = (char*)mmap(addr, (size_t)bytes, prot, flags,
5106                                     fd, file_offset);
5107  if (mapped_address == MAP_FAILED) {
5108    return NULL;
5109  }
5110  return mapped_address;
5111}
5112
5113
5114// Remap a block of memory.
5115char* os::remap_memory(int fd, const char* file_name, size_t file_offset,
5116                       char *addr, size_t bytes, bool read_only,
5117                       bool allow_exec) {
5118  // same as map_memory() on this OS
5119  return os::map_memory(fd, file_name, file_offset, addr, bytes, read_only,
5120                        allow_exec);
5121}
5122
5123
5124// Unmap a block of memory.
5125bool os::unmap_memory(char* addr, size_t bytes) {
5126  return munmap(addr, bytes) == 0;
5127}
5128
5129void os::pause() {
5130  char filename[MAX_PATH];
5131  if (PauseAtStartupFile && PauseAtStartupFile[0]) {
5132    jio_snprintf(filename, MAX_PATH, PauseAtStartupFile);
5133  } else {
5134    jio_snprintf(filename, MAX_PATH, "./vm.paused.%d", current_process_id());
5135  }
5136
5137  int fd = ::open(filename, O_WRONLY | O_CREAT | O_TRUNC, 0666);
5138  if (fd != -1) {
5139    struct stat buf;
5140    close(fd);
5141    while (::stat(filename, &buf) == 0) {
5142      (void)::poll(NULL, 0, 100);
5143    }
5144  } else {
5145    jio_fprintf(stderr,
5146      "Could not open pause file '%s', continuing immediately.\n", filename);
5147  }
5148}
5149
5150#ifndef PRODUCT
5151#ifdef INTERPOSE_ON_SYSTEM_SYNCH_FUNCTIONS
5152// Turn this on if you need to trace synch operations.
5153// Set RECORD_SYNCH_LIMIT to a large-enough value,
5154// and call record_synch_enable and record_synch_disable
5155// around the computation of interest.
5156
5157void record_synch(char* name, bool returning);  // defined below
5158
5159class RecordSynch {
5160  char* _name;
5161 public:
5162  RecordSynch(char* name) :_name(name)
5163                 { record_synch(_name, false); }
5164  ~RecordSynch() { record_synch(_name,   true);  }
5165};
5166
5167#define CHECK_SYNCH_OP(ret, name, params, args, inner)          \
5168extern "C" ret name params {                                    \
5169  typedef ret name##_t params;                                  \
5170  static name##_t* implem = NULL;                               \
5171  static int callcount = 0;                                     \
5172  if (implem == NULL) {                                         \
5173    implem = (name##_t*) dlsym(RTLD_NEXT, #name);               \
5174    if (implem == NULL)  fatal(dlerror());                      \
5175  }                                                             \
5176  ++callcount;                                                  \
5177  RecordSynch _rs(#name);                                       \
5178  inner;                                                        \
5179  return implem args;                                           \
5180}
5181// in dbx, examine callcounts this way:
5182// for n in $(eval whereis callcount | awk '{print $2}'); do print $n; done
5183
5184#define CHECK_POINTER_OK(p) \
5185  (Universe::perm_gen() == NULL || !Universe::is_reserved_heap((oop)(p)))
5186#define CHECK_MU \
5187  if (!CHECK_POINTER_OK(mu)) fatal("Mutex must be in C heap only.");
5188#define CHECK_CV \
5189  if (!CHECK_POINTER_OK(cv)) fatal("Condvar must be in C heap only.");
5190#define CHECK_P(p) \
5191  if (!CHECK_POINTER_OK(p))  fatal(false,  "Pointer must be in C heap only.");
5192
5193#define CHECK_MUTEX(mutex_op) \
5194CHECK_SYNCH_OP(int, mutex_op, (mutex_t *mu), (mu), CHECK_MU);
5195
5196CHECK_MUTEX(   mutex_lock)
5197CHECK_MUTEX(  _mutex_lock)
5198CHECK_MUTEX( mutex_unlock)
5199CHECK_MUTEX(_mutex_unlock)
5200CHECK_MUTEX( mutex_trylock)
5201CHECK_MUTEX(_mutex_trylock)
5202
5203#define CHECK_COND(cond_op) \
5204CHECK_SYNCH_OP(int, cond_op, (cond_t *cv, mutex_t *mu), (cv, mu), CHECK_MU;CHECK_CV);
5205
5206CHECK_COND( cond_wait);
5207CHECK_COND(_cond_wait);
5208CHECK_COND(_cond_wait_cancel);
5209
5210#define CHECK_COND2(cond_op) \
5211CHECK_SYNCH_OP(int, cond_op, (cond_t *cv, mutex_t *mu, timestruc_t* ts), (cv, mu, ts), CHECK_MU;CHECK_CV);
5212
5213CHECK_COND2( cond_timedwait);
5214CHECK_COND2(_cond_timedwait);
5215CHECK_COND2(_cond_timedwait_cancel);
5216
5217// do the _lwp_* versions too
5218#define mutex_t lwp_mutex_t
5219#define cond_t  lwp_cond_t
5220CHECK_MUTEX(  _lwp_mutex_lock)
5221CHECK_MUTEX(  _lwp_mutex_unlock)
5222CHECK_MUTEX(  _lwp_mutex_trylock)
5223CHECK_MUTEX( __lwp_mutex_lock)
5224CHECK_MUTEX( __lwp_mutex_unlock)
5225CHECK_MUTEX( __lwp_mutex_trylock)
5226CHECK_MUTEX(___lwp_mutex_lock)
5227CHECK_MUTEX(___lwp_mutex_unlock)
5228
5229CHECK_COND(  _lwp_cond_wait);
5230CHECK_COND( __lwp_cond_wait);
5231CHECK_COND(___lwp_cond_wait);
5232
5233CHECK_COND2(  _lwp_cond_timedwait);
5234CHECK_COND2( __lwp_cond_timedwait);
5235#undef mutex_t
5236#undef cond_t
5237
5238CHECK_SYNCH_OP(int, _lwp_suspend2,       (int lwp, int *n), (lwp, n), 0);
5239CHECK_SYNCH_OP(int,__lwp_suspend2,       (int lwp, int *n), (lwp, n), 0);
5240CHECK_SYNCH_OP(int, _lwp_kill,           (int lwp, int n),  (lwp, n), 0);
5241CHECK_SYNCH_OP(int,__lwp_kill,           (int lwp, int n),  (lwp, n), 0);
5242CHECK_SYNCH_OP(int, _lwp_sema_wait,      (lwp_sema_t* p),   (p),  CHECK_P(p));
5243CHECK_SYNCH_OP(int,__lwp_sema_wait,      (lwp_sema_t* p),   (p),  CHECK_P(p));
5244CHECK_SYNCH_OP(int, _lwp_cond_broadcast, (lwp_cond_t* cv),  (cv), CHECK_CV);
5245CHECK_SYNCH_OP(int,__lwp_cond_broadcast, (lwp_cond_t* cv),  (cv), CHECK_CV);
5246
5247
5248// recording machinery:
5249
5250enum { RECORD_SYNCH_LIMIT = 200 };
5251char* record_synch_name[RECORD_SYNCH_LIMIT];
5252void* record_synch_arg0ptr[RECORD_SYNCH_LIMIT];
5253bool record_synch_returning[RECORD_SYNCH_LIMIT];
5254thread_t record_synch_thread[RECORD_SYNCH_LIMIT];
5255int record_synch_count = 0;
5256bool record_synch_enabled = false;
5257
5258// in dbx, examine recorded data this way:
5259// for n in name arg0ptr returning thread; do print record_synch_$n[0..record_synch_count-1]; done
5260
5261void record_synch(char* name, bool returning) {
5262  if (record_synch_enabled) {
5263    if (record_synch_count < RECORD_SYNCH_LIMIT) {
5264      record_synch_name[record_synch_count] = name;
5265      record_synch_returning[record_synch_count] = returning;
5266      record_synch_thread[record_synch_count] = thr_self();
5267      record_synch_arg0ptr[record_synch_count] = &name;
5268      record_synch_count++;
5269    }
5270    // put more checking code here:
5271    // ...
5272  }
5273}
5274
5275void record_synch_enable() {
5276  // start collecting trace data, if not already doing so
5277  if (!record_synch_enabled)  record_synch_count = 0;
5278  record_synch_enabled = true;
5279}
5280
5281void record_synch_disable() {
5282  // stop collecting trace data
5283  record_synch_enabled = false;
5284}
5285
5286#endif // INTERPOSE_ON_SYSTEM_SYNCH_FUNCTIONS
5287#endif // PRODUCT
5288
5289const intptr_t thr_time_off  = (intptr_t)(&((prusage_t *)(NULL))->pr_utime);
5290const intptr_t thr_time_size = (intptr_t)(&((prusage_t *)(NULL))->pr_ttime) -
5291                               (intptr_t)(&((prusage_t *)(NULL))->pr_utime);
5292
5293
5294// JVMTI & JVM monitoring and management support
5295// The thread_cpu_time() and current_thread_cpu_time() are only
5296// supported if is_thread_cpu_time_supported() returns true.
5297// They are not supported on Solaris T1.
5298
5299// current_thread_cpu_time(bool) and thread_cpu_time(Thread*, bool)
5300// are used by JVM M&M and JVMTI to get user+sys or user CPU time
5301// of a thread.
5302//
5303// current_thread_cpu_time() and thread_cpu_time(Thread *)
5304// returns the fast estimate available on the platform.
5305
5306// hrtime_t gethrvtime() return value includes
5307// user time but does not include system time
5308jlong os::current_thread_cpu_time() {
5309  return (jlong) gethrvtime();
5310}
5311
5312jlong os::thread_cpu_time(Thread *thread) {
5313  // return user level CPU time only to be consistent with
5314  // what current_thread_cpu_time returns.
5315  // thread_cpu_time_info() must be changed if this changes
5316  return os::thread_cpu_time(thread, false /* user time only */);
5317}
5318
5319jlong os::current_thread_cpu_time(bool user_sys_cpu_time) {
5320  if (user_sys_cpu_time) {
5321    return os::thread_cpu_time(Thread::current(), user_sys_cpu_time);
5322  } else {
5323    return os::current_thread_cpu_time();
5324  }
5325}
5326
5327jlong os::thread_cpu_time(Thread *thread, bool user_sys_cpu_time) {
5328  char proc_name[64];
5329  int count;
5330  prusage_t prusage;
5331  jlong lwp_time;
5332  int fd;
5333
5334  sprintf(proc_name, "/proc/%d/lwp/%d/lwpusage",
5335                     getpid(),
5336                     thread->osthread()->lwp_id());
5337  fd = open(proc_name, O_RDONLY);
5338  if ( fd == -1 ) return -1;
5339
5340  do {
5341    count = pread(fd,
5342                  (void *)&prusage.pr_utime,
5343                  thr_time_size,
5344                  thr_time_off);
5345  } while (count < 0 && errno == EINTR);
5346  close(fd);
5347  if ( count < 0 ) return -1;
5348
5349  if (user_sys_cpu_time) {
5350    // user + system CPU time
5351    lwp_time = (((jlong)prusage.pr_stime.tv_sec +
5352                 (jlong)prusage.pr_utime.tv_sec) * (jlong)1000000000) +
5353                 (jlong)prusage.pr_stime.tv_nsec +
5354                 (jlong)prusage.pr_utime.tv_nsec;
5355  } else {
5356    // user level CPU time only
5357    lwp_time = ((jlong)prusage.pr_utime.tv_sec * (jlong)1000000000) +
5358                (jlong)prusage.pr_utime.tv_nsec;
5359  }
5360
5361  return(lwp_time);
5362}
5363
5364void os::current_thread_cpu_time_info(jvmtiTimerInfo *info_ptr) {
5365  info_ptr->max_value = ALL_64_BITS;      // will not wrap in less than 64 bits
5366  info_ptr->may_skip_backward = false;    // elapsed time not wall time
5367  info_ptr->may_skip_forward = false;     // elapsed time not wall time
5368  info_ptr->kind = JVMTI_TIMER_USER_CPU;  // only user time is returned
5369}
5370
5371void os::thread_cpu_time_info(jvmtiTimerInfo *info_ptr) {
5372  info_ptr->max_value = ALL_64_BITS;      // will not wrap in less than 64 bits
5373  info_ptr->may_skip_backward = false;    // elapsed time not wall time
5374  info_ptr->may_skip_forward = false;     // elapsed time not wall time
5375  info_ptr->kind = JVMTI_TIMER_USER_CPU;  // only user time is returned
5376}
5377
5378bool os::is_thread_cpu_time_supported() {
5379  if ( os::Solaris::T2_libthread() || UseBoundThreads ) {
5380    return true;
5381  } else {
5382    return false;
5383  }
5384}
5385
5386// System loadavg support.  Returns -1 if load average cannot be obtained.
5387// Return the load average for our processor set if the primitive exists
5388// (Solaris 9 and later).  Otherwise just return system wide loadavg.
5389int os::loadavg(double loadavg[], int nelem) {
5390  if (pset_getloadavg_ptr != NULL) {
5391    return (*pset_getloadavg_ptr)(PS_MYID, loadavg, nelem);
5392  } else {
5393    return ::getloadavg(loadavg, nelem);
5394  }
5395}
5396
5397//---------------------------------------------------------------------------------
5398#ifndef PRODUCT
5399
5400static address same_page(address x, address y) {
5401  intptr_t page_bits = -os::vm_page_size();
5402  if ((intptr_t(x) & page_bits) == (intptr_t(y) & page_bits))
5403    return x;
5404  else if (x > y)
5405    return (address)(intptr_t(y) | ~page_bits) + 1;
5406  else
5407    return (address)(intptr_t(y) & page_bits);
5408}
5409
5410bool os::find(address addr) {
5411  Dl_info dlinfo;
5412  memset(&dlinfo, 0, sizeof(dlinfo));
5413  if (dladdr(addr, &dlinfo)) {
5414#ifdef _LP64
5415    tty->print("0x%016lx: ", addr);
5416#else
5417    tty->print("0x%08x: ", addr);
5418#endif
5419    if (dlinfo.dli_sname != NULL)
5420      tty->print("%s+%#lx", dlinfo.dli_sname, addr-(intptr_t)dlinfo.dli_saddr);
5421    else if (dlinfo.dli_fname)
5422      tty->print("<offset %#lx>", addr-(intptr_t)dlinfo.dli_fbase);
5423    else
5424      tty->print("<absolute address>");
5425    if (dlinfo.dli_fname)  tty->print(" in %s", dlinfo.dli_fname);
5426#ifdef _LP64
5427    if (dlinfo.dli_fbase)  tty->print(" at 0x%016lx", dlinfo.dli_fbase);
5428#else
5429    if (dlinfo.dli_fbase)  tty->print(" at 0x%08x", dlinfo.dli_fbase);
5430#endif
5431    tty->cr();
5432
5433    if (Verbose) {
5434      // decode some bytes around the PC
5435      address begin = same_page(addr-40, addr);
5436      address end   = same_page(addr+40, addr);
5437      address       lowest = (address) dlinfo.dli_sname;
5438      if (!lowest)  lowest = (address) dlinfo.dli_fbase;
5439      if (begin < lowest)  begin = lowest;
5440      Dl_info dlinfo2;
5441      if (dladdr(end, &dlinfo2) && dlinfo2.dli_saddr != dlinfo.dli_saddr
5442          && end > dlinfo2.dli_saddr && dlinfo2.dli_saddr > begin)
5443        end = (address) dlinfo2.dli_saddr;
5444      Disassembler::decode(begin, end);
5445    }
5446    return true;
5447  }
5448  return false;
5449}
5450
5451#endif
5452
5453
5454// Following function has been added to support HotSparc's libjvm.so running
5455// under Solaris production JDK 1.2.2 / 1.3.0.  These came from
5456// src/solaris/hpi/native_threads in the EVM codebase.
5457//
5458// NOTE: This is no longer needed in the 1.3.1 and 1.4 production release
5459// libraries and should thus be removed. We will leave it behind for a while
5460// until we no longer want to able to run on top of 1.3.0 Solaris production
5461// JDK. See 4341971.
5462
5463#define STACK_SLACK 0x800
5464
5465extern "C" {
5466  intptr_t sysThreadAvailableStackWithSlack() {
5467    stack_t st;
5468    intptr_t retval, stack_top;
5469    retval = thr_stksegment(&st);
5470    assert(retval == 0, "incorrect return value from thr_stksegment");
5471    assert((address)&st < (address)st.ss_sp, "Invalid stack base returned");
5472    assert((address)&st > (address)st.ss_sp-st.ss_size, "Invalid stack size returned");
5473    stack_top=(intptr_t)st.ss_sp-st.ss_size;
5474    return ((intptr_t)&stack_top - stack_top - STACK_SLACK);
5475  }
5476}
5477
5478// Just to get the Kernel build to link on solaris for testing.
5479
5480extern "C" {
5481class ASGCT_CallTrace;
5482void AsyncGetCallTrace(ASGCT_CallTrace *trace, jint depth, void* ucontext)
5483  KERNEL_RETURN;
5484}
5485
5486
5487// ObjectMonitor park-unpark infrastructure ...
5488//
5489// We implement Solaris and Linux PlatformEvents with the
5490// obvious condvar-mutex-flag triple.
5491// Another alternative that works quite well is pipes:
5492// Each PlatformEvent consists of a pipe-pair.
5493// The thread associated with the PlatformEvent
5494// calls park(), which reads from the input end of the pipe.
5495// Unpark() writes into the other end of the pipe.
5496// The write-side of the pipe must be set NDELAY.
5497// Unfortunately pipes consume a large # of handles.
5498// Native solaris lwp_park() and lwp_unpark() work nicely, too.
5499// Using pipes for the 1st few threads might be workable, however.
5500//
5501// park() is permitted to return spuriously.
5502// Callers of park() should wrap the call to park() in
5503// an appropriate loop.  A litmus test for the correct
5504// usage of park is the following: if park() were modified
5505// to immediately return 0 your code should still work,
5506// albeit degenerating to a spin loop.
5507//
5508// An interesting optimization for park() is to use a trylock()
5509// to attempt to acquire the mutex.  If the trylock() fails
5510// then we know that a concurrent unpark() operation is in-progress.
5511// in that case the park() code could simply set _count to 0
5512// and return immediately.  The subsequent park() operation *might*
5513// return immediately.  That's harmless as the caller of park() is
5514// expected to loop.  By using trylock() we will have avoided a
5515// avoided a context switch caused by contention on the per-thread mutex.
5516//
5517// TODO-FIXME:
5518// 1.  Reconcile Doug's JSR166 j.u.c park-unpark with the
5519//     objectmonitor implementation.
5520// 2.  Collapse the JSR166 parker event, and the
5521//     objectmonitor ParkEvent into a single "Event" construct.
5522// 3.  In park() and unpark() add:
5523//     assert (Thread::current() == AssociatedWith).
5524// 4.  add spurious wakeup injection on a -XX:EarlyParkReturn=N switch.
5525//     1-out-of-N park() operations will return immediately.
5526//
5527// _Event transitions in park()
5528//   -1 => -1 : illegal
5529//    1 =>  0 : pass - return immediately
5530//    0 => -1 : block
5531//
5532// _Event serves as a restricted-range semaphore.
5533//
5534// Another possible encoding of _Event would be with
5535// explicit "PARKED" == 01b and "SIGNALED" == 10b bits.
5536//
5537// TODO-FIXME: add DTRACE probes for:
5538// 1.   Tx parks
5539// 2.   Ty unparks Tx
5540// 3.   Tx resumes from park
5541
5542
5543// value determined through experimentation
5544#define ROUNDINGFIX 11
5545
5546// utility to compute the abstime argument to timedwait.
5547// TODO-FIXME: switch from compute_abstime() to unpackTime().
5548
5549static timestruc_t* compute_abstime(timestruc_t* abstime, jlong millis) {
5550  // millis is the relative timeout time
5551  // abstime will be the absolute timeout time
5552  if (millis < 0)  millis = 0;
5553  struct timeval now;
5554  int status = gettimeofday(&now, NULL);
5555  assert(status == 0, "gettimeofday");
5556  jlong seconds = millis / 1000;
5557  jlong max_wait_period;
5558
5559  if (UseLWPSynchronization) {
5560    // forward port of fix for 4275818 (not sleeping long enough)
5561    // There was a bug in Solaris 6, 7 and pre-patch 5 of 8 where
5562    // _lwp_cond_timedwait() used a round_down algorithm rather
5563    // than a round_up. For millis less than our roundfactor
5564    // it rounded down to 0 which doesn't meet the spec.
5565    // For millis > roundfactor we may return a bit sooner, but
5566    // since we can not accurately identify the patch level and
5567    // this has already been fixed in Solaris 9 and 8 we will
5568    // leave it alone rather than always rounding down.
5569
5570    if (millis > 0 && millis < ROUNDINGFIX) millis = ROUNDINGFIX;
5571       // It appears that when we go directly through Solaris _lwp_cond_timedwait()
5572           // the acceptable max time threshold is smaller than for libthread on 2.5.1 and 2.6
5573           max_wait_period = 21000000;
5574  } else {
5575    max_wait_period = 50000000;
5576  }
5577  millis %= 1000;
5578  if (seconds > max_wait_period) {      // see man cond_timedwait(3T)
5579     seconds = max_wait_period;
5580  }
5581  abstime->tv_sec = now.tv_sec  + seconds;
5582  long       usec = now.tv_usec + millis * 1000;
5583  if (usec >= 1000000) {
5584    abstime->tv_sec += 1;
5585    usec -= 1000000;
5586  }
5587  abstime->tv_nsec = usec * 1000;
5588  return abstime;
5589}
5590
5591// Test-and-clear _Event, always leaves _Event set to 0, returns immediately.
5592// Conceptually TryPark() should be equivalent to park(0).
5593
5594int os::PlatformEvent::TryPark() {
5595  for (;;) {
5596    const int v = _Event ;
5597    guarantee ((v == 0) || (v == 1), "invariant") ;
5598    if (Atomic::cmpxchg (0, &_Event, v) == v) return v  ;
5599  }
5600}
5601
5602void os::PlatformEvent::park() {           // AKA: down()
5603  // Invariant: Only the thread associated with the Event/PlatformEvent
5604  // may call park().
5605  int v ;
5606  for (;;) {
5607      v = _Event ;
5608      if (Atomic::cmpxchg (v-1, &_Event, v) == v) break ;
5609  }
5610  guarantee (v >= 0, "invariant") ;
5611  if (v == 0) {
5612     // Do this the hard way by blocking ...
5613     // See http://monaco.sfbay/detail.jsf?cr=5094058.
5614     // TODO-FIXME: for Solaris SPARC set fprs.FEF=0 prior to parking.
5615     // Only for SPARC >= V8PlusA
5616#if defined(__sparc) && defined(COMPILER2)
5617     if (ClearFPUAtPark) { _mark_fpu_nosave() ; }
5618#endif
5619     int status = os::Solaris::mutex_lock(_mutex);
5620     assert_status(status == 0, status,  "mutex_lock");
5621     guarantee (_nParked == 0, "invariant") ;
5622     ++ _nParked ;
5623     while (_Event < 0) {
5624        // for some reason, under 2.7 lwp_cond_wait() may return ETIME ...
5625        // Treat this the same as if the wait was interrupted
5626        // With usr/lib/lwp going to kernel, always handle ETIME
5627        status = os::Solaris::cond_wait(_cond, _mutex);
5628        if (status == ETIME) status = EINTR ;
5629        assert_status(status == 0 || status == EINTR, status, "cond_wait");
5630     }
5631     -- _nParked ;
5632     _Event = 0 ;
5633     status = os::Solaris::mutex_unlock(_mutex);
5634     assert_status(status == 0, status, "mutex_unlock");
5635  }
5636}
5637
5638int os::PlatformEvent::park(jlong millis) {
5639  guarantee (_nParked == 0, "invariant") ;
5640  int v ;
5641  for (;;) {
5642      v = _Event ;
5643      if (Atomic::cmpxchg (v-1, &_Event, v) == v) break ;
5644  }
5645  guarantee (v >= 0, "invariant") ;
5646  if (v != 0) return OS_OK ;
5647
5648  int ret = OS_TIMEOUT;
5649  timestruc_t abst;
5650  compute_abstime (&abst, millis);
5651
5652  // See http://monaco.sfbay/detail.jsf?cr=5094058.
5653  // For Solaris SPARC set fprs.FEF=0 prior to parking.
5654  // Only for SPARC >= V8PlusA
5655#if defined(__sparc) && defined(COMPILER2)
5656 if (ClearFPUAtPark) { _mark_fpu_nosave() ; }
5657#endif
5658  int status = os::Solaris::mutex_lock(_mutex);
5659  assert_status(status == 0, status, "mutex_lock");
5660  guarantee (_nParked == 0, "invariant") ;
5661  ++ _nParked ;
5662  while (_Event < 0) {
5663     int status = os::Solaris::cond_timedwait(_cond, _mutex, &abst);
5664     assert_status(status == 0 || status == EINTR ||
5665                   status == ETIME || status == ETIMEDOUT,
5666                   status, "cond_timedwait");
5667     if (!FilterSpuriousWakeups) break ;                // previous semantics
5668     if (status == ETIME || status == ETIMEDOUT) break ;
5669     // We consume and ignore EINTR and spurious wakeups.
5670  }
5671  -- _nParked ;
5672  if (_Event >= 0) ret = OS_OK ;
5673  _Event = 0 ;
5674  status = os::Solaris::mutex_unlock(_mutex);
5675  assert_status(status == 0, status, "mutex_unlock");
5676  return ret;
5677}
5678
5679void os::PlatformEvent::unpark() {
5680  int v, AnyWaiters;
5681
5682  // Increment _Event.
5683  // Another acceptable implementation would be to simply swap 1
5684  // into _Event:
5685  //   if (Swap (&_Event, 1) < 0) {
5686  //      mutex_lock (_mutex) ; AnyWaiters = nParked; mutex_unlock (_mutex) ;
5687  //      if (AnyWaiters) cond_signal (_cond) ;
5688  //   }
5689
5690  for (;;) {
5691    v = _Event ;
5692    if (v > 0) {
5693       // The LD of _Event could have reordered or be satisfied
5694       // by a read-aside from this processor's write buffer.
5695       // To avoid problems execute a barrier and then
5696       // ratify the value.  A degenerate CAS() would also work.
5697       // Viz., CAS (v+0, &_Event, v) == v).
5698       OrderAccess::fence() ;
5699       if (_Event == v) return ;
5700       continue ;
5701    }
5702    if (Atomic::cmpxchg (v+1, &_Event, v) == v) break ;
5703  }
5704
5705  // If the thread associated with the event was parked, wake it.
5706  if (v < 0) {
5707     int status ;
5708     // Wait for the thread assoc with the PlatformEvent to vacate.
5709     status = os::Solaris::mutex_lock(_mutex);
5710     assert_status(status == 0, status, "mutex_lock");
5711     AnyWaiters = _nParked ;
5712     status = os::Solaris::mutex_unlock(_mutex);
5713     assert_status(status == 0, status, "mutex_unlock");
5714     guarantee (AnyWaiters == 0 || AnyWaiters == 1, "invariant") ;
5715     if (AnyWaiters != 0) {
5716       // We intentional signal *after* dropping the lock
5717       // to avoid a common class of futile wakeups.
5718       status = os::Solaris::cond_signal(_cond);
5719       assert_status(status == 0, status, "cond_signal");
5720     }
5721  }
5722}
5723
5724// JSR166
5725// -------------------------------------------------------
5726
5727/*
5728 * The solaris and linux implementations of park/unpark are fairly
5729 * conservative for now, but can be improved. They currently use a
5730 * mutex/condvar pair, plus _counter.
5731 * Park decrements _counter if > 0, else does a condvar wait.  Unpark
5732 * sets count to 1 and signals condvar.  Only one thread ever waits
5733 * on the condvar. Contention seen when trying to park implies that someone
5734 * is unparking you, so don't wait. And spurious returns are fine, so there
5735 * is no need to track notifications.
5736 */
5737
5738#define NANOSECS_PER_SEC 1000000000
5739#define NANOSECS_PER_MILLISEC 1000000
5740#define MAX_SECS 100000000
5741
5742/*
5743 * This code is common to linux and solaris and will be moved to a
5744 * common place in dolphin.
5745 *
5746 * The passed in time value is either a relative time in nanoseconds
5747 * or an absolute time in milliseconds. Either way it has to be unpacked
5748 * into suitable seconds and nanoseconds components and stored in the
5749 * given timespec structure.
5750 * Given time is a 64-bit value and the time_t used in the timespec is only
5751 * a signed-32-bit value (except on 64-bit Linux) we have to watch for
5752 * overflow if times way in the future are given. Further on Solaris versions
5753 * prior to 10 there is a restriction (see cond_timedwait) that the specified
5754 * number of seconds, in abstime, is less than current_time  + 100,000,000.
5755 * As it will be 28 years before "now + 100000000" will overflow we can
5756 * ignore overflow and just impose a hard-limit on seconds using the value
5757 * of "now + 100,000,000". This places a limit on the timeout of about 3.17
5758 * years from "now".
5759 */
5760static void unpackTime(timespec* absTime, bool isAbsolute, jlong time) {
5761  assert (time > 0, "convertTime");
5762
5763  struct timeval now;
5764  int status = gettimeofday(&now, NULL);
5765  assert(status == 0, "gettimeofday");
5766
5767  time_t max_secs = now.tv_sec + MAX_SECS;
5768
5769  if (isAbsolute) {
5770    jlong secs = time / 1000;
5771    if (secs > max_secs) {
5772      absTime->tv_sec = max_secs;
5773    }
5774    else {
5775      absTime->tv_sec = secs;
5776    }
5777    absTime->tv_nsec = (time % 1000) * NANOSECS_PER_MILLISEC;
5778  }
5779  else {
5780    jlong secs = time / NANOSECS_PER_SEC;
5781    if (secs >= MAX_SECS) {
5782      absTime->tv_sec = max_secs;
5783      absTime->tv_nsec = 0;
5784    }
5785    else {
5786      absTime->tv_sec = now.tv_sec + secs;
5787      absTime->tv_nsec = (time % NANOSECS_PER_SEC) + now.tv_usec*1000;
5788      if (absTime->tv_nsec >= NANOSECS_PER_SEC) {
5789        absTime->tv_nsec -= NANOSECS_PER_SEC;
5790        ++absTime->tv_sec; // note: this must be <= max_secs
5791      }
5792    }
5793  }
5794  assert(absTime->tv_sec >= 0, "tv_sec < 0");
5795  assert(absTime->tv_sec <= max_secs, "tv_sec > max_secs");
5796  assert(absTime->tv_nsec >= 0, "tv_nsec < 0");
5797  assert(absTime->tv_nsec < NANOSECS_PER_SEC, "tv_nsec >= nanos_per_sec");
5798}
5799
5800void Parker::park(bool isAbsolute, jlong time) {
5801
5802  // Optional fast-path check:
5803  // Return immediately if a permit is available.
5804  if (_counter > 0) {
5805      _counter = 0 ;
5806      OrderAccess::fence();
5807      return ;
5808  }
5809
5810  // Optional fast-exit: Check interrupt before trying to wait
5811  Thread* thread = Thread::current();
5812  assert(thread->is_Java_thread(), "Must be JavaThread");
5813  JavaThread *jt = (JavaThread *)thread;
5814  if (Thread::is_interrupted(thread, false)) {
5815    return;
5816  }
5817
5818  // First, demultiplex/decode time arguments
5819  timespec absTime;
5820  if (time < 0) { // don't wait at all
5821    return;
5822  }
5823  if (time > 0) {
5824    // Warning: this code might be exposed to the old Solaris time
5825    // round-down bugs.  Grep "roundingFix" for details.
5826    unpackTime(&absTime, isAbsolute, time);
5827  }
5828
5829  // Enter safepoint region
5830  // Beware of deadlocks such as 6317397.
5831  // The per-thread Parker:: _mutex is a classic leaf-lock.
5832  // In particular a thread must never block on the Threads_lock while
5833  // holding the Parker:: mutex.  If safepoints are pending both the
5834  // the ThreadBlockInVM() CTOR and DTOR may grab Threads_lock.
5835  ThreadBlockInVM tbivm(jt);
5836
5837  // Don't wait if cannot get lock since interference arises from
5838  // unblocking.  Also. check interrupt before trying wait
5839  if (Thread::is_interrupted(thread, false) ||
5840      os::Solaris::mutex_trylock(_mutex) != 0) {
5841    return;
5842  }
5843
5844  int status ;
5845
5846  if (_counter > 0)  { // no wait needed
5847    _counter = 0;
5848    status = os::Solaris::mutex_unlock(_mutex);
5849    assert (status == 0, "invariant") ;
5850    OrderAccess::fence();
5851    return;
5852  }
5853
5854#ifdef ASSERT
5855  // Don't catch signals while blocked; let the running threads have the signals.
5856  // (This allows a debugger to break into the running thread.)
5857  sigset_t oldsigs;
5858  sigset_t* allowdebug_blocked = os::Solaris::allowdebug_blocked_signals();
5859  thr_sigsetmask(SIG_BLOCK, allowdebug_blocked, &oldsigs);
5860#endif
5861
5862  OSThreadWaitState osts(thread->osthread(), false /* not Object.wait() */);
5863  jt->set_suspend_equivalent();
5864  // cleared by handle_special_suspend_equivalent_condition() or java_suspend_self()
5865
5866  // Do this the hard way by blocking ...
5867  // See http://monaco.sfbay/detail.jsf?cr=5094058.
5868  // TODO-FIXME: for Solaris SPARC set fprs.FEF=0 prior to parking.
5869  // Only for SPARC >= V8PlusA
5870#if defined(__sparc) && defined(COMPILER2)
5871  if (ClearFPUAtPark) { _mark_fpu_nosave() ; }
5872#endif
5873
5874  if (time == 0) {
5875    status = os::Solaris::cond_wait (_cond, _mutex) ;
5876  } else {
5877    status = os::Solaris::cond_timedwait (_cond, _mutex, &absTime);
5878  }
5879  // Note that an untimed cond_wait() can sometimes return ETIME on older
5880  // versions of the Solaris.
5881  assert_status(status == 0 || status == EINTR ||
5882                status == ETIME || status == ETIMEDOUT,
5883                status, "cond_timedwait");
5884
5885#ifdef ASSERT
5886  thr_sigsetmask(SIG_SETMASK, &oldsigs, NULL);
5887#endif
5888  _counter = 0 ;
5889  status = os::Solaris::mutex_unlock(_mutex);
5890  assert_status(status == 0, status, "mutex_unlock") ;
5891
5892  // If externally suspended while waiting, re-suspend
5893  if (jt->handle_special_suspend_equivalent_condition()) {
5894    jt->java_suspend_self();
5895  }
5896
5897  OrderAccess::fence();
5898}
5899
5900void Parker::unpark() {
5901  int s, status ;
5902  status = os::Solaris::mutex_lock (_mutex) ;
5903  assert (status == 0, "invariant") ;
5904  s = _counter;
5905  _counter = 1;
5906  status = os::Solaris::mutex_unlock (_mutex) ;
5907  assert (status == 0, "invariant") ;
5908
5909  if (s < 1) {
5910    status = os::Solaris::cond_signal (_cond) ;
5911    assert (status == 0, "invariant") ;
5912  }
5913}
5914
5915extern char** environ;
5916
5917// Run the specified command in a separate process. Return its exit value,
5918// or -1 on failure (e.g. can't fork a new process).
5919// Unlike system(), this function can be called from signal handler. It
5920// doesn't block SIGINT et al.
5921int os::fork_and_exec(char* cmd) {
5922  char * argv[4];
5923  argv[0] = (char *)"sh";
5924  argv[1] = (char *)"-c";
5925  argv[2] = cmd;
5926  argv[3] = NULL;
5927
5928  // fork is async-safe, fork1 is not so can't use in signal handler
5929  pid_t pid;
5930  Thread* t = ThreadLocalStorage::get_thread_slow();
5931  if (t != NULL && t->is_inside_signal_handler()) {
5932    pid = fork();
5933  } else {
5934    pid = fork1();
5935  }
5936
5937  if (pid < 0) {
5938    // fork failed
5939    warning("fork failed: %s", strerror(errno));
5940    return -1;
5941
5942  } else if (pid == 0) {
5943    // child process
5944
5945    // try to be consistent with system(), which uses "/usr/bin/sh" on Solaris
5946    execve("/usr/bin/sh", argv, environ);
5947
5948    // execve failed
5949    _exit(-1);
5950
5951  } else  {
5952    // copied from J2SE ..._waitForProcessExit() in UNIXProcess_md.c; we don't
5953    // care about the actual exit code, for now.
5954
5955    int status;
5956
5957    // Wait for the child process to exit.  This returns immediately if
5958    // the child has already exited. */
5959    while (waitpid(pid, &status, 0) < 0) {
5960        switch (errno) {
5961        case ECHILD: return 0;
5962        case EINTR: break;
5963        default: return -1;
5964        }
5965    }
5966
5967    if (WIFEXITED(status)) {
5968       // The child exited normally; get its exit code.
5969       return WEXITSTATUS(status);
5970    } else if (WIFSIGNALED(status)) {
5971       // The child exited because of a signal
5972       // The best value to return is 0x80 + signal number,
5973       // because that is what all Unix shells do, and because
5974       // it allows callers to distinguish between process exit and
5975       // process death by signal.
5976       return 0x80 + WTERMSIG(status);
5977    } else {
5978       // Unknown exit code; pass it through
5979       return status;
5980    }
5981  }
5982}
5983