1/*
2 * Copyright (c) 2014, 2016, Oracle and/or its affiliates. All rights reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation.
8 *
9 * This code is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
12 * version 2 for more details (a copy is included in the LICENSE file that
13 * accompanied this code).
14 *
15 * You should have received a copy of the GNU General Public License version
16 * 2 along with this work; if not, write to the Free Software Foundation,
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18 *
19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
20 * or visit www.oracle.com if you need additional information or have any
21 * questions.
22 *
23 */
24
25#ifndef SHARE_VM_GC_G1_G1STRINGDEDUP_HPP
26#define SHARE_VM_GC_G1_G1STRINGDEDUP_HPP
27
28//
29// String Deduplication
30//
31// String deduplication aims to reduce the heap live-set by deduplicating identical
32// instances of String so that they share the same backing character array.
33//
// The deduplication process is divided into two main parts, 1) finding the objects to
35// deduplicate, and 2) deduplicating those objects. The first part is done as part of
36// a normal GC cycle when objects are marked or evacuated. At this time a check is
37// applied on each object to check if it is a candidate for deduplication. If so, the
38// object is placed on the deduplication queue for later processing. The second part,
39// processing the objects on the deduplication queue, is a concurrent phase which
// starts right after the stop-the-world marking/evacuation phase. This phase is
// executed by the deduplication thread, which pulls deduplication candidates off the
// deduplication queue and tries to deduplicate them.
43//
44// A deduplication hashtable is used to keep track of all unique character arrays
45// used by String objects. When deduplicating, a lookup is made in this table to see
46// if there is already an identical character array somewhere on the heap. If so, the
47// String object is adjusted to point to that character array, releasing the reference
48// to the original array allowing it to eventually be garbage collected. If the lookup
49// fails the character array is instead inserted into the hashtable so that this array
50// can be shared at some point in the future.
51//
52// Candidate selection
53//
54// An object is considered a deduplication candidate if all of the following
55// statements are true:
56//
57// - The object is an instance of java.lang.String
58//
59// - The object is being evacuated from a young heap region
60//
61// - The object is being evacuated to a young/survivor heap region and the
62//   object's age is equal to the deduplication age threshold
63//
64//   or
65//
66//   The object is being evacuated to an old heap region and the object's age is
67//   less than the deduplication age threshold
68//
// Once a String object has been promoted to an old region, or its age is higher
// than the deduplication age threshold, it will never become a candidate again.
71// This approach avoids making the same object a candidate more than once.
72//
73// Interned strings are a bit special. They are explicitly deduplicated just before
74// being inserted into the StringTable (to avoid counteracting C2 optimizations done
75// on string literals), then they also become deduplication candidates if they reach
76// the deduplication age threshold or are evacuated to an old heap region. The second
77// attempt to deduplicate such strings will be in vain, but we have no fast way of
// filtering them out. This has not been shown to be a problem, as the number of interned
79// strings is usually dwarfed by the number of normal (non-interned) strings.
80//
81// For additional information on string deduplication, please see JEP 192,
82// http://openjdk.java.net/jeps/192
83//
84
85#include "memory/allocation.hpp"
86#include "oops/oop.hpp"
87
88class OopClosure;
89class BoolObjectClosure;
90class ThreadClosure;
91class outputStream;
92class G1StringDedupTable;
93class G1GCPhaseTimes;
94
95//
96// Main interface for interacting with string deduplication.
97//
98class G1StringDedup : public AllStatic {
99private:
100  // Single state for checking if both G1 and string deduplication is enabled.
101  static bool _enabled;
102
103  // Candidate selection policies, returns true if the given object is
104  // candidate for string deduplication.
105  static bool is_candidate_from_mark(oop obj);
106  static bool is_candidate_from_evacuation(bool from_young, bool to_young, oop obj);
107
108public:
109  // Returns true if both G1 and string deduplication is enabled.
110  static bool is_enabled() {
111    return _enabled;
112  }
113
114  // Initialize string deduplication.
115  static void initialize();
116
117  // Stop the deduplication thread.
118  static void stop();
119
120  // Immediately deduplicates the given String object, bypassing the
121  // the deduplication queue.
122  static void deduplicate(oop java_string);
123
124  // Enqueues a deduplication candidate for later processing by the deduplication
125  // thread. Before enqueuing, these functions apply the appropriate candidate
126  // selection policy to filters out non-candidates.
127  static void enqueue_from_mark(oop java_string);
128  static void enqueue_from_evacuation(bool from_young, bool to_young,
129                                      unsigned int queue, oop java_string);
130
131  static void oops_do(OopClosure* keep_alive);
132  static void unlink(BoolObjectClosure* is_alive);
133  static void unlink_or_oops_do(BoolObjectClosure* is_alive, OopClosure* keep_alive,
134                                bool allow_resize_and_rehash, G1GCPhaseTimes* phase_times = NULL);
135
136  static void threads_do(ThreadClosure* tc);
137  static void print_worker_threads_on(outputStream* st);
138  static void verify();
139};
140
141//
142// This closure encapsulates the state and the closures needed when scanning
143// the deduplication queue and table during the unlink_or_oops_do() operation.
144// A single instance of this closure is created and then shared by all worker
145// threads participating in the scan. The _next_queue and _next_bucket fields
146// provide a simple mechanism for GC workers to claim exclusive access to a
147// queue or a table partition.
148//
149class G1StringDedupUnlinkOrOopsDoClosure : public StackObj {
150private:
151  BoolObjectClosure*  _is_alive;
152  OopClosure*         _keep_alive;
153  G1StringDedupTable* _resized_table;
154  G1StringDedupTable* _rehashed_table;
155  size_t              _next_queue;
156  size_t              _next_bucket;
157
158public:
159  G1StringDedupUnlinkOrOopsDoClosure(BoolObjectClosure* is_alive,
160                                     OopClosure* keep_alive,
161                                     bool allow_resize_and_rehash);
162  ~G1StringDedupUnlinkOrOopsDoClosure();
163
164  bool is_resizing() {
165    return _resized_table != NULL;
166  }
167
168  G1StringDedupTable* resized_table() {
169    return _resized_table;
170  }
171
172  bool is_rehashing() {
173    return _rehashed_table != NULL;
174  }
175
176  // Atomically claims the next available queue for exclusive access by
177  // the current thread. Returns the queue number of the claimed queue.
178  size_t claim_queue();
179
180  // Atomically claims the next available table partition for exclusive
181  // access by the current thread. Returns the table bucket number where
182  // the claimed partition starts.
183  size_t claim_table_partition(size_t partition_size);
184
185  // Applies and returns the result from the is_alive closure, or
186  // returns true if no such closure was provided.
187  bool is_alive(oop o) {
188    if (_is_alive != NULL) {
189      return _is_alive->do_object_b(o);
190    }
191    return true;
192  }
193
194  // Applies the keep_alive closure, or does nothing if no such
195  // closure was provided.
196  void keep_alive(oop* p) {
197    if (_keep_alive != NULL) {
198      _keep_alive->do_oop(p);
199    }
200  }
201};
202
203#endif // SHARE_VM_GC_G1_G1STRINGDEDUP_HPP
204