1 /*
  2  * Copyright (c) 2002, 2023, Oracle and/or its affiliates. All rights reserved.
  3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
  4  *
  5  * This code is free software; you can redistribute it and/or modify it
  6  * under the terms of the GNU General Public License version 2 only, as
  7  * published by the Free Software Foundation.
  8  *
  9  * This code is distributed in the hope that it will be useful, but WITHOUT
 10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 12  * version 2 for more details (a copy is included in the LICENSE file that
 13  * accompanied this code).
 14  *
 15  * You should have received a copy of the GNU General Public License version
 16  * 2 along with this work; if not, write to the Free Software Foundation,
 17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 18  *
 19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 20  * or visit www.oracle.com if you need additional information or have any
 21  * questions.
 22  *
 23  */
 24 
 25 #include "precompiled.hpp"
 26 #include "classfile/javaClasses.inline.hpp"
 27 #include "gc/parallel/mutableSpace.hpp"
 28 #include "gc/parallel/parallelScavengeHeap.hpp"
 29 #include "gc/parallel/psOldGen.hpp"
 30 #include "gc/parallel/psPromotionManager.inline.hpp"
 31 #include "gc/parallel/psScavenge.inline.hpp"
 32 #include "gc/shared/continuationGCSupport.inline.hpp"
 33 #include "gc/shared/gcTrace.hpp"
 34 #include "gc/shared/preservedMarks.inline.hpp"
 35 #include "gc/shared/taskqueue.inline.hpp"
 36 #include "logging/log.hpp"
 37 #include "logging/logStream.hpp"
 38 #include "memory/allocation.inline.hpp"
 39 #include "memory/iterator.inline.hpp"
 40 #include "memory/memRegion.hpp"
 41 #include "memory/padded.inline.hpp"
 42 #include "memory/resourceArea.hpp"
 43 #include "oops/access.inline.hpp"
 44 #include "oops/compressedOops.inline.hpp"
 45 
 46 PaddedEnd<PSPromotionManager>* PSPromotionManager::_manager_array = nullptr;
 47 PSPromotionManager::PSScannerTasksQueueSet* PSPromotionManager::_stack_array_depth = nullptr;
 48 PreservedMarksSet*             PSPromotionManager::_preserved_marks_set = nullptr;
 49 PSOldGen*                      PSPromotionManager::_old_gen = nullptr;
 50 MutableSpace*                  PSPromotionManager::_young_space = nullptr;
 51 
 52 void PSPromotionManager::initialize() {
 53   ParallelScavengeHeap* heap = ParallelScavengeHeap::heap();
 54 
 55   _old_gen = heap->old_gen();
 56   _young_space = heap->young_gen()->to_space();
 57 
 58   const uint promotion_manager_num = ParallelGCThreads;
 59 
 60   // To prevent false sharing, we pad the PSPromotionManagers
 61   // and make sure that the first instance starts at a cache line.
 62   assert(_manager_array == nullptr, "Attempt to initialize twice");
 63   _manager_array = PaddedArray<PSPromotionManager, mtGC>::create_unfreeable(promotion_manager_num);
 64 
 65   _stack_array_depth = new PSScannerTasksQueueSet(ParallelGCThreads);
 66 
 67   // Create and register the PSPromotionManager(s) for the worker threads.
 68   for(uint i=0; i<ParallelGCThreads; i++) {
 69     stack_array_depth()->register_queue(i, _manager_array[i].claimed_stack_depth());
 70   }
 71   // The VMThread gets its own PSPromotionManager, which is not available
 72   // for work stealing.
 73 
 74   assert(_preserved_marks_set == nullptr, "Attempt to initialize twice");
 75   _preserved_marks_set = new PreservedMarksSet(true /* in_c_heap */);
 76   _preserved_marks_set->init(promotion_manager_num);
 77   for (uint i = 0; i < promotion_manager_num; i += 1) {
 78     _manager_array[i].register_preserved_marks(_preserved_marks_set->get(i));
 79   }
 80 }
 81 
 82 // Helper functions to get around the circular dependency between
 83 // psScavenge.inline.hpp and psPromotionManager.inline.hpp.
 84 bool PSPromotionManager::should_scavenge(oop* p, bool check_to_space) {
 85   return PSScavenge::should_scavenge(p, check_to_space);
 86 }
 87 bool PSPromotionManager::should_scavenge(narrowOop* p, bool check_to_space) {
 88   return PSScavenge::should_scavenge(p, check_to_space);
 89 }
 90 
 91 PSPromotionManager* PSPromotionManager::gc_thread_promotion_manager(uint index) {
 92   assert(index < ParallelGCThreads, "index out of range");
 93   assert(_manager_array != nullptr, "Sanity");
 94   return &_manager_array[index];
 95 }
 96 
 97 PSPromotionManager* PSPromotionManager::vm_thread_promotion_manager() {
 98   assert(_manager_array != nullptr, "Sanity");
 99   return &_manager_array[0];
100 }
101 
102 void PSPromotionManager::pre_scavenge() {
103   ParallelScavengeHeap* heap = ParallelScavengeHeap::heap();
104 
105   _preserved_marks_set->assert_empty();
106   _young_space = heap->young_gen()->to_space();
107 
108   for(uint i=0; i<ParallelGCThreads; i++) {
109     manager_array(i)->reset();
110   }
111 }
112 
113 bool PSPromotionManager::post_scavenge(YoungGCTracer& gc_tracer) {
114   bool promotion_failure_occurred = false;
115 
116   TASKQUEUE_STATS_ONLY(print_taskqueue_stats());
117   for (uint i = 0; i < ParallelGCThreads; i++) {
118     PSPromotionManager* manager = manager_array(i);
119     assert(manager->claimed_stack_depth()->is_empty(), "should be empty");
120     if (manager->_promotion_failed_info.has_failed()) {
121       gc_tracer.report_promotion_failed(manager->_promotion_failed_info);
122       promotion_failure_occurred = true;
123     }
124     manager->flush_labs();
125     manager->flush_string_dedup_requests();
126   }
127   if (!promotion_failure_occurred) {
128     // If there was no promotion failure, the preserved mark stacks
129     // should be empty.
130     _preserved_marks_set->assert_empty();
131   }
132   return promotion_failure_occurred;
133 }
134 
135 #if TASKQUEUE_STATS
136 void
137 PSPromotionManager::print_local_stats(outputStream* const out, uint i) const {
138   #define FMT " " SIZE_FORMAT_W(10)
139   out->print_cr("%3u" FMT FMT FMT FMT,
140                 i, _array_chunk_pushes, _array_chunk_steals,
141                 _arrays_chunked, _array_chunks_processed);
142   #undef FMT
143 }
144 
145 static const char* const pm_stats_hdr[] = {
146   "    ----partial array----     arrays      array",
147   "thr       push      steal    chunked     chunks",
148   "--- ---------- ---------- ---------- ----------"
149 };
150 
151 void PSPromotionManager::print_taskqueue_stats() {
152   if (!log_is_enabled(Trace, gc, task, stats)) {
153     return;
154   }
155   Log(gc, task, stats) log;
156   ResourceMark rm;
157   LogStream ls(log.trace());
158 
159   stack_array_depth()->print_taskqueue_stats(&ls, "Oop Queue");
160 
161   const uint hlines = sizeof(pm_stats_hdr) / sizeof(pm_stats_hdr[0]);
162   for (uint i = 0; i < hlines; ++i) ls.print_cr("%s", pm_stats_hdr[i]);
163   for (uint i = 0; i < ParallelGCThreads; ++i) {
164     manager_array(i)->print_local_stats(&ls, i);
165   }
166 }
167 
168 void PSPromotionManager::reset_stats() {
169   claimed_stack_depth()->stats.reset();
170   _array_chunk_pushes = _array_chunk_steals = 0;
171   _arrays_chunked = _array_chunks_processed = 0;
172 }
173 #endif // TASKQUEUE_STATS
174 
175 PSPromotionManager::PSPromotionManager() {
176   ParallelScavengeHeap* heap = ParallelScavengeHeap::heap();
177 
178   // We set the old lab's start array.
179   _old_lab.set_start_array(old_gen()->start_array());
180 
181   uint queue_size;
182   queue_size = claimed_stack_depth()->max_elems();
183 
184   if (ParallelGCThreads == 1) {
185     _target_stack_size = 0;
186   } else {
187     // don't let the target stack size to be more than 1/4 of the entries
188     _target_stack_size = (uint) MIN2((uint) GCDrainStackTargetSize,
189                                      (uint) (queue_size / 4));
190   }
191 
192   _array_chunk_size = ParGCArrayScanChunk;
193   // let's choose 1.5x the chunk size
194   _min_array_size_for_chunking = 3 * _array_chunk_size / 2;
195 
196   _preserved_marks = nullptr;
197 
198   reset();
199 }
200 
201 void PSPromotionManager::reset() {
202   assert(stacks_empty(), "reset of non-empty stack");
203 
204   // We need to get an assert in here to make sure the labs are always flushed.
205 
206   // Do not prefill the LAB's, save heap wastage!
207   HeapWord* lab_base = young_space()->top();
208   _young_lab.initialize(MemRegion(lab_base, (size_t)0));
209   _young_gen_is_full = false;
210 
211   lab_base = old_gen()->object_space()->top();
212   _old_lab.initialize(MemRegion(lab_base, (size_t)0));
213   _old_gen_is_full = false;
214 
215   _promotion_failed_info.reset();
216 
217   TASKQUEUE_STATS_ONLY(reset_stats());
218 }
219 
220 void PSPromotionManager::register_preserved_marks(PreservedMarks* preserved_marks) {
221   assert(_preserved_marks == nullptr, "do not set it twice");
222   _preserved_marks = preserved_marks;
223 }
224 
225 void PSPromotionManager::restore_preserved_marks() {
226   _preserved_marks_set->restore(&ParallelScavengeHeap::heap()->workers());
227 }
228 
229 void PSPromotionManager::drain_stacks_depth(bool totally_drain) {
230   const uint threshold = totally_drain ? 0
231                                        : _target_stack_size;
232 
233   PSScannerTasksQueue* const tq = claimed_stack_depth();
234   do {
235     ScannerTask task;
236 
237     // Drain overflow stack first, so other threads can steal from
238     // claimed stack while we work.
239     while (tq->pop_overflow(task)) {
240       // In PSCardTable::scavenge_contents_parallel(), when work is distributed
241       // among different workers, an object is never split between multiple workers.
242       // Therefore, if a worker gets owned a large objArray, it may accumulate
243       // many tasks (corresponding to every element in this array) in its
244       // task queue. When there are too many overflow tasks, publishing them
245       // (via try_push_to_taskqueue()) can incur noticeable overhead in Young GC
246       // pause, so it is better to process them locally until large-objArray-splitting is implemented.
247       process_popped_location_depth(task);
248     }
249 
250     while (tq->pop_local(task, threshold)) {
251       process_popped_location_depth(task);
252     }
253   } while (!tq->overflow_empty());
254 
255   assert(!totally_drain || tq->taskqueue_empty(), "Sanity");
256   assert(totally_drain || tq->size() <= _target_stack_size, "Sanity");
257   assert(tq->overflow_empty(), "Sanity");
258 }
259 
260 void PSPromotionManager::flush_labs() {
261   assert(stacks_empty(), "Attempt to flush lab with live stack");
262 
263   // If either promotion lab fills up, we can flush the
264   // lab but not refill it, so check first.
265   assert(!_young_lab.is_flushed() || _young_gen_is_full, "Sanity");
266   if (!_young_lab.is_flushed())
267     _young_lab.flush();
268 
269   assert(!_old_lab.is_flushed() || _old_gen_is_full, "Sanity");
270   if (!_old_lab.is_flushed())
271     _old_lab.flush();
272 
273   // Let PSScavenge know if we overflowed
274   if (_young_gen_is_full) {
275     PSScavenge::set_survivor_overflow(true);
276   }
277 }
278 
279 template <class T> void PSPromotionManager::process_array_chunk_work(
280                                                  oop obj,
281                                                  int start, int end) {
282   assert(start <= end, "invariant");
283   T* const base      = (T*)objArrayOop(obj)->base();
284   T* p               = base + start;
285   T* const chunk_end = base + end;
286   while (p < chunk_end) {
287     if (PSScavenge::should_scavenge(p)) {
288       claim_or_forward_depth(p);
289     }
290     ++p;
291   }
292 }
293 
294 void PSPromotionManager::process_array_chunk(PartialArrayScanTask task) {
295   assert(PSChunkLargeArrays, "invariant");
296 
297   oop old = task.to_source_array();
298   assert(old->forward_safe_klass()->is_objArray_klass(), "invariant");
299   assert(old->is_forwarded(), "invariant");
300 
301   TASKQUEUE_STATS_ONLY(++_array_chunks_processed);
302 
303   oop const obj = old->forwardee();
304 
305   int start;
306   int const end = arrayOop(old)->length();
307   if (end > (int) _min_array_size_for_chunking) {
308     // we'll chunk more
309     start = end - _array_chunk_size;
310     assert(start > 0, "invariant");
311     arrayOop(old)->set_length(start);
312     push_depth(ScannerTask(PartialArrayScanTask(old)));
313     TASKQUEUE_STATS_ONLY(++_array_chunk_pushes);
314   } else {
315     // this is the final chunk for this array
316     start = 0;
317     int const actual_length = arrayOop(obj)->length();
318     arrayOop(old)->set_length(actual_length);
319   }
320 
321   if (UseCompressedOops) {
322     process_array_chunk_work<narrowOop>(obj, start, end);
323   } else {
324     process_array_chunk_work<oop>(obj, start, end);
325   }
326 }
327 
328 oop PSPromotionManager::oop_promotion_failed(oop obj, markWord obj_mark) {
329   assert(_old_gen_is_full || PromotionFailureALot, "Sanity");
330 
331   // Attempt to CAS in the header.
332   // This tests if the header is still the same as when
333   // this started.  If it is the same (i.e., no forwarding
334   // pointer has been installed), then this thread owns
335   // it.
336   if (obj->forward_to_self_atomic(obj_mark) == nullptr) {
337     // We won any races, we "own" this object.
338     assert(obj == obj->forwardee(), "Sanity");
339 
340     _promotion_failed_info.register_copy_failure(obj->size());
341 
342     ContinuationGCSupport::transform_stack_chunk(obj);
343 
344     push_contents(obj);
345 
346     // Save the markWord of promotion-failed objs in _preserved_marks for later
347     // restoration. This way we don't have to walk the young-gen to locate
348     // these promotion-failed objs.
349     _preserved_marks->push_always(obj, obj_mark);
350   }  else {
351     // We lost, someone else "owns" this object
352     guarantee(obj->is_forwarded(), "Object must be forwarded if the cas failed.");
353 
354     // No unallocation to worry about.
355     obj = obj->forwardee();
356   }
357 
358   return obj;
359 }