1 /*
  2  * Copyright (c) 2017, 2021, Red Hat, Inc. All rights reserved.
  3  * Copyright Amazon.com Inc. or its affiliates. All Rights Reserved.
  4  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
  5  *
  6  * This code is free software; you can redistribute it and/or modify it
  7  * under the terms of the GNU General Public License version 2 only, as
  8  * published by the Free Software Foundation.
  9  *
 10  * This code is distributed in the hope that it will be useful, but WITHOUT
 11  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 12  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 13  * version 2 for more details (a copy is included in the LICENSE file that
 14  * accompanied this code).
 15  *
 16  * You should have received a copy of the GNU General Public License version
 17  * 2 along with this work; if not, write to the Free Software Foundation,
 18  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 19  *
 20  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 21  * or visit www.oracle.com if you need additional information or have any
 22  * questions.
 23  *
 24  */
 25 
 26 #include "precompiled.hpp"
 27 
 28 #include "gc/shared/workerDataArray.inline.hpp"
 29 #include "gc/shenandoah/shenandoahCollectorPolicy.hpp"
 30 #include "gc/shenandoah/shenandoahPhaseTimings.hpp"
 31 #include "gc/shenandoah/shenandoahHeap.inline.hpp"
 32 #include "gc/shenandoah/shenandoahUtils.hpp"
 33 #include "gc/shenandoah/heuristics/shenandoahHeuristics.hpp"
 34 #include "runtime/orderAccess.hpp"
 35 #include "utilities/ostream.hpp"
 36 
 37 #define SHENANDOAH_PHASE_NAME_FORMAT "%-30s"
 38 #define SHENANDOAH_S_TIME_FORMAT "%8.3lf"
 39 #define SHENANDOAH_US_TIME_FORMAT "%8.0lf"
 40 #define SHENANDOAH_US_WORKER_TIME_FORMAT "%3.0lf"
 41 #define SHENANDOAH_US_WORKER_NOTIME_FORMAT "%3s"
 42 #define SHENANDOAH_PARALLELISM_FORMAT "%4.2lf"
 43 
 44 #define SHENANDOAH_PHASE_DECLARE_NAME(type, title) \
 45   title,
 46 
 47 const char* ShenandoahPhaseTimings::_phase_names[] = {
 48   SHENANDOAH_PHASE_DO(SHENANDOAH_PHASE_DECLARE_NAME)
 49 };
 50 
 51 #undef SHENANDOAH_PHASE_DECLARE_NAME
 52 
 53 ShenandoahPhaseTimings::ShenandoahPhaseTimings(uint max_workers) :
 54   _max_workers(max_workers) {
 55   assert(_max_workers > 0, "Must have some GC threads");
 56 
 57   // Initialize everything to sane defaults
 58   for (uint i = 0; i < _num_phases; i++) {
 59 #define SHENANDOAH_WORKER_DATA_NULL(type, title) \
 60     _worker_data[i] = nullptr;
 61     SHENANDOAH_PAR_PHASE_DO(,, SHENANDOAH_WORKER_DATA_NULL)
 62 #undef SHENANDOAH_WORKER_DATA_NULL
 63     _cycle_data[i] = uninitialized();
 64   }
 65 
 66   // Then punch in the worker-related data.
 67   // Every worker phase get a bunch of internal objects, except
 68   // the very first slot, which is "<total>" and is not populated.
 69   for (uint i = 0; i < _num_phases; i++) {
 70     if (is_worker_phase(Phase(i))) {
 71       int c = 0;
 72 #define SHENANDOAH_WORKER_DATA_INIT(type, title) \
 73       if (c++ != 0) _worker_data[i + c] = new ShenandoahWorkerData(nullptr, title, _max_workers);
 74       SHENANDOAH_PAR_PHASE_DO(,, SHENANDOAH_WORKER_DATA_INIT)
 75 #undef SHENANDOAH_WORKER_DATA_INIT
 76     }
 77   }
 78 
 79   _policy = ShenandoahHeap::heap()->shenandoah_policy();
 80   assert(_policy != nullptr, "Can not be null");
 81 }
 82 
 83 ShenandoahPhaseTimings::Phase ShenandoahPhaseTimings::worker_par_phase(Phase phase, ParPhase par_phase) {
 84   assert(is_worker_phase(phase), "Phase should accept worker phase times: %s", phase_name(phase));
 85   Phase p = Phase(phase + 1 + par_phase);
 86   assert(p >= 0 && p < _num_phases, "Out of bound for: %s", phase_name(phase));
 87   return p;
 88 }
 89 
 90 ShenandoahWorkerData* ShenandoahPhaseTimings::worker_data(Phase phase, ParPhase par_phase) {
 91   Phase p = worker_par_phase(phase, par_phase);
 92   ShenandoahWorkerData* wd = _worker_data[p];
 93   assert(wd != nullptr, "Counter initialized: %s", phase_name(p));
 94   return wd;
 95 }
 96 
 97 bool ShenandoahPhaseTimings::is_worker_phase(Phase phase) {
 98   assert(phase >= 0 && phase < _num_phases, "Out of bounds");
 99   switch (phase) {
100     case init_evac:
101     case init_scan_rset:
102     case finish_mark:
103     case purge_weak_par:
104     case full_gc_mark:
105     case full_gc_update_roots:
106     case full_gc_adjust_roots:
107     case degen_gc_stw_mark:
108     case degen_gc_mark:
109     case degen_gc_update_roots:
110     case full_gc_weakrefs:
111     case full_gc_purge_class_unload:
112     case full_gc_purge_weak_par:
113     case degen_gc_coalesce_and_fill:
114     case degen_gc_weakrefs:
115     case degen_gc_purge_class_unload:
116     case degen_gc_purge_weak_par:
117     case heap_iteration_roots:
118     case conc_mark:
119     case conc_mark_roots:
120     case conc_thread_roots:
121     case conc_weak_roots_work:
122     case conc_weak_refs:
123     case conc_strong_roots:
124     case conc_coalesce_and_fill:
125     case promote_in_place:
126       return true;
127     default:
128       return false;
129   }
130 }
131 
132 bool ShenandoahPhaseTimings::is_root_work_phase(Phase phase) {
133   switch (phase) {
134     case finish_mark:
135     case init_evac:
136     case degen_gc_update_roots:
137     case full_gc_mark:
138     case full_gc_update_roots:
139     case full_gc_adjust_roots:
140       return true;
141     default:
142       return false;
143   }
144 }
145 
146 void ShenandoahPhaseTimings::set_cycle_data(Phase phase, double time, bool should_aggregate) {
147   const double cycle_data = _cycle_data[phase];
148   if (should_aggregate) {
149     _cycle_data[phase] = (cycle_data == uninitialized()) ? time :  (cycle_data + time);
150   } else {
151 #ifdef ASSERT
152     assert(cycle_data == uninitialized(), "Should not be set yet: %s, current value: %lf", phase_name(phase), cycle_data);
153 #endif
154     _cycle_data[phase] = time;
155   }
156 }
157 
158 void ShenandoahPhaseTimings::record_phase_time(Phase phase, double time, bool should_aggregate) {
159   if (!_policy->is_at_shutdown()) {
160     set_cycle_data(phase, time, should_aggregate);
161   }
162 }
163 
164 void ShenandoahPhaseTimings::record_workers_start(Phase phase) {
165   assert(is_worker_phase(phase), "Phase should accept worker phase times: %s", phase_name(phase));
166 
167   // Special case: these phases can enter multiple times, need to reset
168   // their worker data every time.
169   if (phase == heap_iteration_roots) {
170     for (uint i = 1; i < _num_par_phases; i++) {
171       worker_data(phase, ParPhase(i))->reset();
172     }
173   }
174 
175 #ifdef ASSERT
176   for (uint i = 1; i < _num_par_phases; i++) {
177     ShenandoahWorkerData* wd = worker_data(phase, ParPhase(i));
178     for (uint c = 0; c < _max_workers; c++) {
179       assert(wd->get(c) == ShenandoahWorkerData::uninitialized(),
180              "Should not be set: %s", phase_name(worker_par_phase(phase, ParPhase(i))));
181     }
182   }
183 #endif
184 }
185 
186 void ShenandoahPhaseTimings::record_workers_end(Phase phase) {
187   assert(is_worker_phase(phase), "Phase should accept worker phase times: %s", phase_name(phase));
188 }
189 
190 void ShenandoahPhaseTimings::flush_par_workers_to_cycle() {
191   for (uint pi = 0; pi < _num_phases; pi++) {
192     Phase phase = Phase(pi);
193     if (is_worker_phase(phase)) {
194       double s = uninitialized();
195       for (uint i = 1; i < _num_par_phases; i++) {
196         ShenandoahWorkerData* wd = worker_data(phase, ParPhase(i));
197         double ws = uninitialized();
198         for (uint c = 0; c < _max_workers; c++) {
199           double v = wd->get(c);
200           if (v != ShenandoahWorkerData::uninitialized()) {
201             if (ws == uninitialized()) {
202               ws = v;
203             } else {
204               ws += v;
205             }
206           }
207         }
208         if (ws != uninitialized()) {
209           // add to each line in phase
210           set_cycle_data(Phase(phase + i + 1), ws);
211           if (s == uninitialized()) {
212             s = ws;
213           } else {
214             s += ws;
215           }
216         }
217       }
218       if (s != uninitialized()) {
219         // add to total for phase
220         set_cycle_data(Phase(phase + 1), s);
221       }
222     }
223   }
224 }
225 
226 void ShenandoahPhaseTimings::flush_cycle_to_global() {
227   for (uint i = 0; i < _num_phases; i++) {
228     if (_cycle_data[i] != uninitialized()) {
229       _global_data[i].add(_cycle_data[i]);
230       _cycle_data[i] = uninitialized();
231     }
232     if (_worker_data[i] != nullptr) {
233       _worker_data[i]->reset();
234     }
235   }
236   OrderAccess::fence();
237 }
238 
239 void ShenandoahPhaseTimings::print_cycle_on(outputStream* out) const {
240   out->cr();
241   out->print_cr("All times are wall-clock times, except per-root-class counters, that are sum over");
242   out->print_cr("all workers. Dividing the <total> over the root stage time estimates parallelism.");
243   out->cr();
244   for (uint i = 0; i < _num_phases; i++) {
245     double v = _cycle_data[i] * 1000000.0;
246     if (v > 0) {
247       out->print(SHENANDOAH_PHASE_NAME_FORMAT " " SHENANDOAH_US_TIME_FORMAT " us", _phase_names[i], v);
248 
249       if (is_worker_phase(Phase(i))) {
250         double total = _cycle_data[i + 1] * 1000000.0;
251         if (total > 0) {
252           out->print(", parallelism: " SHENANDOAH_PARALLELISM_FORMAT "x", total / v);
253         }
254       }
255 
256       if (_worker_data[i] != nullptr) {
257         out->print(", workers (us): ");
258         for (uint c = 0; c < _max_workers; c++) {
259           double tv = _worker_data[i]->get(c);
260           if (tv != ShenandoahWorkerData::uninitialized()) {
261             out->print(SHENANDOAH_US_WORKER_TIME_FORMAT ", ", tv * 1000000.0);
262           } else {
263             out->print(SHENANDOAH_US_WORKER_NOTIME_FORMAT ", ", "---");
264           }
265         }
266       }
267       out->cr();
268     }
269   }
270 }
271 
272 void ShenandoahPhaseTimings::print_global_on(outputStream* out) const {
273   out->cr();
274   out->print_cr("GC STATISTICS:");
275   out->print_cr("  \"(G)\" (gross) pauses include VM time: time to notify and block threads, do the pre-");
276   out->print_cr("        and post-safepoint housekeeping. Use -Xlog:safepoint+stats to dissect.");
277   out->print_cr("  \"(N)\" (net) pauses are the times spent in the actual GC code.");
278   out->print_cr("  \"a\" is average time for each phase, look at levels to see if average makes sense.");
279   out->print_cr("  \"lvls\" are quantiles: 0%% (minimum), 25%%, 50%% (median), 75%%, 100%% (maximum).");
280   out->cr();
281   out->print_cr("  All times are wall-clock times, except per-root-class counters, that are sum over");
282   out->print_cr("  all workers. Dividing the <total> over the root stage time estimates parallelism.");
283   out->cr();
284 
285   out->print_cr("  Pacing delays are measured from entering the pacing code till exiting it. Therefore,");
286   out->print_cr("  observed pacing delays may be higher than the threshold when paced thread spent more");
287   out->print_cr("  time in the pacing code. It usually happens when thread is de-scheduled while paced,");
288   out->print_cr("  OS takes longer to unblock the thread, or JVM experiences an STW pause.");
289   out->cr();
290   out->print_cr("  Higher delay would prevent application outpacing the GC, but it will hide the GC latencies");
291   out->print_cr("  from the STW pause times. Pacing affects the individual threads, and so it would also be");
292   out->print_cr("  invisible to the usual profiling tools, but would add up to end-to-end application latency.");
293   out->print_cr("  Raise max pacing delay with care.");
294   out->cr();
295 
296   for (uint i = 0; i < _num_phases; i++) {
297     if (_global_data[i].maximum() != 0) {
298       out->print_cr(SHENANDOAH_PHASE_NAME_FORMAT " = " SHENANDOAH_S_TIME_FORMAT " s "
299                     "(a = " SHENANDOAH_US_TIME_FORMAT " us) "
300                     "(n = " INT32_FORMAT_W(5) ") (lvls, us = "
301                     SHENANDOAH_US_TIME_FORMAT ", "
302                     SHENANDOAH_US_TIME_FORMAT ", "
303                     SHENANDOAH_US_TIME_FORMAT ", "
304                     SHENANDOAH_US_TIME_FORMAT ", "
305                     SHENANDOAH_US_TIME_FORMAT ")",
306                     _phase_names[i],
307                     _global_data[i].sum(),
308                     _global_data[i].avg() * 1000000.0,
309                     _global_data[i].num(),
310                     _global_data[i].percentile(0) * 1000000.0,
311                     _global_data[i].percentile(25) * 1000000.0,
312                     _global_data[i].percentile(50) * 1000000.0,
313                     _global_data[i].percentile(75) * 1000000.0,
314                     _global_data[i].maximum() * 1000000.0
315       );
316     }
317   }
318 }
319 
320 ShenandoahWorkerTimingsTracker::ShenandoahWorkerTimingsTracker(ShenandoahPhaseTimings::Phase phase,
321         ShenandoahPhaseTimings::ParPhase par_phase, uint worker_id, bool cumulative) :
322         _timings(ShenandoahHeap::heap()->phase_timings()),
323         _phase(phase), _par_phase(par_phase), _worker_id(worker_id) {
324 
325   assert(_timings->worker_data(_phase, _par_phase)->get(_worker_id) == ShenandoahWorkerData::uninitialized() || cumulative,
326          "Should not be set yet: %s", ShenandoahPhaseTimings::phase_name(_timings->worker_par_phase(_phase, _par_phase)));
327   _start_time = os::elapsedTime();
328 }
329 
330 ShenandoahWorkerTimingsTracker::~ShenandoahWorkerTimingsTracker() {
331   _timings->worker_data(_phase, _par_phase)->set_or_add(_worker_id, os::elapsedTime() - _start_time);
332 
333   if (ShenandoahPhaseTimings::is_root_work_phase(_phase)) {
334     ShenandoahPhaseTimings::Phase root_phase = _phase;
335     ShenandoahPhaseTimings::Phase cur_phase = _timings->worker_par_phase(root_phase, _par_phase);
336     _event.commit(GCId::current(), _worker_id, ShenandoahPhaseTimings::phase_name(cur_phase));
337   }
338 }