1 /*
2 * Copyright (c) 2017, 2021, Red Hat, Inc. All rights reserved.
3 * Copyright Amazon.com Inc. or its affiliates. All Rights Reserved.
4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
5 *
6 * This code is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU General Public License version 2 only, as
8 * published by the Free Software Foundation.
9 *
10 * This code is distributed in the hope that it will be useful, but WITHOUT
11 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
13 * version 2 for more details (a copy is included in the LICENSE file that
14 * accompanied this code).
15 *
16 * You should have received a copy of the GNU General Public License version
17 * 2 along with this work; if not, write to the Free Software Foundation,
18 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
19 *
20 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
21 * or visit www.oracle.com if you need additional information or have any
22 * questions.
23 *
24 */
25
26 #include "precompiled.hpp"
27
28 #include "gc/shared/workerDataArray.inline.hpp"
29 #include "gc/shenandoah/shenandoahCollectorPolicy.hpp"
30 #include "gc/shenandoah/shenandoahPhaseTimings.hpp"
31 #include "gc/shenandoah/shenandoahHeap.inline.hpp"
32 #include "gc/shenandoah/shenandoahUtils.hpp"
33 #include "gc/shenandoah/heuristics/shenandoahHeuristics.hpp"
34 #include "runtime/orderAccess.hpp"
35 #include "utilities/ostream.hpp"
36
37 #define SHENANDOAH_PHASE_NAME_FORMAT "%-30s"
38 #define SHENANDOAH_S_TIME_FORMAT "%8.3lf"
39 #define SHENANDOAH_US_TIME_FORMAT "%8.0lf"
40 #define SHENANDOAH_US_WORKER_TIME_FORMAT "%3.0lf"
41 #define SHENANDOAH_US_WORKER_NOTIME_FORMAT "%3s"
42 #define SHENANDOAH_PARALLELISM_FORMAT "%4.2lf"
43
44 #define SHENANDOAH_PHASE_DECLARE_NAME(type, title) \
45 title,
46
47 const char* ShenandoahPhaseTimings::_phase_names[] = {
48 SHENANDOAH_PHASE_DO(SHENANDOAH_PHASE_DECLARE_NAME)
49 };
50
51 #undef SHENANDOAH_PHASE_DECLARE_NAME
52
53 ShenandoahPhaseTimings::ShenandoahPhaseTimings(uint max_workers) :
54 _max_workers(max_workers) {
55 assert(_max_workers > 0, "Must have some GC threads");
56
57 // Initialize everything to sane defaults
58 for (uint i = 0; i < _num_phases; i++) {
59 #define SHENANDOAH_WORKER_DATA_NULL(type, title) \
60 _worker_data[i] = nullptr;
61 SHENANDOAH_PAR_PHASE_DO(,, SHENANDOAH_WORKER_DATA_NULL)
62 #undef SHENANDOAH_WORKER_DATA_NULL
63 _cycle_data[i] = uninitialized();
64 }
65
66 // Then punch in the worker-related data.
67 // Every worker phase get a bunch of internal objects, except
68 // the very first slot, which is "<total>" and is not populated.
69 for (uint i = 0; i < _num_phases; i++) {
70 if (is_worker_phase(Phase(i))) {
71 int c = 0;
72 #define SHENANDOAH_WORKER_DATA_INIT(type, title) \
73 if (c++ != 0) _worker_data[i + c] = new ShenandoahWorkerData(nullptr, title, _max_workers);
74 SHENANDOAH_PAR_PHASE_DO(,, SHENANDOAH_WORKER_DATA_INIT)
75 #undef SHENANDOAH_WORKER_DATA_INIT
76 }
77 }
78
79 _policy = ShenandoahHeap::heap()->shenandoah_policy();
80 assert(_policy != nullptr, "Can not be null");
81 }
82
83 ShenandoahPhaseTimings::Phase ShenandoahPhaseTimings::worker_par_phase(Phase phase, ParPhase par_phase) {
84 assert(is_worker_phase(phase), "Phase should accept worker phase times: %s", phase_name(phase));
85 Phase p = Phase(phase + 1 + par_phase);
86 assert(p >= 0 && p < _num_phases, "Out of bound for: %s", phase_name(phase));
87 return p;
88 }
89
90 ShenandoahWorkerData* ShenandoahPhaseTimings::worker_data(Phase phase, ParPhase par_phase) {
91 Phase p = worker_par_phase(phase, par_phase);
92 ShenandoahWorkerData* wd = _worker_data[p];
93 assert(wd != nullptr, "Counter initialized: %s", phase_name(p));
94 return wd;
95 }
96
97 bool ShenandoahPhaseTimings::is_worker_phase(Phase phase) {
98 assert(phase >= 0 && phase < _num_phases, "Out of bounds");
99 switch (phase) {
100 case init_evac:
101 case init_scan_rset:
102 case finish_mark:
103 case purge_weak_par:
104 case full_gc_mark:
105 case full_gc_update_roots:
106 case full_gc_adjust_roots:
107 case degen_gc_stw_mark:
108 case degen_gc_mark:
109 case degen_gc_update_roots:
110 case full_gc_weakrefs:
111 case full_gc_purge_class_unload:
112 case full_gc_purge_weak_par:
113 case degen_gc_coalesce_and_fill:
114 case degen_gc_weakrefs:
115 case degen_gc_purge_class_unload:
116 case degen_gc_purge_weak_par:
117 case heap_iteration_roots:
118 case conc_mark:
119 case conc_mark_roots:
120 case conc_thread_roots:
121 case conc_weak_roots_work:
122 case conc_weak_refs:
123 case conc_strong_roots:
124 case conc_coalesce_and_fill:
125 case promote_in_place:
126 return true;
127 default:
128 return false;
129 }
130 }
131
132 bool ShenandoahPhaseTimings::is_root_work_phase(Phase phase) {
133 switch (phase) {
134 case finish_mark:
135 case init_evac:
136 case degen_gc_update_roots:
137 case full_gc_mark:
138 case full_gc_update_roots:
139 case full_gc_adjust_roots:
140 return true;
141 default:
142 return false;
143 }
144 }
145
146 void ShenandoahPhaseTimings::set_cycle_data(Phase phase, double time, bool should_aggregate) {
147 const double cycle_data = _cycle_data[phase];
148 if (should_aggregate) {
149 _cycle_data[phase] = (cycle_data == uninitialized()) ? time : (cycle_data + time);
150 } else {
151 #ifdef ASSERT
152 assert(cycle_data == uninitialized(), "Should not be set yet: %s, current value: %lf", phase_name(phase), cycle_data);
153 #endif
154 _cycle_data[phase] = time;
155 }
156 }
157
158 void ShenandoahPhaseTimings::record_phase_time(Phase phase, double time, bool should_aggregate) {
159 if (!_policy->is_at_shutdown()) {
160 set_cycle_data(phase, time, should_aggregate);
161 }
162 }
163
164 void ShenandoahPhaseTimings::record_workers_start(Phase phase) {
165 assert(is_worker_phase(phase), "Phase should accept worker phase times: %s", phase_name(phase));
166
167 // Special case: these phases can enter multiple times, need to reset
168 // their worker data every time.
169 if (phase == heap_iteration_roots) {
170 for (uint i = 1; i < _num_par_phases; i++) {
171 worker_data(phase, ParPhase(i))->reset();
172 }
173 }
174
175 #ifdef ASSERT
176 for (uint i = 1; i < _num_par_phases; i++) {
177 ShenandoahWorkerData* wd = worker_data(phase, ParPhase(i));
178 for (uint c = 0; c < _max_workers; c++) {
179 assert(wd->get(c) == ShenandoahWorkerData::uninitialized(),
180 "Should not be set: %s", phase_name(worker_par_phase(phase, ParPhase(i))));
181 }
182 }
183 #endif
184 }
185
186 void ShenandoahPhaseTimings::record_workers_end(Phase phase) {
187 assert(is_worker_phase(phase), "Phase should accept worker phase times: %s", phase_name(phase));
188 }
189
190 void ShenandoahPhaseTimings::flush_par_workers_to_cycle() {
191 for (uint pi = 0; pi < _num_phases; pi++) {
192 Phase phase = Phase(pi);
193 if (is_worker_phase(phase)) {
194 double s = uninitialized();
195 for (uint i = 1; i < _num_par_phases; i++) {
196 ShenandoahWorkerData* wd = worker_data(phase, ParPhase(i));
197 double ws = uninitialized();
198 for (uint c = 0; c < _max_workers; c++) {
199 double v = wd->get(c);
200 if (v != ShenandoahWorkerData::uninitialized()) {
201 if (ws == uninitialized()) {
202 ws = v;
203 } else {
204 ws += v;
205 }
206 }
207 }
208 if (ws != uninitialized()) {
209 // add to each line in phase
210 set_cycle_data(Phase(phase + i + 1), ws);
211 if (s == uninitialized()) {
212 s = ws;
213 } else {
214 s += ws;
215 }
216 }
217 }
218 if (s != uninitialized()) {
219 // add to total for phase
220 set_cycle_data(Phase(phase + 1), s);
221 }
222 }
223 }
224 }
225
226 void ShenandoahPhaseTimings::flush_cycle_to_global() {
227 for (uint i = 0; i < _num_phases; i++) {
228 if (_cycle_data[i] != uninitialized()) {
229 _global_data[i].add(_cycle_data[i]);
230 _cycle_data[i] = uninitialized();
231 }
232 if (_worker_data[i] != nullptr) {
233 _worker_data[i]->reset();
234 }
235 }
236 OrderAccess::fence();
237 }
238
239 void ShenandoahPhaseTimings::print_cycle_on(outputStream* out) const {
240 out->cr();
241 out->print_cr("All times are wall-clock times, except per-root-class counters, that are sum over");
242 out->print_cr("all workers. Dividing the <total> over the root stage time estimates parallelism.");
243 out->cr();
244 for (uint i = 0; i < _num_phases; i++) {
245 double v = _cycle_data[i] * 1000000.0;
246 if (v > 0) {
247 out->print(SHENANDOAH_PHASE_NAME_FORMAT " " SHENANDOAH_US_TIME_FORMAT " us", _phase_names[i], v);
248
249 if (is_worker_phase(Phase(i))) {
250 double total = _cycle_data[i + 1] * 1000000.0;
251 if (total > 0) {
252 out->print(", parallelism: " SHENANDOAH_PARALLELISM_FORMAT "x", total / v);
253 }
254 }
255
256 if (_worker_data[i] != nullptr) {
257 out->print(", workers (us): ");
258 for (uint c = 0; c < _max_workers; c++) {
259 double tv = _worker_data[i]->get(c);
260 if (tv != ShenandoahWorkerData::uninitialized()) {
261 out->print(SHENANDOAH_US_WORKER_TIME_FORMAT ", ", tv * 1000000.0);
262 } else {
263 out->print(SHENANDOAH_US_WORKER_NOTIME_FORMAT ", ", "---");
264 }
265 }
266 }
267 out->cr();
268 }
269 }
270 }
271
272 void ShenandoahPhaseTimings::print_global_on(outputStream* out) const {
273 out->cr();
274 out->print_cr("GC STATISTICS:");
275 out->print_cr(" \"(G)\" (gross) pauses include VM time: time to notify and block threads, do the pre-");
276 out->print_cr(" and post-safepoint housekeeping. Use -Xlog:safepoint+stats to dissect.");
277 out->print_cr(" \"(N)\" (net) pauses are the times spent in the actual GC code.");
278 out->print_cr(" \"a\" is average time for each phase, look at levels to see if average makes sense.");
279 out->print_cr(" \"lvls\" are quantiles: 0%% (minimum), 25%%, 50%% (median), 75%%, 100%% (maximum).");
280 out->cr();
281 out->print_cr(" All times are wall-clock times, except per-root-class counters, that are sum over");
282 out->print_cr(" all workers. Dividing the <total> over the root stage time estimates parallelism.");
283 out->cr();
284
285 out->print_cr(" Pacing delays are measured from entering the pacing code till exiting it. Therefore,");
286 out->print_cr(" observed pacing delays may be higher than the threshold when paced thread spent more");
287 out->print_cr(" time in the pacing code. It usually happens when thread is de-scheduled while paced,");
288 out->print_cr(" OS takes longer to unblock the thread, or JVM experiences an STW pause.");
289 out->cr();
290 out->print_cr(" Higher delay would prevent application outpacing the GC, but it will hide the GC latencies");
291 out->print_cr(" from the STW pause times. Pacing affects the individual threads, and so it would also be");
292 out->print_cr(" invisible to the usual profiling tools, but would add up to end-to-end application latency.");
293 out->print_cr(" Raise max pacing delay with care.");
294 out->cr();
295
296 for (uint i = 0; i < _num_phases; i++) {
297 if (_global_data[i].maximum() != 0) {
298 out->print_cr(SHENANDOAH_PHASE_NAME_FORMAT " = " SHENANDOAH_S_TIME_FORMAT " s "
299 "(a = " SHENANDOAH_US_TIME_FORMAT " us) "
300 "(n = " INT32_FORMAT_W(5) ") (lvls, us = "
301 SHENANDOAH_US_TIME_FORMAT ", "
302 SHENANDOAH_US_TIME_FORMAT ", "
303 SHENANDOAH_US_TIME_FORMAT ", "
304 SHENANDOAH_US_TIME_FORMAT ", "
305 SHENANDOAH_US_TIME_FORMAT ")",
306 _phase_names[i],
307 _global_data[i].sum(),
308 _global_data[i].avg() * 1000000.0,
309 _global_data[i].num(),
310 _global_data[i].percentile(0) * 1000000.0,
311 _global_data[i].percentile(25) * 1000000.0,
312 _global_data[i].percentile(50) * 1000000.0,
313 _global_data[i].percentile(75) * 1000000.0,
314 _global_data[i].maximum() * 1000000.0
315 );
316 }
317 }
318 }
319
320 ShenandoahWorkerTimingsTracker::ShenandoahWorkerTimingsTracker(ShenandoahPhaseTimings::Phase phase,
321 ShenandoahPhaseTimings::ParPhase par_phase, uint worker_id, bool cumulative) :
322 _timings(ShenandoahHeap::heap()->phase_timings()),
323 _phase(phase), _par_phase(par_phase), _worker_id(worker_id) {
324
325 assert(_timings->worker_data(_phase, _par_phase)->get(_worker_id) == ShenandoahWorkerData::uninitialized() || cumulative,
326 "Should not be set yet: %s", ShenandoahPhaseTimings::phase_name(_timings->worker_par_phase(_phase, _par_phase)));
327 _start_time = os::elapsedTime();
328 }
329
330 ShenandoahWorkerTimingsTracker::~ShenandoahWorkerTimingsTracker() {
331 _timings->worker_data(_phase, _par_phase)->set_or_add(_worker_id, os::elapsedTime() - _start_time);
332
333 if (ShenandoahPhaseTimings::is_root_work_phase(_phase)) {
334 ShenandoahPhaseTimings::Phase root_phase = _phase;
335 ShenandoahPhaseTimings::Phase cur_phase = _timings->worker_par_phase(root_phase, _par_phase);
336 _event.commit(GCId::current(), _worker_id, ShenandoahPhaseTimings::phase_name(cur_phase));
337 }
338 }