1 /* 2 * Copyright (c) 2017, 2021, Red Hat, Inc. All rights reserved. 3 * Copyright Amazon.com Inc. or its affiliates. All Rights Reserved. 4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 5 * 6 * This code is free software; you can redistribute it and/or modify it 7 * under the terms of the GNU General Public License version 2 only, as 8 * published by the Free Software Foundation. 9 * 10 * This code is distributed in the hope that it will be useful, but WITHOUT 11 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 12 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License 13 * version 2 for more details (a copy is included in the LICENSE file that 14 * accompanied this code). 15 * 16 * You should have received a copy of the GNU General Public License version 17 * 2 along with this work; if not, write to the Free Software Foundation, 18 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. 19 * 20 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA 21 * or visit www.oracle.com if you need additional information or have any 22 * questions. 23 * 24 */ 25 26 #include "precompiled.hpp" 27 28 #include "gc/shared/workerDataArray.inline.hpp" 29 #include "gc/shenandoah/shenandoahCollectorPolicy.hpp" 30 #include "gc/shenandoah/shenandoahPhaseTimings.hpp" 31 #include "gc/shenandoah/shenandoahHeap.inline.hpp" 32 #include "gc/shenandoah/shenandoahUtils.hpp" 33 #include "gc/shenandoah/heuristics/shenandoahHeuristics.hpp" 34 #include "runtime/orderAccess.hpp" 35 #include "utilities/ostream.hpp" 36 37 #define SHENANDOAH_PHASE_NAME_FORMAT "%-30s" 38 #define SHENANDOAH_S_TIME_FORMAT "%8.3lf" 39 #define SHENANDOAH_US_TIME_FORMAT "%8.0lf" 40 #define SHENANDOAH_US_WORKER_TIME_FORMAT "%3.0lf" 41 #define SHENANDOAH_US_WORKER_NOTIME_FORMAT "%3s" 42 #define SHENANDOAH_PARALLELISM_FORMAT "%4.2lf" 43 44 #define SHENANDOAH_PHASE_DECLARE_NAME(type, title) \ 45 title, 46 47 const char* ShenandoahPhaseTimings::_phase_names[] = { 48 SHENANDOAH_PHASE_DO(SHENANDOAH_PHASE_DECLARE_NAME) 49 }; 50 51 #undef SHENANDOAH_PHASE_DECLARE_NAME 52 53 ShenandoahPhaseTimings::ShenandoahPhaseTimings(uint max_workers) : 54 _max_workers(max_workers) { 55 assert(_max_workers > 0, "Must have some GC threads"); 56 57 // Initialize everything to sane defaults 58 for (uint i = 0; i < _num_phases; i++) { 59 #define SHENANDOAH_WORKER_DATA_NULL(type, title) \ 60 _worker_data[i] = nullptr; 61 SHENANDOAH_PAR_PHASE_DO(,, SHENANDOAH_WORKER_DATA_NULL) 62 #undef SHENANDOAH_WORKER_DATA_NULL 63 _cycle_data[i] = uninitialized(); 64 } 65 66 // Then punch in the worker-related data. 67 // Every worker phase get a bunch of internal objects, except 68 // the very first slot, which is "<total>" and is not populated. 69 for (uint i = 0; i < _num_phases; i++) { 70 if (is_worker_phase(Phase(i))) { 71 int c = 0; 72 #define SHENANDOAH_WORKER_DATA_INIT(type, title) \ 73 if (c++ != 0) _worker_data[i + c] = new ShenandoahWorkerData(nullptr, title, _max_workers); 74 SHENANDOAH_PAR_PHASE_DO(,, SHENANDOAH_WORKER_DATA_INIT) 75 #undef SHENANDOAH_WORKER_DATA_INIT 76 } 77 } 78 79 _policy = ShenandoahHeap::heap()->shenandoah_policy(); 80 assert(_policy != nullptr, "Can not be null"); 81 } 82 83 ShenandoahPhaseTimings::Phase ShenandoahPhaseTimings::worker_par_phase(Phase phase, ParPhase par_phase) { 84 assert(is_worker_phase(phase), "Phase should accept worker phase times: %s", phase_name(phase)); 85 Phase p = Phase(phase + 1 + par_phase); 86 assert(p >= 0 && p < _num_phases, "Out of bound for: %s", phase_name(phase)); 87 return p; 88 } 89 90 ShenandoahWorkerData* ShenandoahPhaseTimings::worker_data(Phase phase, ParPhase par_phase) { 91 Phase p = worker_par_phase(phase, par_phase); 92 ShenandoahWorkerData* wd = _worker_data[p]; 93 assert(wd != nullptr, "Counter initialized: %s", phase_name(p)); 94 return wd; 95 } 96 97 bool ShenandoahPhaseTimings::is_worker_phase(Phase phase) { 98 assert(phase >= 0 && phase < _num_phases, "Out of bounds"); 99 switch (phase) { 100 case init_evac: 101 case init_scan_rset: 102 case finish_mark: 103 case purge_weak_par: 104 case full_gc_mark: 105 case full_gc_update_roots: 106 case full_gc_adjust_roots: 107 case degen_gc_stw_mark: 108 case degen_gc_mark: 109 case degen_gc_update_roots: 110 case full_gc_weakrefs: 111 case full_gc_purge_class_unload: 112 case full_gc_purge_weak_par: 113 case degen_gc_coalesce_and_fill: 114 case degen_gc_weakrefs: 115 case degen_gc_purge_class_unload: 116 case degen_gc_purge_weak_par: 117 case heap_iteration_roots: 118 case conc_mark: 119 case conc_mark_roots: 120 case conc_thread_roots: 121 case conc_weak_roots_work: 122 case conc_weak_refs: 123 case conc_strong_roots: 124 case conc_coalesce_and_fill: 125 case promote_in_place: 126 return true; 127 default: 128 return false; 129 } 130 } 131 132 bool ShenandoahPhaseTimings::is_root_work_phase(Phase phase) { 133 switch (phase) { 134 case finish_mark: 135 case init_evac: 136 case degen_gc_update_roots: 137 case full_gc_mark: 138 case full_gc_update_roots: 139 case full_gc_adjust_roots: 140 return true; 141 default: 142 return false; 143 } 144 } 145 146 void ShenandoahPhaseTimings::set_cycle_data(Phase phase, double time, bool should_aggregate) { 147 const double cycle_data = _cycle_data[phase]; 148 if (should_aggregate) { 149 _cycle_data[phase] = (cycle_data == uninitialized()) ? time : (cycle_data + time); 150 } else { 151 #ifdef ASSERT 152 assert(cycle_data == uninitialized(), "Should not be set yet: %s, current value: %lf", phase_name(phase), cycle_data); 153 #endif 154 _cycle_data[phase] = time; 155 } 156 } 157 158 void ShenandoahPhaseTimings::record_phase_time(Phase phase, double time, bool should_aggregate) { 159 if (!_policy->is_at_shutdown()) { 160 set_cycle_data(phase, time, should_aggregate); 161 } 162 } 163 164 void ShenandoahPhaseTimings::record_workers_start(Phase phase) { 165 assert(is_worker_phase(phase), "Phase should accept worker phase times: %s", phase_name(phase)); 166 167 // Special case: these phases can enter multiple times, need to reset 168 // their worker data every time. 169 if (phase == heap_iteration_roots) { 170 for (uint i = 1; i < _num_par_phases; i++) { 171 worker_data(phase, ParPhase(i))->reset(); 172 } 173 } 174 175 #ifdef ASSERT 176 for (uint i = 1; i < _num_par_phases; i++) { 177 ShenandoahWorkerData* wd = worker_data(phase, ParPhase(i)); 178 for (uint c = 0; c < _max_workers; c++) { 179 assert(wd->get(c) == ShenandoahWorkerData::uninitialized(), 180 "Should not be set: %s", phase_name(worker_par_phase(phase, ParPhase(i)))); 181 } 182 } 183 #endif 184 } 185 186 void ShenandoahPhaseTimings::record_workers_end(Phase phase) { 187 assert(is_worker_phase(phase), "Phase should accept worker phase times: %s", phase_name(phase)); 188 } 189 190 void ShenandoahPhaseTimings::flush_par_workers_to_cycle() { 191 for (uint pi = 0; pi < _num_phases; pi++) { 192 Phase phase = Phase(pi); 193 if (is_worker_phase(phase)) { 194 double s = uninitialized(); 195 for (uint i = 1; i < _num_par_phases; i++) { 196 ShenandoahWorkerData* wd = worker_data(phase, ParPhase(i)); 197 double ws = uninitialized(); 198 for (uint c = 0; c < _max_workers; c++) { 199 double v = wd->get(c); 200 if (v != ShenandoahWorkerData::uninitialized()) { 201 if (ws == uninitialized()) { 202 ws = v; 203 } else { 204 ws += v; 205 } 206 } 207 } 208 if (ws != uninitialized()) { 209 // add to each line in phase 210 set_cycle_data(Phase(phase + i + 1), ws); 211 if (s == uninitialized()) { 212 s = ws; 213 } else { 214 s += ws; 215 } 216 } 217 } 218 if (s != uninitialized()) { 219 // add to total for phase 220 set_cycle_data(Phase(phase + 1), s); 221 } 222 } 223 } 224 } 225 226 void ShenandoahPhaseTimings::flush_cycle_to_global() { 227 for (uint i = 0; i < _num_phases; i++) { 228 if (_cycle_data[i] != uninitialized()) { 229 _global_data[i].add(_cycle_data[i]); 230 _cycle_data[i] = uninitialized(); 231 } 232 if (_worker_data[i] != nullptr) { 233 _worker_data[i]->reset(); 234 } 235 } 236 OrderAccess::fence(); 237 } 238 239 void ShenandoahPhaseTimings::print_cycle_on(outputStream* out) const { 240 out->cr(); 241 out->print_cr("All times are wall-clock times, except per-root-class counters, that are sum over"); 242 out->print_cr("all workers. Dividing the <total> over the root stage time estimates parallelism."); 243 out->cr(); 244 for (uint i = 0; i < _num_phases; i++) { 245 double v = _cycle_data[i] * 1000000.0; 246 if (v > 0) { 247 out->print(SHENANDOAH_PHASE_NAME_FORMAT " " SHENANDOAH_US_TIME_FORMAT " us", _phase_names[i], v); 248 249 if (is_worker_phase(Phase(i))) { 250 double total = _cycle_data[i + 1] * 1000000.0; 251 if (total > 0) { 252 out->print(", parallelism: " SHENANDOAH_PARALLELISM_FORMAT "x", total / v); 253 } 254 } 255 256 if (_worker_data[i] != nullptr) { 257 out->print(", workers (us): "); 258 for (uint c = 0; c < _max_workers; c++) { 259 double tv = _worker_data[i]->get(c); 260 if (tv != ShenandoahWorkerData::uninitialized()) { 261 out->print(SHENANDOAH_US_WORKER_TIME_FORMAT ", ", tv * 1000000.0); 262 } else { 263 out->print(SHENANDOAH_US_WORKER_NOTIME_FORMAT ", ", "---"); 264 } 265 } 266 } 267 out->cr(); 268 } 269 } 270 } 271 272 void ShenandoahPhaseTimings::print_global_on(outputStream* out) const { 273 out->cr(); 274 out->print_cr("GC STATISTICS:"); 275 out->print_cr(" \"(G)\" (gross) pauses include VM time: time to notify and block threads, do the pre-"); 276 out->print_cr(" and post-safepoint housekeeping. Use -Xlog:safepoint+stats to dissect."); 277 out->print_cr(" \"(N)\" (net) pauses are the times spent in the actual GC code."); 278 out->print_cr(" \"a\" is average time for each phase, look at levels to see if average makes sense."); 279 out->print_cr(" \"lvls\" are quantiles: 0%% (minimum), 25%%, 50%% (median), 75%%, 100%% (maximum)."); 280 out->cr(); 281 out->print_cr(" All times are wall-clock times, except per-root-class counters, that are sum over"); 282 out->print_cr(" all workers. Dividing the <total> over the root stage time estimates parallelism."); 283 out->cr(); 284 285 out->print_cr(" Pacing delays are measured from entering the pacing code till exiting it. Therefore,"); 286 out->print_cr(" observed pacing delays may be higher than the threshold when paced thread spent more"); 287 out->print_cr(" time in the pacing code. It usually happens when thread is de-scheduled while paced,"); 288 out->print_cr(" OS takes longer to unblock the thread, or JVM experiences an STW pause."); 289 out->cr(); 290 out->print_cr(" Higher delay would prevent application outpacing the GC, but it will hide the GC latencies"); 291 out->print_cr(" from the STW pause times. Pacing affects the individual threads, and so it would also be"); 292 out->print_cr(" invisible to the usual profiling tools, but would add up to end-to-end application latency."); 293 out->print_cr(" Raise max pacing delay with care."); 294 out->cr(); 295 296 for (uint i = 0; i < _num_phases; i++) { 297 if (_global_data[i].maximum() != 0) { 298 out->print_cr(SHENANDOAH_PHASE_NAME_FORMAT " = " SHENANDOAH_S_TIME_FORMAT " s " 299 "(a = " SHENANDOAH_US_TIME_FORMAT " us) " 300 "(n = " INT32_FORMAT_W(5) ") (lvls, us = " 301 SHENANDOAH_US_TIME_FORMAT ", " 302 SHENANDOAH_US_TIME_FORMAT ", " 303 SHENANDOAH_US_TIME_FORMAT ", " 304 SHENANDOAH_US_TIME_FORMAT ", " 305 SHENANDOAH_US_TIME_FORMAT ")", 306 _phase_names[i], 307 _global_data[i].sum(), 308 _global_data[i].avg() * 1000000.0, 309 _global_data[i].num(), 310 _global_data[i].percentile(0) * 1000000.0, 311 _global_data[i].percentile(25) * 1000000.0, 312 _global_data[i].percentile(50) * 1000000.0, 313 _global_data[i].percentile(75) * 1000000.0, 314 _global_data[i].maximum() * 1000000.0 315 ); 316 } 317 } 318 } 319 320 ShenandoahWorkerTimingsTracker::ShenandoahWorkerTimingsTracker(ShenandoahPhaseTimings::Phase phase, 321 ShenandoahPhaseTimings::ParPhase par_phase, uint worker_id, bool cumulative) : 322 _timings(ShenandoahHeap::heap()->phase_timings()), 323 _phase(phase), _par_phase(par_phase), _worker_id(worker_id) { 324 325 assert(_timings->worker_data(_phase, _par_phase)->get(_worker_id) == ShenandoahWorkerData::uninitialized() || cumulative, 326 "Should not be set yet: %s", ShenandoahPhaseTimings::phase_name(_timings->worker_par_phase(_phase, _par_phase))); 327 _start_time = os::elapsedTime(); 328 } 329 330 ShenandoahWorkerTimingsTracker::~ShenandoahWorkerTimingsTracker() { 331 _timings->worker_data(_phase, _par_phase)->set_or_add(_worker_id, os::elapsedTime() - _start_time); 332 333 if (ShenandoahPhaseTimings::is_root_work_phase(_phase)) { 334 ShenandoahPhaseTimings::Phase root_phase = _phase; 335 ShenandoahPhaseTimings::Phase cur_phase = _timings->worker_par_phase(root_phase, _par_phase); 336 _event.commit(GCId::current(), _worker_id, ShenandoahPhaseTimings::phase_name(cur_phase)); 337 } 338 }