comparison src/share/vm/gc_implementation/g1/g1GCPhaseTimes.cpp @ 6219:922993931b3d

7178361: G1: Make sure that PrintGC and PrintGCDetails use the same timing for the GC pause Summary: Also reviewed by: vitalyd@gmail.com. Move the timing out of G1CollectorPolicy into the G1GCPhaseTimes class Reviewed-by: johnc
author brutisso
date Wed, 11 Jul 2012 22:47:38 +0200
parents
children bb3f6194fedb
comparison
equal deleted inserted replaced
6196:3759236eea14 6219:922993931b3d
1 /*
2 * Copyright (c) 2012, Oracle and/or its affiliates. All rights reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation.
8 *
9 * This code is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
12 * version 2 for more details (a copy is included in the LICENSE file that
13 * accompanied this code).
14 *
15 * You should have received a copy of the GNU General Public License version
16 * 2 along with this work; if not, write to the Free Software Foundation,
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18 *
19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
20 * or visit www.oracle.com if you need additional information or have any
21 * questions.
22 *
23 */
24
25
26 #include "precompiled.hpp"
27 #include "gc_implementation/g1/g1CollectedHeap.inline.hpp"
28 #include "gc_implementation/g1/g1GCPhaseTimes.hpp"
29 #include "gc_implementation/g1/g1Log.hpp"
30
31 // Helper class for avoiding interleaved logging
32 class LineBuffer: public StackObj {
33
34 private:
35 static const int BUFFER_LEN = 1024;
36 static const int INDENT_CHARS = 3;
37 char _buffer[BUFFER_LEN];
38 int _indent_level;
39 int _cur;
40
41 void vappend(const char* format, va_list ap) {
42 int res = vsnprintf(&_buffer[_cur], BUFFER_LEN - _cur, format, ap);
43 if (res != -1) {
44 _cur += res;
45 } else {
46 DEBUG_ONLY(warning("buffer too small in LineBuffer");)
47 _buffer[BUFFER_LEN -1] = 0;
48 _cur = BUFFER_LEN; // vsnprintf above should not add to _buffer if we are called again
49 }
50 }
51
52 public:
53 explicit LineBuffer(int indent_level): _indent_level(indent_level), _cur(0) {
54 for (; (_cur < BUFFER_LEN && _cur < (_indent_level * INDENT_CHARS)); _cur++) {
55 _buffer[_cur] = ' ';
56 }
57 }
58
59 #ifndef PRODUCT
60 ~LineBuffer() {
61 assert(_cur == _indent_level * INDENT_CHARS, "pending data in buffer - append_and_print_cr() not called?");
62 }
63 #endif
64
65 void append(const char* format, ...) {
66 va_list ap;
67 va_start(ap, format);
68 vappend(format, ap);
69 va_end(ap);
70 }
71
72 void append_and_print_cr(const char* format, ...) {
73 va_list ap;
74 va_start(ap, format);
75 vappend(format, ap);
76 va_end(ap);
77 gclog_or_tty->print_cr("%s", _buffer);
78 _cur = _indent_level * INDENT_CHARS;
79 }
80 };
81
82 G1GCPhaseTimes::G1GCPhaseTimes(uint max_gc_threads) :
83 _max_gc_threads(max_gc_threads),
84 _min_clear_cc_time_ms(-1.0),
85 _max_clear_cc_time_ms(-1.0),
86 _cur_clear_cc_time_ms(0.0),
87 _cum_clear_cc_time_ms(0.0),
88 _num_cc_clears(0L)
89 {
90 assert(max_gc_threads > 0, "Must have some GC threads");
91 _par_last_gc_worker_start_times_ms = new double[_max_gc_threads];
92 _par_last_ext_root_scan_times_ms = new double[_max_gc_threads];
93 _par_last_satb_filtering_times_ms = new double[_max_gc_threads];
94 _par_last_update_rs_times_ms = new double[_max_gc_threads];
95 _par_last_update_rs_processed_buffers = new double[_max_gc_threads];
96 _par_last_scan_rs_times_ms = new double[_max_gc_threads];
97 _par_last_obj_copy_times_ms = new double[_max_gc_threads];
98 _par_last_termination_times_ms = new double[_max_gc_threads];
99 _par_last_termination_attempts = new double[_max_gc_threads];
100 _par_last_gc_worker_end_times_ms = new double[_max_gc_threads];
101 _par_last_gc_worker_times_ms = new double[_max_gc_threads];
102 _par_last_gc_worker_other_times_ms = new double[_max_gc_threads];
103 }
104
105 void G1GCPhaseTimes::note_gc_start(double pause_start_time_sec, uint active_gc_threads,
106 bool is_young_gc, bool is_initial_mark_gc, GCCause::Cause gc_cause) {
107 assert(active_gc_threads > 0, "The number of threads must be > 0");
108 assert(active_gc_threads <= _max_gc_threads, "The number of active threads must be <= the max nubmer of threads");
109 _active_gc_threads = active_gc_threads;
110 _pause_start_time_sec = pause_start_time_sec;
111 _is_young_gc = is_young_gc;
112 _is_initial_mark_gc = is_initial_mark_gc;
113 _gc_cause = gc_cause;
114
115 #ifdef ASSERT
116 // initialise the timing data to something well known so that we can spot
117 // if something is not set properly
118
119 for (uint i = 0; i < _max_gc_threads; ++i) {
120 _par_last_gc_worker_start_times_ms[i] = -1234.0;
121 _par_last_ext_root_scan_times_ms[i] = -1234.0;
122 _par_last_satb_filtering_times_ms[i] = -1234.0;
123 _par_last_update_rs_times_ms[i] = -1234.0;
124 _par_last_update_rs_processed_buffers[i] = -1234.0;
125 _par_last_scan_rs_times_ms[i] = -1234.0;
126 _par_last_obj_copy_times_ms[i] = -1234.0;
127 _par_last_termination_times_ms[i] = -1234.0;
128 _par_last_termination_attempts[i] = -1234.0;
129 _par_last_gc_worker_end_times_ms[i] = -1234.0;
130 _par_last_gc_worker_times_ms[i] = -1234.0;
131 _par_last_gc_worker_other_times_ms[i] = -1234.0;
132 }
133 #endif
134 }
135
136 void G1GCPhaseTimes::note_gc_end(double pause_end_time_sec) {
137 if (G1Log::fine()) {
138 double pause_time_ms = (pause_end_time_sec - _pause_start_time_sec) * MILLIUNITS;
139
140 for (uint i = 0; i < _active_gc_threads; i++) {
141 _par_last_gc_worker_times_ms[i] = _par_last_gc_worker_end_times_ms[i] -
142 _par_last_gc_worker_start_times_ms[i];
143
144 double worker_known_time = _par_last_ext_root_scan_times_ms[i] +
145 _par_last_satb_filtering_times_ms[i] +
146 _par_last_update_rs_times_ms[i] +
147 _par_last_scan_rs_times_ms[i] +
148 _par_last_obj_copy_times_ms[i] +
149 _par_last_termination_times_ms[i];
150
151 _par_last_gc_worker_other_times_ms[i] = _par_last_gc_worker_times_ms[i] -
152 worker_known_time;
153 }
154
155 print(pause_time_ms);
156 }
157
158 }
159
160 void G1GCPhaseTimes::print_par_stats(int level,
161 const char* str,
162 double* data,
163 bool showDecimals) {
164 double min = data[0], max = data[0];
165 double total = 0.0;
166 LineBuffer buf(level);
167 buf.append("[%s (ms):", str);
168 for (uint i = 0; i < _active_gc_threads; ++i) {
169 double val = data[i];
170 if (val < min)
171 min = val;
172 if (val > max)
173 max = val;
174 total += val;
175 if (G1Log::finest()) {
176 if (showDecimals) {
177 buf.append(" %.1lf", val);
178 } else {
179 buf.append(" %d", (int)val);
180 }
181 }
182 }
183
184 if (G1Log::finest()) {
185 buf.append_and_print_cr("");
186 }
187 double avg = total / (double) _active_gc_threads;
188 if (showDecimals) {
189 buf.append_and_print_cr(" Min: %.1lf, Avg: %.1lf, Max: %.1lf, Diff: %.1lf, Sum: %.1lf]",
190 min, avg, max, max - min, total);
191 } else {
192 buf.append_and_print_cr(" Min: %d, Avg: %d, Max: %d, Diff: %d, Sum: %d]",
193 (int)min, (int)avg, (int)max, (int)max - (int)min, (int)total);
194 }
195 }
196
197 void G1GCPhaseTimes::print_stats(int level, const char* str, double value) {
198 LineBuffer(level).append_and_print_cr("[%s: %.1lf ms]", str, value);
199 }
200
201 void G1GCPhaseTimes::print_stats(int level, const char* str, double value, int workers) {
202 LineBuffer(level).append_and_print_cr("[%s: %.1lf ms, GC Workers: %d]", str, value, workers);
203 }
204
205 void G1GCPhaseTimes::print_stats(int level, const char* str, int value) {
206 LineBuffer(level).append_and_print_cr("[%s: %d]", str, value);
207 }
208
209 double G1GCPhaseTimes::avg_value(double* data) {
210 if (G1CollectedHeap::use_parallel_gc_threads()) {
211 double ret = 0.0;
212 for (uint i = 0; i < _active_gc_threads; ++i) {
213 ret += data[i];
214 }
215 return ret / (double) _active_gc_threads;
216 } else {
217 return data[0];
218 }
219 }
220
221 double G1GCPhaseTimes::max_value(double* data) {
222 if (G1CollectedHeap::use_parallel_gc_threads()) {
223 double ret = data[0];
224 for (uint i = 1; i < _active_gc_threads; ++i) {
225 if (data[i] > ret) {
226 ret = data[i];
227 }
228 }
229 return ret;
230 } else {
231 return data[0];
232 }
233 }
234
235 double G1GCPhaseTimes::sum_of_values(double* data) {
236 if (G1CollectedHeap::use_parallel_gc_threads()) {
237 double sum = 0.0;
238 for (uint i = 0; i < _active_gc_threads; i++) {
239 sum += data[i];
240 }
241 return sum;
242 } else {
243 return data[0];
244 }
245 }
246
247 double G1GCPhaseTimes::max_sum(double* data1, double* data2) {
248 double ret = data1[0] + data2[0];
249
250 if (G1CollectedHeap::use_parallel_gc_threads()) {
251 for (uint i = 1; i < _active_gc_threads; ++i) {
252 double data = data1[i] + data2[i];
253 if (data > ret) {
254 ret = data;
255 }
256 }
257 }
258 return ret;
259 }
260
261 void G1GCPhaseTimes::collapse_par_times() {
262 _ext_root_scan_time = avg_value(_par_last_ext_root_scan_times_ms);
263 _satb_filtering_time = avg_value(_par_last_satb_filtering_times_ms);
264 _update_rs_time = avg_value(_par_last_update_rs_times_ms);
265 _update_rs_processed_buffers =
266 sum_of_values(_par_last_update_rs_processed_buffers);
267 _scan_rs_time = avg_value(_par_last_scan_rs_times_ms);
268 _obj_copy_time = avg_value(_par_last_obj_copy_times_ms);
269 _termination_time = avg_value(_par_last_termination_times_ms);
270 }
271
272 double G1GCPhaseTimes::accounted_time_ms() {
273 // Subtract the root region scanning wait time. It's initialized to
274 // zero at the start of the pause.
275 double misc_time_ms = _root_region_scan_wait_time_ms;
276
277 misc_time_ms += _cur_collection_par_time_ms;
278
279 // Now subtract the time taken to fix up roots in generated code
280 misc_time_ms += _cur_collection_code_root_fixup_time_ms;
281
282 // Subtract the time taken to clean the card table from the
283 // current value of "other time"
284 misc_time_ms += _cur_clear_ct_time_ms;
285
286 return misc_time_ms;
287 }
288
289 void G1GCPhaseTimes::print(double pause_time_ms) {
290
291 if (PrintGCTimeStamps) {
292 gclog_or_tty->stamp();
293 gclog_or_tty->print(": ");
294 }
295
296 GCCauseString gc_cause_str = GCCauseString("GC pause", _gc_cause)
297 .append(_is_young_gc ? " (young)" : " (mixed)")
298 .append(_is_initial_mark_gc ? " (initial-mark)" : "");
299 gclog_or_tty->print_cr("[%s, %3.7f secs]", (const char*)gc_cause_str, pause_time_ms / 1000.0);
300
301 if (!G1Log::finer()) {
302 return;
303 }
304
305 if (_root_region_scan_wait_time_ms > 0.0) {
306 print_stats(1, "Root Region Scan Waiting", _root_region_scan_wait_time_ms);
307 }
308 if (G1CollectedHeap::use_parallel_gc_threads()) {
309 print_stats(1, "Parallel Time", _cur_collection_par_time_ms, _active_gc_threads);
310 print_par_stats(2, "GC Worker Start", _par_last_gc_worker_start_times_ms);
311 print_par_stats(2, "Ext Root Scanning", _par_last_ext_root_scan_times_ms);
312 if (_satb_filtering_time > 0.0) {
313 print_par_stats(2, "SATB Filtering", _par_last_satb_filtering_times_ms);
314 }
315 print_par_stats(2, "Update RS", _par_last_update_rs_times_ms);
316 if (G1Log::finest()) {
317 print_par_stats(3, "Processed Buffers", _par_last_update_rs_processed_buffers,
318 false /* showDecimals */);
319 }
320 print_par_stats(2, "Scan RS", _par_last_scan_rs_times_ms);
321 print_par_stats(2, "Object Copy", _par_last_obj_copy_times_ms);
322 print_par_stats(2, "Termination", _par_last_termination_times_ms);
323 if (G1Log::finest()) {
324 print_par_stats(3, "Termination Attempts", _par_last_termination_attempts,
325 false /* showDecimals */);
326 }
327 print_par_stats(2, "GC Worker Other", _par_last_gc_worker_other_times_ms);
328 print_par_stats(2, "GC Worker Total", _par_last_gc_worker_times_ms);
329 print_par_stats(2, "GC Worker End", _par_last_gc_worker_end_times_ms);
330 } else {
331 print_stats(1, "Ext Root Scanning", _ext_root_scan_time);
332 if (_satb_filtering_time > 0.0) {
333 print_stats(1, "SATB Filtering", _satb_filtering_time);
334 }
335 print_stats(1, "Update RS", _update_rs_time);
336 if (G1Log::finest()) {
337 print_stats(2, "Processed Buffers", (int)_update_rs_processed_buffers);
338 }
339 print_stats(1, "Scan RS", _scan_rs_time);
340 print_stats(1, "Object Copying", _obj_copy_time);
341 }
342 print_stats(1, "Code Root Fixup", _cur_collection_code_root_fixup_time_ms);
343 print_stats(1, "Clear CT", _cur_clear_ct_time_ms);
344 if (Verbose && G1Log::finest()) {
345 print_stats(1, "Cur Clear CC", _cur_clear_cc_time_ms);
346 print_stats(1, "Cum Clear CC", _cum_clear_cc_time_ms);
347 print_stats(1, "Min Clear CC", _min_clear_cc_time_ms);
348 print_stats(1, "Max Clear CC", _max_clear_cc_time_ms);
349 if (_num_cc_clears > 0) {
350 print_stats(1, "Avg Clear CC", _cum_clear_cc_time_ms / ((double)_num_cc_clears));
351 }
352 }
353 double misc_time_ms = pause_time_ms - accounted_time_ms();
354 print_stats(1, "Other", misc_time_ms);
355 print_stats(2, "Choose CSet",
356 (_recorded_young_cset_choice_time_ms +
357 _recorded_non_young_cset_choice_time_ms));
358 print_stats(2, "Ref Proc", _cur_ref_proc_time_ms);
359 print_stats(2, "Ref Enq", _cur_ref_enq_time_ms);
360 print_stats(2, "Free CSet",
361 (_recorded_young_free_cset_time_ms +
362 _recorded_non_young_free_cset_time_ms));
363 }
364
365 void G1GCPhaseTimes::record_cc_clear_time_ms(double ms) {
366 if (!(Verbose && G1Log::finest())) {
367 return;
368 }
369
370 if (_min_clear_cc_time_ms < 0.0 || ms <= _min_clear_cc_time_ms) {
371 _min_clear_cc_time_ms = ms;
372 }
373 if (_max_clear_cc_time_ms < 0.0 || ms >= _max_clear_cc_time_ms) {
374 _max_clear_cc_time_ms = ms;
375 }
376 _cur_clear_cc_time_ms = ms;
377 _cum_clear_cc_time_ms += ms;
378 _num_cc_clears++;
379 }