brutisso@3923: /* tschatzl@6402: * Copyright (c) 2013, 2014 Oracle and/or its affiliates. All rights reserved. brutisso@3923: * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. brutisso@3923: * brutisso@3923: * This code is free software; you can redistribute it and/or modify it brutisso@3923: * under the terms of the GNU General Public License version 2 only, as brutisso@3923: * published by the Free Software Foundation. brutisso@3923: * brutisso@3923: * This code is distributed in the hope that it will be useful, but WITHOUT brutisso@3923: * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or brutisso@3923: * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License brutisso@3923: * version 2 for more details (a copy is included in the LICENSE file that brutisso@3923: * accompanied this code). brutisso@3923: * brutisso@3923: * You should have received a copy of the GNU General Public License version brutisso@3923: * 2 along with this work; if not, write to the Free Software Foundation, brutisso@3923: * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. brutisso@3923: * brutisso@3923: * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA brutisso@3923: * or visit www.oracle.com if you need additional information or have any brutisso@3923: * questions. brutisso@3923: * brutisso@3923: */ brutisso@3923: brutisso@3923: brutisso@3923: #include "precompiled.hpp" brutisso@3923: #include "gc_implementation/g1/g1CollectedHeap.inline.hpp" brutisso@3923: #include "gc_implementation/g1/g1GCPhaseTimes.hpp" brutisso@3923: #include "gc_implementation/g1/g1Log.hpp" pliden@6413: #include "gc_implementation/g1/g1StringDedup.hpp" brutisso@3923: brutisso@3923: // Helper class for avoiding interleaved logging brutisso@3923: class LineBuffer: public StackObj { brutisso@3923: brutisso@3923: private: brutisso@3923: static const int BUFFER_LEN = 1024; brutisso@3923: static const int INDENT_CHARS = 3; brutisso@3923: char _buffer[BUFFER_LEN]; brutisso@3923: int _indent_level; brutisso@3923: int _cur; brutisso@3923: brutisso@3923: void vappend(const char* format, va_list ap) { brutisso@3923: int res = vsnprintf(&_buffer[_cur], BUFFER_LEN - _cur, format, ap); brutisso@3923: if (res != -1) { brutisso@3923: _cur += res; brutisso@3923: } else { brutisso@3923: DEBUG_ONLY(warning("buffer too small in LineBuffer");) brutisso@3923: _buffer[BUFFER_LEN -1] = 0; brutisso@3923: _cur = BUFFER_LEN; // vsnprintf above should not add to _buffer if we are called again brutisso@3923: } brutisso@3923: } brutisso@3923: brutisso@3923: public: brutisso@3923: explicit LineBuffer(int indent_level): _indent_level(indent_level), _cur(0) { brutisso@3923: for (; (_cur < BUFFER_LEN && _cur < (_indent_level * INDENT_CHARS)); _cur++) { brutisso@3923: _buffer[_cur] = ' '; brutisso@3923: } brutisso@3923: } brutisso@3923: brutisso@3923: #ifndef PRODUCT brutisso@3923: ~LineBuffer() { brutisso@3923: assert(_cur == _indent_level * INDENT_CHARS, "pending data in buffer - append_and_print_cr() not called?"); brutisso@3923: } brutisso@3923: #endif brutisso@3923: brutisso@3923: void append(const char* format, ...) { brutisso@3923: va_list ap; brutisso@3923: va_start(ap, format); brutisso@3923: vappend(format, ap); brutisso@3923: va_end(ap); brutisso@3923: } brutisso@3923: brutisso@3923: void append_and_print_cr(const char* format, ...) { brutisso@3923: va_list ap; brutisso@3923: va_start(ap, format); brutisso@3923: vappend(format, ap); brutisso@3923: va_end(ap); brutisso@3923: gclog_or_tty->print_cr("%s", _buffer); brutisso@3923: _cur = _indent_level * INDENT_CHARS; brutisso@3923: } brutisso@3923: }; brutisso@3923: brutisso@4015: template brutisso@4015: void WorkerDataArray::print(int level, const char* title) { brutisso@4015: if (_length == 1) { brutisso@4015: // No need for min, max, average and sum for only one worker brutisso@4015: LineBuffer buf(level); brutisso@4015: buf.append("[%s: ", title); brutisso@4015: buf.append(_print_format, _data[0]); brutisso@4015: buf.append_and_print_cr("]"); brutisso@4015: return; brutisso@4015: } brutisso@4015: brutisso@4015: T min = _data[0]; brutisso@4015: T max = _data[0]; brutisso@4015: T sum = 0; brutisso@4015: brutisso@4015: LineBuffer buf(level); brutisso@4015: buf.append("[%s:", title); brutisso@4015: for (uint i = 0; i < _length; ++i) { brutisso@4015: T val = _data[i]; brutisso@4015: min = MIN2(val, min); brutisso@4015: max = MAX2(val, max); brutisso@4015: sum += val; brutisso@4015: if (G1Log::finest()) { brutisso@4015: buf.append(" "); brutisso@4015: buf.append(_print_format, val); brutisso@4015: } brutisso@4015: } brutisso@4015: brutisso@4015: if (G1Log::finest()) { brutisso@4015: buf.append_and_print_cr(""); brutisso@4015: } brutisso@4015: brutisso@4015: double avg = (double)sum / (double)_length; brutisso@4015: buf.append(" Min: "); brutisso@4015: buf.append(_print_format, min); brutisso@4015: buf.append(", Avg: "); brutisso@4015: buf.append("%.1lf", avg); // Always print average as a double brutisso@4015: buf.append(", Max: "); brutisso@4015: buf.append(_print_format, max); brutisso@4015: buf.append(", Diff: "); brutisso@4015: buf.append(_print_format, max - min); brutisso@4015: if (_print_sum) { brutisso@4015: // for things like the start and end times the sum is not brutisso@4015: // that relevant brutisso@4015: buf.append(", Sum: "); brutisso@4015: buf.append(_print_format, sum); brutisso@4015: } brutisso@4015: buf.append_and_print_cr("]"); brutisso@4015: } brutisso@4015: jmasa@4097: #ifndef PRODUCT brutisso@4015: brutisso@4475: template <> const int WorkerDataArray::_uninitialized = -1; brutisso@4475: template <> const double WorkerDataArray::_uninitialized = -1.0; brutisso@4475: template <> const size_t WorkerDataArray::_uninitialized = (size_t)-1; brutisso@4475: brutisso@4015: template brutisso@4015: void WorkerDataArray::reset() { brutisso@4015: for (uint i = 0; i < _length; i++) { brutisso@4475: _data[i] = (T)_uninitialized; brutisso@4015: } brutisso@4015: } brutisso@4015: brutisso@4015: template brutisso@4015: void WorkerDataArray::verify() { brutisso@4015: for (uint i = 0; i < _length; i++) { brutisso@4475: assert(_data[i] != _uninitialized, brutisso@4475: err_msg("Invalid data for worker " UINT32_FORMAT ", data: %lf, uninitialized: %lf", brutisso@4475: i, (double)_data[i], (double)_uninitialized)); brutisso@4015: } brutisso@4015: } brutisso@4015: brutisso@4015: #endif brutisso@4015: brutisso@3923: G1GCPhaseTimes::G1GCPhaseTimes(uint max_gc_threads) : brutisso@3923: _max_gc_threads(max_gc_threads), brutisso@4015: _last_gc_worker_start_times_ms(_max_gc_threads, "%.1lf", false), brutisso@4015: _last_ext_root_scan_times_ms(_max_gc_threads, "%.1lf"), brutisso@4015: _last_satb_filtering_times_ms(_max_gc_threads, "%.1lf"), brutisso@4015: _last_update_rs_times_ms(_max_gc_threads, "%.1lf"), brutisso@4015: _last_update_rs_processed_buffers(_max_gc_threads, "%d"), brutisso@4015: _last_scan_rs_times_ms(_max_gc_threads, "%.1lf"), johnc@5548: _last_strong_code_root_scan_times_ms(_max_gc_threads, "%.1lf"), johnc@5548: _last_strong_code_root_mark_times_ms(_max_gc_threads, "%.1lf"), brutisso@4015: _last_obj_copy_times_ms(_max_gc_threads, "%.1lf"), brutisso@4015: _last_termination_times_ms(_max_gc_threads, "%.1lf"), brutisso@4015: _last_termination_attempts(_max_gc_threads, SIZE_FORMAT), brutisso@4015: _last_gc_worker_end_times_ms(_max_gc_threads, "%.1lf", false), brutisso@4015: _last_gc_worker_times_ms(_max_gc_threads, "%.1lf"), pliden@6413: _last_gc_worker_other_times_ms(_max_gc_threads, "%.1lf"), pliden@6413: _cur_string_dedup_queue_fixup_worker_times_ms(_max_gc_threads, "%.1lf"), pliden@6413: _cur_string_dedup_table_fixup_worker_times_ms(_max_gc_threads, "%.1lf") brutisso@3923: { brutisso@3923: assert(max_gc_threads > 0, "Must have some GC threads"); brutisso@3923: } brutisso@3923: brutisso@4015: void G1GCPhaseTimes::note_gc_start(uint active_gc_threads) { brutisso@3923: assert(active_gc_threads > 0, "The number of threads must be > 0"); brutisso@3923: assert(active_gc_threads <= _max_gc_threads, "The number of active threads must be <= the max nubmer of threads"); brutisso@3923: _active_gc_threads = active_gc_threads; brutisso@3923: brutisso@4015: _last_gc_worker_start_times_ms.reset(); brutisso@4015: _last_ext_root_scan_times_ms.reset(); brutisso@4015: _last_satb_filtering_times_ms.reset(); brutisso@4015: _last_update_rs_times_ms.reset(); brutisso@4015: _last_update_rs_processed_buffers.reset(); brutisso@4015: _last_scan_rs_times_ms.reset(); johnc@5548: _last_strong_code_root_scan_times_ms.reset(); johnc@5548: _last_strong_code_root_mark_times_ms.reset(); brutisso@4015: _last_obj_copy_times_ms.reset(); brutisso@4015: _last_termination_times_ms.reset(); brutisso@4015: _last_termination_attempts.reset(); brutisso@4015: _last_gc_worker_end_times_ms.reset(); brutisso@4015: _last_gc_worker_times_ms.reset(); brutisso@4015: _last_gc_worker_other_times_ms.reset(); brutisso@3923: } brutisso@3923: brutisso@4015: void G1GCPhaseTimes::note_gc_end() { brutisso@4015: _last_gc_worker_start_times_ms.verify(); brutisso@4015: _last_ext_root_scan_times_ms.verify(); brutisso@4015: _last_satb_filtering_times_ms.verify(); brutisso@4015: _last_update_rs_times_ms.verify(); brutisso@4015: _last_update_rs_processed_buffers.verify(); brutisso@4015: _last_scan_rs_times_ms.verify(); johnc@5548: _last_strong_code_root_scan_times_ms.verify(); johnc@5548: _last_strong_code_root_mark_times_ms.verify(); brutisso@4015: _last_obj_copy_times_ms.verify(); brutisso@4015: _last_termination_times_ms.verify(); brutisso@4015: _last_termination_attempts.verify(); brutisso@4015: _last_gc_worker_end_times_ms.verify(); brutisso@3923: brutisso@4475: for (uint i = 0; i < _active_gc_threads; i++) { brutisso@4475: double worker_time = _last_gc_worker_end_times_ms.get(i) - _last_gc_worker_start_times_ms.get(i); brutisso@4475: _last_gc_worker_times_ms.set(i, worker_time); brutisso@3923: brutisso@4475: double worker_known_time = _last_ext_root_scan_times_ms.get(i) + johnc@5078: _last_satb_filtering_times_ms.get(i) + johnc@5078: _last_update_rs_times_ms.get(i) + johnc@5078: _last_scan_rs_times_ms.get(i) + johnc@5548: _last_strong_code_root_scan_times_ms.get(i) + johnc@5548: _last_strong_code_root_mark_times_ms.get(i) + johnc@5078: _last_obj_copy_times_ms.get(i) + johnc@5078: _last_termination_times_ms.get(i); brutisso@3923: brutisso@4475: double worker_other_time = worker_time - worker_known_time; brutisso@4475: _last_gc_worker_other_times_ms.set(i, worker_other_time); brutisso@4475: } brutisso@3923: brutisso@4015: _last_gc_worker_times_ms.verify(); brutisso@4015: _last_gc_worker_other_times_ms.verify(); brutisso@3923: } brutisso@3923: pliden@6413: void G1GCPhaseTimes::note_string_dedup_fixup_start() { pliden@6413: _cur_string_dedup_queue_fixup_worker_times_ms.reset(); pliden@6413: _cur_string_dedup_table_fixup_worker_times_ms.reset(); pliden@6413: } pliden@6413: pliden@6413: void G1GCPhaseTimes::note_string_dedup_fixup_end() { pliden@6413: _cur_string_dedup_queue_fixup_worker_times_ms.verify(); pliden@6413: _cur_string_dedup_table_fixup_worker_times_ms.verify(); pliden@6413: } pliden@6413: brutisso@3923: void G1GCPhaseTimes::print_stats(int level, const char* str, double value) { brutisso@3923: LineBuffer(level).append_and_print_cr("[%s: %.1lf ms]", str, value); brutisso@3923: } brutisso@3923: brutisso@3923: void G1GCPhaseTimes::print_stats(int level, const char* str, double value, int workers) { brutisso@3923: LineBuffer(level).append_and_print_cr("[%s: %.1lf ms, GC Workers: %d]", str, value, workers); brutisso@3923: } brutisso@3923: brutisso@3923: double G1GCPhaseTimes::accounted_time_ms() { brutisso@3923: // Subtract the root region scanning wait time. It's initialized to brutisso@3923: // zero at the start of the pause. brutisso@3923: double misc_time_ms = _root_region_scan_wait_time_ms; brutisso@3923: brutisso@3923: misc_time_ms += _cur_collection_par_time_ms; brutisso@3923: brutisso@3923: // Now subtract the time taken to fix up roots in generated code brutisso@3923: misc_time_ms += _cur_collection_code_root_fixup_time_ms; brutisso@3923: johnc@5548: // Strong code root migration time johnc@5548: misc_time_ms += _cur_strong_code_root_migration_time_ms; johnc@5548: tschatzl@6402: // Strong code root purge time tschatzl@6402: misc_time_ms += _cur_strong_code_root_purge_time_ms; tschatzl@6402: pliden@6413: if (G1StringDedup::is_enabled()) { pliden@6413: // String dedup fixup time pliden@6413: misc_time_ms += _cur_string_dedup_fixup_time_ms; pliden@6413: } pliden@6413: brutisso@3923: // Subtract the time taken to clean the card table from the brutisso@3923: // current value of "other time" brutisso@3923: misc_time_ms += _cur_clear_ct_time_ms; brutisso@3923: brutisso@3923: return misc_time_ms; brutisso@3923: } brutisso@3923: brutisso@4015: void G1GCPhaseTimes::print(double pause_time_sec) { brutisso@3923: if (_root_region_scan_wait_time_ms > 0.0) { brutisso@3923: print_stats(1, "Root Region Scan Waiting", _root_region_scan_wait_time_ms); brutisso@3923: } brutisso@3923: if (G1CollectedHeap::use_parallel_gc_threads()) { brutisso@3923: print_stats(1, "Parallel Time", _cur_collection_par_time_ms, _active_gc_threads); brutisso@4015: _last_gc_worker_start_times_ms.print(2, "GC Worker Start (ms)"); brutisso@4015: _last_ext_root_scan_times_ms.print(2, "Ext Root Scanning (ms)"); brutisso@4015: if (_last_satb_filtering_times_ms.sum() > 0.0) { brutisso@4015: _last_satb_filtering_times_ms.print(2, "SATB Filtering (ms)"); brutisso@3923: } johnc@5548: if (_last_strong_code_root_mark_times_ms.sum() > 0.0) { johnc@5548: _last_strong_code_root_mark_times_ms.print(2, "Code Root Marking (ms)"); johnc@5548: } brutisso@4015: _last_update_rs_times_ms.print(2, "Update RS (ms)"); brutisso@4015: _last_update_rs_processed_buffers.print(3, "Processed Buffers"); brutisso@4015: _last_scan_rs_times_ms.print(2, "Scan RS (ms)"); johnc@5548: _last_strong_code_root_scan_times_ms.print(2, "Code Root Scanning (ms)"); brutisso@4015: _last_obj_copy_times_ms.print(2, "Object Copy (ms)"); brutisso@4015: _last_termination_times_ms.print(2, "Termination (ms)"); brutisso@3923: if (G1Log::finest()) { brutisso@4015: _last_termination_attempts.print(3, "Termination Attempts"); brutisso@3923: } brutisso@4015: _last_gc_worker_other_times_ms.print(2, "GC Worker Other (ms)"); brutisso@4015: _last_gc_worker_times_ms.print(2, "GC Worker Total (ms)"); brutisso@4015: _last_gc_worker_end_times_ms.print(2, "GC Worker End (ms)"); brutisso@4015: } else { brutisso@4015: _last_ext_root_scan_times_ms.print(1, "Ext Root Scanning (ms)"); brutisso@4015: if (_last_satb_filtering_times_ms.sum() > 0.0) { brutisso@4015: _last_satb_filtering_times_ms.print(1, "SATB Filtering (ms)"); brutisso@3923: } johnc@5548: if (_last_strong_code_root_mark_times_ms.sum() > 0.0) { johnc@5548: _last_strong_code_root_mark_times_ms.print(1, "Code Root Marking (ms)"); johnc@5548: } brutisso@4015: _last_update_rs_times_ms.print(1, "Update RS (ms)"); brutisso@4015: _last_update_rs_processed_buffers.print(2, "Processed Buffers"); brutisso@4015: _last_scan_rs_times_ms.print(1, "Scan RS (ms)"); johnc@5548: _last_strong_code_root_scan_times_ms.print(1, "Code Root Scanning (ms)"); brutisso@4015: _last_obj_copy_times_ms.print(1, "Object Copy (ms)"); brutisso@3923: } brutisso@3923: print_stats(1, "Code Root Fixup", _cur_collection_code_root_fixup_time_ms); johnc@5548: print_stats(1, "Code Root Migration", _cur_strong_code_root_migration_time_ms); tschatzl@6402: print_stats(1, "Code Root Purge", _cur_strong_code_root_purge_time_ms); pliden@6413: if (G1StringDedup::is_enabled()) { pliden@6413: print_stats(1, "String Dedup Fixup", _cur_string_dedup_fixup_time_ms, _active_gc_threads); pliden@6413: _cur_string_dedup_queue_fixup_worker_times_ms.print(2, "Queue Fixup (ms)"); pliden@6413: _cur_string_dedup_table_fixup_worker_times_ms.print(2, "Table Fixup (ms)"); pliden@6413: } brutisso@3923: print_stats(1, "Clear CT", _cur_clear_ct_time_ms); brutisso@4015: double misc_time_ms = pause_time_sec * MILLIUNITS - accounted_time_ms(); brutisso@3923: print_stats(1, "Other", misc_time_ms); brutisso@4015: if (_cur_verify_before_time_ms > 0.0) { brutisso@4015: print_stats(2, "Verify Before", _cur_verify_before_time_ms); brutisso@4015: } tschatzl@6406: if (G1CollectedHeap::heap()->evacuation_failed()) { tschatzl@6406: double evac_fail_handling = _cur_evac_fail_recalc_used + _cur_evac_fail_remove_self_forwards + tschatzl@6406: _cur_evac_fail_restore_remsets; tschatzl@6406: print_stats(2, "Evacuation Failure", evac_fail_handling); tschatzl@6406: if (G1Log::finest()) { tschatzl@6406: print_stats(3, "Recalculate Used", _cur_evac_fail_recalc_used); tschatzl@6406: print_stats(3, "Remove Self Forwards", _cur_evac_fail_remove_self_forwards); tschatzl@6406: print_stats(3, "Restore RemSet", _cur_evac_fail_restore_remsets); tschatzl@6406: } tschatzl@6406: } brutisso@3923: print_stats(2, "Choose CSet", brutisso@3923: (_recorded_young_cset_choice_time_ms + brutisso@3923: _recorded_non_young_cset_choice_time_ms)); brutisso@3923: print_stats(2, "Ref Proc", _cur_ref_proc_time_ms); brutisso@3923: print_stats(2, "Ref Enq", _cur_ref_enq_time_ms); tschatzl@6405: if (G1DeferredRSUpdate) { tschatzl@6405: print_stats(2, "Redirty Cards", _recorded_redirty_logged_cards_time_ms); tschatzl@6405: } brutisso@3923: print_stats(2, "Free CSet", brutisso@3923: (_recorded_young_free_cset_time_ms + brutisso@3923: _recorded_non_young_free_cset_time_ms)); tschatzl@6404: if (G1Log::finest()) { tschatzl@6404: print_stats(3, "Young Free CSet", _recorded_young_free_cset_time_ms); tschatzl@6404: print_stats(3, "Non-Young Free CSet", _recorded_non_young_free_cset_time_ms); tschatzl@6404: } brutisso@4015: if (_cur_verify_after_time_ms > 0.0) { brutisso@4015: print_stats(2, "Verify After", _cur_verify_after_time_ms); brutisso@4015: } brutisso@3923: }