From d634ddefdd7712f4c3ac070d8493be5ba2de2aef Mon Sep 17 00:00:00 2001 From: Thomas Schatzl Date: Mon, 7 Nov 2022 12:30:57 +0000 Subject: [PATCH] 8295354: Remove G1 incremental non-copy time calculation Reviewed-by: ayang, iwalulya --- src/hotspot/share/gc/g1/g1Analytics.cpp | 9 +- src/hotspot/share/gc/g1/g1Analytics.hpp | 1 - src/hotspot/share/gc/g1/g1CollectionSet.cpp | 94 ++----------------- src/hotspot/share/gc/g1/g1CollectionSet.hpp | 54 ----------- .../share/gc/g1/g1ConcurrentRefine.cpp | 2 - src/hotspot/share/gc/g1/g1Policy.cpp | 30 +++--- src/hotspot/share/gc/g1/g1Policy.hpp | 17 +++- 7 files changed, 40 insertions(+), 167 deletions(-) diff --git a/src/hotspot/share/gc/g1/g1Analytics.cpp b/src/hotspot/share/gc/g1/g1Analytics.cpp index 49079e420bc..5e29ecf95f0 100644 --- a/src/hotspot/share/gc/g1/g1Analytics.cpp +++ b/src/hotspot/share/gc/g1/g1Analytics.cpp @@ -83,7 +83,6 @@ G1Analytics::G1Analytics(const G1Predictions* predictor) : _cost_per_byte_copied_ms_seq(TruncatedSeqLength), _pending_cards_seq(TruncatedSeqLength), _rs_length_seq(TruncatedSeqLength), - _rs_length_diff_seq(TruncatedSeqLength), _constant_other_time_ms_seq(TruncatedSeqLength), _young_other_cost_per_region_ms_seq(TruncatedSeqLength), _non_young_other_cost_per_region_ms_seq(TruncatedSeqLength), @@ -105,7 +104,6 @@ G1Analytics::G1Analytics(const G1Predictions* predictor) : _card_scan_to_merge_ratio_seq.set_initial(young_card_scan_to_merge_ratio_defaults[index]); _cost_per_card_scan_ms_seq.set_initial(young_only_cost_per_card_scan_ms_defaults[index]); _rs_length_seq.set_initial(0); - _rs_length_diff_seq.set_initial(0.0); _cost_per_byte_copied_ms_seq.set_initial(cost_per_byte_ms_defaults[index]); _constant_other_time_ms_seq.add(constant_other_time_ms_defaults[index]); @@ -192,10 +190,6 @@ void G1Analytics::report_card_scan_to_merge_ratio(double merge_to_scan_ratio, bo _card_scan_to_merge_ratio_seq.add(merge_to_scan_ratio, for_young_only_phase); } -void G1Analytics::report_rs_length_diff(double rs_length_diff, bool for_young_only_phase) { - _rs_length_diff_seq.add(rs_length_diff, for_young_only_phase); -} - void G1Analytics::report_cost_per_byte_ms(double cost_per_byte_ms, bool for_young_only_phase) { _cost_per_byte_copied_ms_seq.add(cost_per_byte_ms, for_young_only_phase); } @@ -277,8 +271,7 @@ double G1Analytics::predict_cleanup_time_ms() const { } size_t G1Analytics::predict_rs_length(bool for_young_only_phase) const { - return predict_size(&_rs_length_seq, for_young_only_phase) + - predict_size(&_rs_length_diff_seq, for_young_only_phase); + return predict_size(&_rs_length_seq, for_young_only_phase); } size_t G1Analytics::predict_pending_cards(bool for_young_only_phase) const { diff --git a/src/hotspot/share/gc/g1/g1Analytics.hpp b/src/hotspot/share/gc/g1/g1Analytics.hpp index 3ae4deb8558..fd9c25e6757 100644 --- a/src/hotspot/share/gc/g1/g1Analytics.hpp +++ b/src/hotspot/share/gc/g1/g1Analytics.hpp @@ -62,7 +62,6 @@ class G1Analytics: public CHeapObj { G1PhaseDependentSeq _pending_cards_seq; G1PhaseDependentSeq _rs_length_seq; - G1PhaseDependentSeq _rs_length_diff_seq; TruncatedSeq _constant_other_time_ms_seq; TruncatedSeq _young_other_cost_per_region_ms_seq; diff --git a/src/hotspot/share/gc/g1/g1CollectionSet.cpp b/src/hotspot/share/gc/g1/g1CollectionSet.cpp index 7a6721c52ed..9d1e0347776 100644 --- a/src/hotspot/share/gc/g1/g1CollectionSet.cpp +++ b/src/hotspot/share/gc/g1/g1CollectionSet.cpp @@ -23,6 +23,7 @@ */ #include "precompiled.hpp" +#include "gc/g1/g1Analytics.hpp" #include "gc/g1/g1CollectedHeap.inline.hpp" #include "gc/g1/g1CollectionSet.hpp" #include "gc/g1/g1CollectionSetCandidates.hpp" @@ -47,10 +48,6 @@ G1GCPhaseTimes* G1CollectionSet::phase_times() { return _policy->phase_times(); } -double G1CollectionSet::predict_region_non_copy_time_ms(HeapRegion* hr) const { - return _policy->predict_region_non_copy_time_ms(hr, collector_state()->in_young_only_phase()); -} - G1CollectionSet::G1CollectionSet(G1CollectedHeap* g1h, G1Policy* policy) : _g1h(g1h), _policy(policy), @@ -63,20 +60,13 @@ G1CollectionSet::G1CollectionSet(G1CollectedHeap* g1h, G1Policy* policy) : _collection_set_max_length(0), _num_optional_regions(0), _bytes_used_before(0), - _recorded_rs_length(0), _inc_build_state(Inactive), _inc_part_start(0), - _inc_collection_set_stats(NULL), - _inc_bytes_used_before(0), - _inc_recorded_rs_length(0), - _inc_recorded_rs_length_diff(0), - _inc_predicted_non_copy_time_ms(0.0), - _inc_predicted_non_copy_time_ms_diff(0.0) { + _inc_bytes_used_before(0) { } G1CollectionSet::~G1CollectionSet() { FREE_C_HEAP_ARRAY(uint, _collection_set_regions); - FREE_C_HEAP_ARRAY(IncCollectionSetRegionStat, _inc_collection_set_stats); free_optional_regions(); clear_candidates(); } @@ -99,7 +89,6 @@ void G1CollectionSet::initialize(uint max_region_length) { guarantee(_collection_set_regions == NULL, "Must only initialize once."); _collection_set_max_length = max_region_length; _collection_set_regions = NEW_C_HEAP_ARRAY(uint, max_region_length, mtGC); - _inc_collection_set_stats = NEW_C_HEAP_ARRAY(IncCollectionSetRegionStat, max_region_length, mtGC); } void G1CollectionSet::free_optional_regions() { @@ -115,10 +104,6 @@ bool G1CollectionSet::has_candidates() { return _candidates != NULL && !_candidates->is_empty(); } -void G1CollectionSet::set_recorded_rs_length(size_t rs_length) { - _recorded_rs_length = rs_length; -} - // Add the heap region at the head of the non-incremental collection set void G1CollectionSet::add_old_region(HeapRegion* hr) { assert_at_safepoint_on_vm_thread(); @@ -134,7 +119,6 @@ void G1CollectionSet::add_old_region(HeapRegion* hr) { _collection_set_regions[_collection_set_cur_length++] = hr->hrm_index(); _bytes_used_before += hr->used(); - _recorded_rs_length += hr->rem_set()->occupied(); _old_region_length++; _g1h->old_set_remove(hr); @@ -152,38 +136,15 @@ void G1CollectionSet::add_optional_region(HeapRegion* hr) { void G1CollectionSet::start_incremental_building() { assert(_collection_set_cur_length == 0, "Collection set must be empty before starting a new collection set."); assert(_inc_build_state == Inactive, "Precondition"); -#ifdef ASSERT - for (uint i = 0; i < _collection_set_max_length; i++) { - _inc_collection_set_stats[i].reset(); - } -#endif _inc_bytes_used_before = 0; - _inc_recorded_rs_length = 0; - _inc_recorded_rs_length_diff = 0; - _inc_predicted_non_copy_time_ms = 0.0; - _inc_predicted_non_copy_time_ms_diff = 0.0; - update_incremental_marker(); } void G1CollectionSet::finalize_incremental_building() { assert(_inc_build_state == Active, "Precondition"); assert(SafepointSynchronize::is_at_safepoint(), "should be at a safepoint"); - - // The two "main" fields, _inc_recorded_rs_length and - // _inc_predicted_non_copy_time_ms, are updated by the thread - // that adds a new region to the CSet. Further updates by the - // concurrent refinement thread that samples the young RSet lengths - // are accumulated in the *_diff fields. Here we add the diffs to - // the "main" fields. - - _inc_recorded_rs_length += _inc_recorded_rs_length_diff; - _inc_predicted_non_copy_time_ms += _inc_predicted_non_copy_time_ms_diff; - - _inc_recorded_rs_length_diff = 0; - _inc_predicted_non_copy_time_ms_diff = 0.0; } void G1CollectionSet::clear() { @@ -239,31 +200,6 @@ void G1CollectionSet::iterate_part_from(HeapRegionClosure* cl, worker_id); } -void G1CollectionSet::update_young_region_prediction(HeapRegion* hr, - size_t new_rs_length) { - // Update the CSet information that is dependent on the new RS length - assert(hr->is_young(), "Precondition"); - assert(!SafepointSynchronize::is_at_safepoint(), "should not be at a safepoint"); - - IncCollectionSetRegionStat* stat = &_inc_collection_set_stats[hr->hrm_index()]; - - size_t old_rs_length = stat->_rs_length; - assert(old_rs_length <= new_rs_length, - "Remembered set decreased (changed from " SIZE_FORMAT " to " SIZE_FORMAT " region %u type %s)", - old_rs_length, new_rs_length, hr->hrm_index(), hr->get_short_type_str()); - size_t rs_length_diff = new_rs_length - old_rs_length; - stat->_rs_length = new_rs_length; - _inc_recorded_rs_length_diff += rs_length_diff; - - double old_non_copy_time = stat->_non_copy_time_ms; - assert(old_non_copy_time >= 0.0, "Non copy time for region %u not initialized yet, is %.3f", hr->hrm_index(), old_non_copy_time); - double new_non_copy_time = predict_region_non_copy_time_ms(hr); - double non_copy_time_ms_diff = new_non_copy_time - old_non_copy_time; - - stat->_non_copy_time_ms = new_non_copy_time; - _inc_predicted_non_copy_time_ms_diff += non_copy_time_ms_diff; -} - void G1CollectionSet::add_young_region_common(HeapRegion* hr) { assert(hr->is_young(), "invariant"); assert(_inc_build_state == Active, "Precondition"); @@ -285,20 +221,6 @@ void G1CollectionSet::add_young_region_common(HeapRegion* hr) { // Ignore calls to this due to retirement during full gc. if (!_g1h->collector_state()->in_full_gc()) { - size_t rs_length = hr->rem_set()->occupied(); - double non_copy_time = predict_region_non_copy_time_ms(hr); - - // Cache the values we have added to the aggregated information - // in the heap region in case we have to remove this region from - // the incremental collection set, or it is updated by the - // rset sampling code - - IncCollectionSetRegionStat* stat = &_inc_collection_set_stats[hr->hrm_index()]; - stat->_rs_length = rs_length; - stat->_non_copy_time_ms = non_copy_time; - - _inc_recorded_rs_length += rs_length; - _inc_predicted_non_copy_time_ms += non_copy_time; _inc_bytes_used_before += hr->used(); } @@ -400,7 +322,8 @@ double G1CollectionSet::finalize_young_part(double target_pause_time_ms, G1Survi guarantee(target_pause_time_ms > 0.0, "target_pause_time_ms = %1.6lf should be positive", target_pause_time_ms); - size_t pending_cards = _policy->pending_cards_at_gc_start() + _g1h->hot_card_cache()->num_entries(); + size_t pending_cards = _policy->pending_cards_at_gc_start() + + _g1h->hot_card_cache()->num_entries(); log_trace(gc, ergo, cset)("Start choosing CSet. Pending cards: " SIZE_FORMAT " target pause time: %1.2fms", pending_cards, target_pause_time_ms); @@ -417,12 +340,11 @@ double G1CollectionSet::finalize_young_part(double target_pause_time_ms, G1Survi _bytes_used_before = _inc_bytes_used_before; - // The number of recorded young regions is the incremental - // collection set's current size - set_recorded_rs_length(_inc_recorded_rs_length); - double predicted_base_time_ms = _policy->predict_base_time_ms(pending_cards); - double predicted_eden_time = _inc_predicted_non_copy_time_ms + _policy->predict_eden_copy_time_ms(eden_region_length); + // Base time already includes the whole remembered set related time, so do not add that here + // again. + double predicted_eden_time = _policy->predict_young_region_other_time_ms(eden_region_length) + + _policy->predict_eden_copy_time_ms(eden_region_length); double remaining_time_ms = MAX2(target_pause_time_ms - (predicted_base_time_ms + predicted_eden_time), 0.0); log_trace(gc, ergo, cset)("Added young regions to CSet. Eden: %u regions, Survivors: %u regions, " diff --git a/src/hotspot/share/gc/g1/g1CollectionSet.hpp b/src/hotspot/share/gc/g1/g1CollectionSet.hpp index 74d5ed47c5f..68c271f6687 100644 --- a/src/hotspot/share/gc/g1/g1CollectionSet.hpp +++ b/src/hotspot/share/gc/g1/g1CollectionSet.hpp @@ -161,11 +161,6 @@ class G1CollectionSet { // pause, and updated as more regions are added to the collection set. size_t _bytes_used_before; - // The number of cards in the remembered set in the collection set. Set from - // the incrementally built collection set at the start of an evacuation - // pause, and updated as more regions are added to the collection set. - size_t _recorded_rs_length; - enum CSetBuildType { Active, // We are actively building the collection set Inactive // We are not actively building the collection set @@ -174,22 +169,6 @@ class G1CollectionSet { CSetBuildType _inc_build_state; size_t _inc_part_start; - // Information about eden regions in the incremental collection set. - struct IncCollectionSetRegionStat { - // The predicted non-copy time that was added to the total incremental value - // for the collection set. - double _non_copy_time_ms; - // The remembered set length that was added to the total incremental value - // for the collection set. - size_t _rs_length; - -#ifdef ASSERT - // Resets members to "uninitialized" values. - void reset() { _rs_length = ~(size_t)0; _non_copy_time_ms = -1.0; } -#endif - }; - - IncCollectionSetRegionStat* _inc_collection_set_stats; // The associated information that is maintained while the incremental // collection set is being built with *young* regions. Used to populate // the recorded info for the evacuation pause. @@ -199,38 +178,11 @@ class G1CollectionSet { // an evacuation pause. size_t _inc_bytes_used_before; - // The RSet lengths recorded for regions in the CSet. It is updated - // by the thread that adds a new region to the CSet. We assume that - // only one thread can be allocating a new CSet region (currently, - // it does so after taking the Heap_lock) hence no need to - // synchronize updates to this field. - size_t _inc_recorded_rs_length; - - // A concurrent refinement thread periodically samples the young - // region RSets and needs to update _inc_recorded_rs_length as - // the RSets grow. Instead of having to synchronize updates to that - // field we accumulate them in this field and add it to - // _inc_recorded_rs_length_diff at the start of a GC. - size_t _inc_recorded_rs_length_diff; - - // The predicted elapsed time it will take to collect the regions in - // the CSet. This is updated by the thread that adds a new region to - // the CSet. See the comment for _inc_recorded_rs_length about - // MT-safety assumptions. - double _inc_predicted_non_copy_time_ms; - - // See the comment for _inc_recorded_rs_length_diff. - double _inc_predicted_non_copy_time_ms_diff; - - void set_recorded_rs_length(size_t rs_length); - G1CollectorState* collector_state() const; G1GCPhaseTimes* phase_times(); void verify_young_cset_indices() const NOT_DEBUG_RETURN; - double predict_region_non_copy_time_ms(HeapRegion* hr) const; - // Update the incremental collection set information when adding a region. void add_young_region_common(HeapRegion* hr); @@ -322,8 +274,6 @@ public: void iterate_optional(HeapRegionClosure* cl) const; - size_t recorded_rs_length() { return _recorded_rs_length; } - size_t bytes_used_before() const { return _bytes_used_before; } @@ -341,10 +291,6 @@ public: // pause. void abandon_optional_collection_set(G1ParScanThreadStateSet* pss); - // Update information about hr in the aggregated information for - // the incrementally built collection set. - void update_young_region_prediction(HeapRegion* hr, size_t new_rs_length); - // Add eden region to the collection set. void add_eden_region(HeapRegion* hr); diff --git a/src/hotspot/share/gc/g1/g1ConcurrentRefine.cpp b/src/hotspot/share/gc/g1/g1ConcurrentRefine.cpp index affe78f6c08..3d6fd3163a9 100644 --- a/src/hotspot/share/gc/g1/g1ConcurrentRefine.cpp +++ b/src/hotspot/share/gc/g1/g1ConcurrentRefine.cpp @@ -288,8 +288,6 @@ public: bool do_heap_region(HeapRegion* r) override { size_t rs_length = r->rem_set()->occupied(); _sampled_rs_length += rs_length; - // Update the collection set policy information for this region. - _cset->update_young_region_prediction(r, rs_length); return false; } diff --git a/src/hotspot/share/gc/g1/g1Policy.cpp b/src/hotspot/share/gc/g1/g1Policy.cpp index 644da0b55a1..a6ff6301534 100644 --- a/src/hotspot/share/gc/g1/g1Policy.cpp +++ b/src/hotspot/share/gc/g1/g1Policy.cpp @@ -508,13 +508,14 @@ uint G1Policy::calculate_desired_eden_length_before_mixed(double base_time_ms, } double G1Policy::predict_survivor_regions_evac_time() const { - double survivor_regions_evac_time = 0.0; const GrowableArray* survivor_regions = _g1h->survivor()->regions(); + double survivor_regions_evac_time = predict_young_region_other_time_ms(_g1h->survivor()->length()); for (GrowableArrayIterator it = survivor_regions->begin(); it != survivor_regions->end(); ++it) { - survivor_regions_evac_time += predict_region_total_time_ms(*it, collector_state()->in_young_only_phase()); + survivor_regions_evac_time += predict_region_copy_time_ms(*it); } + return survivor_regions_evac_time; } @@ -853,10 +854,6 @@ void G1Policy::record_young_collection_end(bool concurrent_operation_is_full_mar } _analytics->report_card_scan_to_merge_ratio(scan_to_merge_ratio, is_young_only_pause); - const size_t recorded_rs_length = _collection_set->recorded_rs_length(); - const size_t rs_length_diff = _rs_length > recorded_rs_length ? _rs_length - recorded_rs_length : 0; - _analytics->report_rs_length_diff(rs_length_diff, is_young_only_pause); - // Update prediction for copy cost per byte size_t copied_bytes = p->sum_thread_work_items(G1GCPhaseTimes::MergePSS, G1GCPhaseTimes::MergePSSCopiedBytes); @@ -877,11 +874,8 @@ void G1Policy::record_young_collection_end(bool concurrent_operation_is_full_mar _analytics->report_constant_other_time_ms(constant_other_time_ms(pause_time_ms)); - // Do not update RS lengths and the number of pending cards with information from mixed gc: - // these are is wildly different to during young only gc and mess up young gen sizing right - // after the mixed gc phase. - _analytics->report_pending_cards((double) _pending_cards_at_gc_start, is_young_only_pause); - _analytics->report_rs_length((double) _rs_length, is_young_only_pause); + _analytics->report_pending_cards((double)pending_cards_at_gc_start(), is_young_only_pause); + _analytics->report_rs_length((double)_rs_length, is_young_only_pause); } assert(!(G1GCPauseTypeHelper::is_concurrent_start_pause(this_pause) && collector_state()->mark_or_rebuild_in_progress()), @@ -1058,6 +1052,10 @@ size_t G1Policy::predict_bytes_to_copy(HeapRegion* hr) const { return bytes_to_copy; } +double G1Policy::predict_young_region_other_time_ms(uint count) const { + return _analytics->predict_young_other_time_ms(count); +} + double G1Policy::predict_eden_copy_time_ms(uint count, size_t* bytes_to_copy) const { if (count == 0) { return 0.0; @@ -1074,15 +1072,19 @@ double G1Policy::predict_region_copy_time_ms(HeapRegion* hr) const { return _analytics->predict_object_copy_time_ms(bytes_to_copy, collector_state()->in_young_only_phase()); } -double G1Policy::predict_region_non_copy_time_ms(HeapRegion* hr, - bool for_young_only_phase) const { +double G1Policy::predict_region_merge_scan_time(HeapRegion* hr, bool for_young_only_phase) const { size_t rs_length = hr->rem_set()->occupied(); size_t scan_card_num = _analytics->predict_scan_card_num(rs_length, for_young_only_phase); - double region_elapsed_time_ms = + return _analytics->predict_card_merge_time_ms(rs_length, collector_state()->in_young_only_phase()) + _analytics->predict_card_scan_time_ms(scan_card_num, collector_state()->in_young_only_phase()); +} +double G1Policy::predict_region_non_copy_time_ms(HeapRegion* hr, + bool for_young_only_phase) const { + + double region_elapsed_time_ms = predict_region_merge_scan_time(hr, for_young_only_phase); // The prediction of the "other" time for this region is based // upon the region type and NOT the GC type. if (hr->is_young()) { diff --git a/src/hotspot/share/gc/g1/g1Policy.hpp b/src/hotspot/share/gc/g1/g1Policy.hpp index 8df569cd531..71d6313dc12 100644 --- a/src/hotspot/share/gc/g1/g1Policy.hpp +++ b/src/hotspot/share/gc/g1/g1Policy.hpp @@ -142,14 +142,27 @@ public: double predict_base_time_ms(size_t pending_cards) const; private: + // Base time contains handling remembered sets and constant other time of the + // whole young gen, refinement buffers, and copying survivors. + // Basically everything but copying eden regions. double predict_base_time_ms(size_t pending_cards, size_t rs_length) const; + // Copy time for a region is copying live data. double predict_region_copy_time_ms(HeapRegion* hr) const; + // Merge-scan time for a region is handling remembered sets of that region (as a single unit). + double predict_region_merge_scan_time(HeapRegion* hr, bool for_young_only_phase) const; + // Non-copy time for a region is handling remembered sets and other time. + double predict_region_non_copy_time_ms(HeapRegion* hr, bool for_young_only_phase) const; public: - double predict_eden_copy_time_ms(uint count, size_t* bytes_to_copy = NULL) const; - double predict_region_non_copy_time_ms(HeapRegion* hr, bool for_young_only_phase) const; + // Predict other time for count young regions. + double predict_young_region_other_time_ms(uint count) const; + // Predict copying live data time for count eden regions. Return the predict bytes if + // bytes_to_copy is non-nullptr. + double predict_eden_copy_time_ms(uint count, size_t* bytes_to_copy = nullptr) const; + // Total time for a region is handling remembered sets (as a single unit), copying its live data + // and other time. double predict_region_total_time_ms(HeapRegion* hr, bool for_young_only_phase) const; void cset_regions_freed() {