Skip to content

Commit d038571

Browse files
author
Thomas Schatzl
committed Sep 19, 2023
8030815: Code roots are not accounted for in region prediction
Reviewed-by: iwalulya, ayang
1 parent 138542d commit d038571

File tree

6 files changed

+93
-27
lines changed

6 files changed

+93
-27
lines changed
 

‎src/hotspot/share/gc/g1/g1Analytics.cpp

+19
Original file line numberDiff line numberDiff line change
@@ -80,9 +80,11 @@ G1Analytics::G1Analytics(const G1Predictions* predictor) :
8080
_card_scan_to_merge_ratio_seq(TruncatedSeqLength),
8181
_cost_per_card_scan_ms_seq(TruncatedSeqLength),
8282
_cost_per_card_merge_ms_seq(TruncatedSeqLength),
83+
_cost_per_code_root_ms_seq(TruncatedSeqLength),
8384
_cost_per_byte_copied_ms_seq(TruncatedSeqLength),
8485
_pending_cards_seq(TruncatedSeqLength),
8586
_rs_length_seq(TruncatedSeqLength),
87+
_code_root_rs_length_seq(TruncatedSeqLength),
8688
_constant_other_time_ms_seq(TruncatedSeqLength),
8789
_young_other_cost_per_region_ms_seq(TruncatedSeqLength),
8890
_non_young_other_cost_per_region_ms_seq(TruncatedSeqLength),
@@ -104,6 +106,7 @@ G1Analytics::G1Analytics(const G1Predictions* predictor) :
104106
_card_scan_to_merge_ratio_seq.set_initial(young_card_scan_to_merge_ratio_defaults[index]);
105107
_cost_per_card_scan_ms_seq.set_initial(young_only_cost_per_card_scan_ms_defaults[index]);
106108
_rs_length_seq.set_initial(0);
109+
_code_root_rs_length_seq.set_initial(0);
107110
_cost_per_byte_copied_ms_seq.set_initial(cost_per_byte_ms_defaults[index]);
108111

109112
_constant_other_time_ms_seq.add(constant_other_time_ms_defaults[index]);
@@ -186,6 +189,10 @@ void G1Analytics::report_cost_per_card_merge_ms(double cost_per_card_ms, bool fo
186189
_cost_per_card_merge_ms_seq.add(cost_per_card_ms, for_young_only_phase);
187190
}
188191

192+
// Records one sample of the cost (in ms) of scanning a single code root.
// The sample is appended to _cost_per_code_root_ms_seq; for_young_only_phase
// is passed through to the sequence's add().
void G1Analytics::report_cost_per_code_root_scan_ms(double cost_per_code_root_ms, bool for_young_only_phase) {
193+
_cost_per_code_root_ms_seq.add(cost_per_code_root_ms, for_young_only_phase);
194+
}
195+
189196
// Records one sample of the card scan-to-merge ratio by appending it to
// _card_scan_to_merge_ratio_seq; for_young_only_phase is passed through to
// the sequence's add().
// NOTE(review): the parameter is named merge_to_scan_ratio here, while the
// function and the sequence are named scan_to_merge and the header declares
// the parameter as cards_per_entry_ratio -- confirm which ratio callers pass.
void G1Analytics::report_card_scan_to_merge_ratio(double merge_to_scan_ratio, bool for_young_only_phase) {
190197
_card_scan_to_merge_ratio_seq.add(merge_to_scan_ratio, for_young_only_phase);
191198
}
@@ -214,6 +221,10 @@ void G1Analytics::report_rs_length(double rs_length, bool for_young_only_phase)
214221
_rs_length_seq.add(rs_length, for_young_only_phase);
215222
}
216223

224+
// Records one sample of the code root remembered set length by appending it
// to _code_root_rs_length_seq; for_young_only_phase is passed through to the
// sequence's add().
void G1Analytics::report_code_root_rs_length(double code_root_rs_length, bool for_young_only_phase) {
225+
_code_root_rs_length_seq.add(code_root_rs_length, for_young_only_phase);
226+
}
227+
217228
double G1Analytics::predict_alloc_rate_ms() const {
218229
if (enough_samples_available(&_alloc_rate_ms_seq)) {
219230
return predict_zero_bounded(&_alloc_rate_ms_seq);
@@ -242,6 +253,10 @@ double G1Analytics::predict_card_merge_time_ms(size_t card_num, bool for_young_o
242253
return card_num * predict_zero_bounded(&_cost_per_card_merge_ms_seq, for_young_only_phase);
243254
}
244255

256+
// Predicts the time (in ms) to scan code_root_num code roots: the count is
// multiplied by the per-code-root cost predicted from
// _cost_per_code_root_ms_seq for the given phase.
// NOTE(review): predict_zero_bounded() is not visible here; presumably it
// yields a non-negative prediction -- confirm.
double G1Analytics::predict_code_root_scan_time_ms(size_t code_root_num, bool for_young_only_phase) const {
257+
return code_root_num * predict_zero_bounded(&_cost_per_code_root_ms_seq, for_young_only_phase);
258+
}
259+
245260
// Predicts the time (in ms) to scan card_num cards: the count is multiplied
// by the per-card scan cost predicted from _cost_per_card_scan_ms_seq for the
// given phase.
// NOTE(review): predict_zero_bounded() is not visible here; presumably it
// yields a non-negative prediction -- confirm.
double G1Analytics::predict_card_scan_time_ms(size_t card_num, bool for_young_only_phase) const {
246261
return card_num * predict_zero_bounded(&_cost_per_card_scan_ms_seq, for_young_only_phase);
247262
}
@@ -274,6 +289,10 @@ size_t G1Analytics::predict_rs_length(bool for_young_only_phase) const {
274289
return predict_size(&_rs_length_seq, for_young_only_phase);
275290
}
276291

292+
// Returns the predicted code root remembered set length for the given phase,
// computed by predict_size() over the samples in _code_root_rs_length_seq.
size_t G1Analytics::predict_code_root_rs_length(bool for_young_only_phase) const {
293+
return predict_size(&_code_root_rs_length_seq, for_young_only_phase);
294+
}
295+
277296
// Returns the predicted number of pending cards for the given phase,
// computed by predict_size() over the samples in _pending_cards_seq.
size_t G1Analytics::predict_pending_cards(bool for_young_only_phase) const {
278297
return predict_size(&_pending_cards_seq, for_young_only_phase);
279298
}

‎src/hotspot/share/gc/g1/g1Analytics.hpp

+8
Original file line numberDiff line numberDiff line change
@@ -57,11 +57,14 @@ class G1Analytics: public CHeapObj<mtGC> {
5757
G1PhaseDependentSeq _cost_per_card_scan_ms_seq;
5858
// The cost to merge a card during young-only and mixed gcs in ms.
5959
G1PhaseDependentSeq _cost_per_card_merge_ms_seq;
60+
// The cost to scan entries in the code root remembered set in ms.
61+
G1PhaseDependentSeq _cost_per_code_root_ms_seq;
6062
// The cost to copy a byte in ms.
6163
G1PhaseDependentSeq _cost_per_byte_copied_ms_seq;
6264

6365
G1PhaseDependentSeq _pending_cards_seq;
6466
G1PhaseDependentSeq _rs_length_seq;
67+
G1PhaseDependentSeq _code_root_rs_length_seq;
6568

6669
TruncatedSeq _constant_other_time_ms_seq;
6770
TruncatedSeq _young_other_cost_per_region_ms_seq;
@@ -127,6 +130,7 @@ class G1Analytics: public CHeapObj<mtGC> {
127130
void report_dirtied_cards_in_thread_buffers(size_t num_cards);
128131
void report_cost_per_card_scan_ms(double cost_per_remset_card_ms, bool for_young_only_phase);
129132
void report_cost_per_card_merge_ms(double cost_per_card_ms, bool for_young_only_phase);
133+
void report_cost_per_code_root_scan_ms(double cost_per_code_root_ms, bool for_young_only_phase);
130134
void report_card_scan_to_merge_ratio(double cards_per_entry_ratio, bool for_young_only_phase);
131135
void report_rs_length_diff(double rs_length_diff, bool for_young_only_phase);
132136
void report_cost_per_byte_ms(double cost_per_byte_ms, bool for_young_only_phase);
@@ -135,6 +139,7 @@ class G1Analytics: public CHeapObj<mtGC> {
135139
void report_constant_other_time_ms(double constant_other_time_ms);
136140
void report_pending_cards(double pending_cards, bool for_young_only_phase);
137141
void report_rs_length(double rs_length, bool for_young_only_phase);
142+
void report_code_root_rs_length(double code_root_rs_length, bool for_young_only_phase);
138143

139144
double predict_alloc_rate_ms() const;
140145
int num_alloc_rate_ms() const;
@@ -150,6 +155,8 @@ class G1Analytics: public CHeapObj<mtGC> {
150155
double predict_card_merge_time_ms(size_t card_num, bool for_young_only_phase) const;
151156
double predict_card_scan_time_ms(size_t card_num, bool for_young_only_phase) const;
152157

158+
double predict_code_root_scan_time_ms(size_t code_root_num, bool for_young_only_phase) const;
159+
153160
double predict_object_copy_time_ms(size_t bytes_to_copy, bool for_young_only_phase) const;
154161

155162
double predict_constant_other_time_ms() const;
@@ -163,6 +170,7 @@ class G1Analytics: public CHeapObj<mtGC> {
163170
double predict_cleanup_time_ms() const;
164171

165172
size_t predict_rs_length(bool for_young_only_phase) const;
173+
size_t predict_code_root_rs_length(bool for_young_only_phase) const;
166174
size_t predict_pending_cards(bool for_young_only_phase) const;
167175

168176
// Add a new GC of the given duration and end time to the record.

‎src/hotspot/share/gc/g1/g1ConcurrentRefine.cpp

+7-4
Original file line numberDiff line numberDiff line change
@@ -280,18 +280,21 @@ uint64_t G1ConcurrentRefine::adjust_threads_wait_ms() const {
280280
// Heap region closure that accumulates two totals over every region it is
// applied to: the occupancy of the region's remembered set and the length of
// that remembered set's code roots list. Both totals start at zero and are
// read back through the sampled_*() accessors.
// (As rendered in this diff, the line after an "NNN-" marker is the removed
// version and the line after an "NNN+" marker is its replacement.)
// NOTE(review): _cset is initialized by the constructor but not read by any
// member shown in this class.
class G1ConcurrentRefine::RemSetSamplingClosure : public HeapRegionClosure {
281281
G1CollectionSet* _cset;
282282
size_t _sampled_rs_length;
283+
size_t _sampled_code_root_rs_length;
283284

284285
public:
285286
explicit RemSetSamplingClosure(G1CollectionSet* cset) :
286-
_cset(cset), _sampled_rs_length(0) {}
287+
_cset(cset), _sampled_rs_length(0), _sampled_code_root_rs_length(0) {}
287288

288289
// Adds r's remembered set occupancy and code roots list length to the
// running totals. Always returns false.
// NOTE(review): presumably false tells the iterator to continue with the
// next region -- confirm against HeapRegionClosure.
bool do_heap_region(HeapRegion* r) override {
289-
size_t rs_length = r->rem_set()->occupied();
290-
_sampled_rs_length += rs_length;
290+
HeapRegionRemSet* rem_set = r->rem_set();
291+
_sampled_rs_length += rem_set->occupied();
292+
_sampled_code_root_rs_length += rem_set->code_roots_list_length();
291293
return false;
292294
}
293295

294296
// Sum of rem_set()->occupied() over all regions visited so far.
size_t sampled_rs_length() const { return _sampled_rs_length; }
297+
// Sum of rem_set()->code_roots_list_length() over all regions visited so far.
size_t sampled_code_root_rs_length() const { return _sampled_code_root_rs_length; }
295298
};
296299

297300
// Adjust the target length (in regions) of the young gen, based on the
@@ -311,7 +314,7 @@ void G1ConcurrentRefine::adjust_young_list_target_length() {
311314
G1CollectionSet* cset = G1CollectedHeap::heap()->collection_set();
312315
RemSetSamplingClosure cl{cset};
313316
cset->iterate(&cl);
314-
_policy->revise_young_list_target_length(cl.sampled_rs_length());
317+
_policy->revise_young_list_target_length(cl.sampled_rs_length(), cl.sampled_code_root_rs_length());
315318
}
316319
}
317320

‎src/hotspot/share/gc/g1/g1Policy.cpp

+41-13
Original file line numberDiff line numberDiff line change
@@ -189,13 +189,14 @@ void G1Policy::update_young_length_bounds() {
189189
assert(!Universe::is_fully_initialized() || SafepointSynchronize::is_at_safepoint(), "must be");
190190
bool for_young_only_phase = collector_state()->in_young_only_phase();
191191
update_young_length_bounds(_analytics->predict_pending_cards(for_young_only_phase),
192-
_analytics->predict_rs_length(for_young_only_phase));
192+
_analytics->predict_rs_length(for_young_only_phase),
193+
_analytics->predict_code_root_rs_length(for_young_only_phase));
193194
}
194195

195-
void G1Policy::update_young_length_bounds(size_t pending_cards, size_t rs_length) {
196+
void G1Policy::update_young_length_bounds(size_t pending_cards, size_t rs_length, size_t code_root_rs_length) {
196197
uint old_young_list_target_length = young_list_target_length();
197198

198-
uint new_young_list_desired_length = calculate_young_desired_length(pending_cards, rs_length);
199+
uint new_young_list_desired_length = calculate_young_desired_length(pending_cards, rs_length, code_root_rs_length);
199200
uint new_young_list_target_length = calculate_young_target_length(new_young_list_desired_length);
200201
uint new_young_list_max_length = calculate_young_max_length(new_young_list_target_length);
201202

@@ -234,7 +235,9 @@ void G1Policy::update_young_length_bounds(size_t pending_cards, size_t rs_length
234235
// value smaller than what is already allocated or what can actually be allocated.
235236
// This return value is only an expectation.
236237
//
237-
uint G1Policy::calculate_young_desired_length(size_t pending_cards, size_t rs_length) const {
238+
uint G1Policy::calculate_young_desired_length(size_t pending_cards,
239+
size_t rs_length,
240+
size_t code_root_rs_length) const {
238241
uint min_young_length_by_sizer = _young_gen_sizer.min_desired_young_length();
239242
uint max_young_length_by_sizer = _young_gen_sizer.max_desired_young_length();
240243

@@ -267,7 +270,7 @@ uint G1Policy::calculate_young_desired_length(size_t pending_cards, size_t rs_le
267270
if (use_adaptive_young_list_length()) {
268271
desired_eden_length_by_mmu = calculate_desired_eden_length_by_mmu();
269272

270-
double base_time_ms = predict_base_time_ms(pending_cards, rs_length);
273+
double base_time_ms = predict_base_time_ms(pending_cards, rs_length, code_root_rs_length);
271274
double retained_time_ms = predict_retained_regions_evac_time();
272275
double total_time_ms = base_time_ms + retained_time_ms;
273276

@@ -550,13 +553,13 @@ G1GCPhaseTimes* G1Policy::phase_times() const {
550553
return _phase_times;
551554
}
552555

553-
// Recomputes the young length bounds from caller-supplied remembered set
// figures. The pending card count is estimated here as the dirty card queue
// set's current card count plus the predicted number of dirtied cards still
// in thread buffers; the result is handed to update_young_length_bounds()
// together with rs_length and code_root_rs_length.
// Must only be called when adaptive young list length is in use (enforced by
// the guarantee below).
// (As rendered in this diff, the line after an "NNN-" marker is the removed
// version and the line after an "NNN+" marker is its replacement.)
void G1Policy::revise_young_list_target_length(size_t rs_length) {
556+
void G1Policy::revise_young_list_target_length(size_t rs_length, size_t code_root_rs_length) {
554557
guarantee(use_adaptive_young_list_length(), "should not call this otherwise" );
555558

556559
size_t thread_buffer_cards = _analytics->predict_dirtied_cards_in_thread_buffers();
557560
G1DirtyCardQueueSet& dcqs = G1BarrierSet::dirty_card_queue_set();
558561
size_t pending_cards = dcqs.num_cards() + thread_buffer_cards;
559-
update_young_length_bounds(pending_cards, rs_length);
562+
update_young_length_bounds(pending_cards, rs_length, code_root_rs_length);
560563
}
561564

562565
void G1Policy::record_full_collection_start() {
@@ -890,6 +893,17 @@ void G1Policy::record_young_collection_end(bool concurrent_operation_is_full_mar
890893
}
891894
_analytics->report_card_scan_to_merge_ratio(scan_to_merge_ratio, is_young_only_pause);
892895

896+
// Update prediction for code root scan
897+
size_t const total_code_roots_scanned = p->sum_thread_work_items(G1GCPhaseTimes::CodeRoots, G1GCPhaseTimes::CodeRootsScannedNMethods) +
898+
p->sum_thread_work_items(G1GCPhaseTimes::OptCodeRoots, G1GCPhaseTimes::CodeRootsScannedNMethods);
899+
900+
if (total_code_roots_scanned >= G1NumCodeRootsCostSampleThreshold) {
901+
double avg_time_code_root_scan = average_time_ms(G1GCPhaseTimes::CodeRoots) +
902+
average_time_ms(G1GCPhaseTimes::OptCodeRoots);
903+
904+
_analytics->report_cost_per_code_root_scan_ms(avg_time_code_root_scan / total_code_roots_scanned, is_young_only_pause);
905+
}
906+
893907
// Update prediction for copy cost per byte
894908
size_t copied_bytes = p->sum_thread_work_items(G1GCPhaseTimes::MergePSS, G1GCPhaseTimes::MergePSSCopiedBytes);
895909

@@ -912,6 +926,7 @@ void G1Policy::record_young_collection_end(bool concurrent_operation_is_full_mar
912926

913927
_analytics->report_pending_cards((double)pending_cards_at_gc_start(), is_young_only_pause);
914928
_analytics->report_rs_length((double)_rs_length, is_young_only_pause);
929+
_analytics->report_code_root_rs_length((double)total_code_roots_scanned, is_young_only_pause);
915930
}
916931

917932
assert(!(G1GCPauseTypeHelper::is_concurrent_start_pause(this_pause) && collector_state()->mark_or_rebuild_in_progress()),
@@ -1033,7 +1048,8 @@ void G1Policy::record_young_gc_pause_end(bool evacuation_failed) {
10331048
}
10341049

10351050
double G1Policy::predict_base_time_ms(size_t pending_cards,
1036-
size_t rs_length) const {
1051+
size_t rs_length,
1052+
size_t code_root_rs_length) const {
10371053
bool in_young_only_phase = collector_state()->in_young_only_phase();
10381054

10391055
size_t unique_cards_from_rs = _analytics->predict_scan_card_num(rs_length, in_young_only_phase);
@@ -1043,22 +1059,26 @@ double G1Policy::predict_base_time_ms(size_t pending_cards,
10431059

10441060
double card_merge_time = _analytics->predict_card_merge_time_ms(pending_cards + rs_length, in_young_only_phase);
10451061
double card_scan_time = _analytics->predict_card_scan_time_ms(effective_scanned_cards, in_young_only_phase);
1062+
double code_root_scan_time = _analytics->predict_code_root_scan_time_ms(code_root_rs_length, in_young_only_phase);
10461063
double constant_other_time = _analytics->predict_constant_other_time_ms();
10471064
double survivor_evac_time = predict_survivor_regions_evac_time();
10481065

1049-
double total_time = card_merge_time + card_scan_time + constant_other_time + survivor_evac_time;
1066+
double total_time = card_merge_time + card_scan_time + code_root_scan_time + constant_other_time + survivor_evac_time;
10501067

10511068
log_trace(gc, ergo, heap)("Predicted base time: total %f lb_cards %zu rs_length %zu effective_scanned_cards %zu "
1052-
"card_merge_time %f card_scan_time %f constant_other_time %f survivor_evac_time %f",
1069+
"card_merge_time %f card_scan_time %f code_root_rs_length %zu code_root_scan_time %f "
1070+
"constant_other_time %f survivor_evac_time %f",
10531071
total_time, pending_cards, rs_length, effective_scanned_cards,
1054-
card_merge_time, card_scan_time, constant_other_time, survivor_evac_time);
1072+
card_merge_time, card_scan_time, code_root_rs_length, code_root_scan_time,
1073+
constant_other_time, survivor_evac_time);
10551074
return total_time;
10561075
}
10571076

10581077
// Convenience overload taking only the pending card count. The remembered set
// length and the code root remembered set length are both predicted by
// _analytics for the current phase (as reported by collector_state()), then
// forwarded to the overload that takes all values explicitly.
// (As rendered in this diff, the line after an "NNN-" marker is the removed
// version and the lines after "NNN+" markers are its replacement.)
double G1Policy::predict_base_time_ms(size_t pending_cards) const {
10591078
bool for_young_only_phase = collector_state()->in_young_only_phase();
10601079
size_t rs_length = _analytics->predict_rs_length(for_young_only_phase);
1061-
return predict_base_time_ms(pending_cards, rs_length);
1080+
size_t code_root_rs_length = _analytics->predict_code_root_rs_length(for_young_only_phase);
1081+
return predict_base_time_ms(pending_cards, rs_length, code_root_rs_length);
10621082
}
10631083

10641084
size_t G1Policy::predict_bytes_to_copy(HeapRegion* hr) const {
@@ -1100,10 +1120,18 @@ double G1Policy::predict_region_merge_scan_time(HeapRegion* hr, bool for_young_o
11001120
_analytics->predict_card_scan_time_ms(scan_card_num, for_young_only_phase);
11011121
}
11021122

1123+
// Predicts the code root scan time for region hr: reads the current length of
// the code roots list in hr's remembered set and asks _analytics for the
// predicted scan time of that many code roots in the given phase.
double G1Policy::predict_region_code_root_scan_time(HeapRegion* hr, bool for_young_only_phase) const {
1124+
size_t code_root_length = hr->rem_set()->code_roots_list_length();
1125+
1126+
return
1127+
_analytics->predict_code_root_scan_time_ms(code_root_length, for_young_only_phase);
1128+
}
1129+
11031130
double G1Policy::predict_region_non_copy_time_ms(HeapRegion* hr,
11041131
bool for_young_only_phase) const {
11051132

1106-
double region_elapsed_time_ms = predict_region_merge_scan_time(hr, for_young_only_phase);
1133+
double region_elapsed_time_ms = predict_region_merge_scan_time(hr, for_young_only_phase) +
1134+
predict_region_code_root_scan_time(hr, for_young_only_phase);
11071135
// The prediction of the "other" time for this region is based
11081136
// upon the region type and NOT the GC type.
11091137
if (hr->is_young()) {

‎src/hotspot/share/gc/g1/g1Policy.hpp

+10-7
Original file line numberDiff line numberDiff line change
@@ -142,12 +142,15 @@ class G1Policy: public CHeapObj<mtGC> {
142142
// Base time contains handling remembered sets and constant other time of the
143143
// whole young gen, refinement buffers, and copying survivors.
144144
// Basically everything but copying eden regions.
145-
double predict_base_time_ms(size_t pending_cards, size_t rs_length) const;
145+
double predict_base_time_ms(size_t pending_cards, size_t rs_length, size_t code_root_length) const;
146146

147147
// Copy time for a region is copying live data.
148148
double predict_region_copy_time_ms(HeapRegion* hr, bool for_young_only_phase) const;
149-
// Merge-scan time for a region is handling remembered sets of that region (as a single unit).
149+
// Merge-scan time for a region is handling card-based remembered sets of that region
150+
// (as a single unit).
150151
double predict_region_merge_scan_time(HeapRegion* hr, bool for_young_only_phase) const;
152+
// Code root scan time prediction for the given region.
153+
double predict_region_code_root_scan_time(HeapRegion* hr, bool for_young_only_phase) const;
151154
// Non-copy time for a region is handling remembered sets and other time.
152155
double predict_region_non_copy_time_ms(HeapRegion* hr, bool for_young_only_phase) const;
153156

@@ -207,10 +210,10 @@ class G1Policy: public CHeapObj<mtGC> {
207210
double _mark_cleanup_start_sec;
208211

209212
// Updates the internal young gen maximum and target and desired lengths.
210-
// If no parameters are passed, predict pending cards and the RS length using
211-
// the prediction model.
213+
// If no parameters are passed, predict pending cards, card set remset length and
214+
// code root remset length using the prediction model.
212215
void update_young_length_bounds();
213-
void update_young_length_bounds(size_t pending_cards, size_t rs_length);
216+
void update_young_length_bounds(size_t pending_cards, size_t rs_length, size_t code_root_rs_length);
214217

215218
// Calculate and return the minimum desired eden length based on the MMU target.
216219
uint calculate_desired_eden_length_by_mmu() const;
@@ -238,7 +241,7 @@ class G1Policy: public CHeapObj<mtGC> {
238241

239242
// Calculate desired young length based on current situation without taking actually
240243
// available free regions into account.
241-
uint calculate_young_desired_length(size_t pending_cards, size_t rs_length) const;
244+
uint calculate_young_desired_length(size_t pending_cards, size_t rs_length, size_t code_root_rs_length) const;
242245
// Limit the given desired young length to available free regions.
243246
uint calculate_young_target_length(uint desired_young_length) const;
244247
// The GCLocker might cause us to need more regions than the target. Calculate
@@ -301,7 +304,7 @@ class G1Policy: public CHeapObj<mtGC> {
301304
// Check the current value of the young list RSet length and
302305
// compare it against the last prediction. If the current value is
303306
// higher, recalculate the young list target length prediction.
304-
void revise_young_list_target_length(size_t rs_length);
307+
void revise_young_list_target_length(size_t rs_length, size_t code_root_rs_length);
305308

306309
// This should be called after the heap is resized.
307310
void record_new_heap_size(uint new_number_of_regions);

‎src/hotspot/share/gc/g1/g1_globals.hpp

+8-3
Original file line numberDiff line numberDiff line change
@@ -325,9 +325,14 @@
325325
range(1, 256) \
326326
\
327327
product(uint, G1NumCardsCostSampleThreshold, 1000, DIAGNOSTIC, \
328-
"Threshold for the number of cards when reporting card cost " \
329-
"related prediction sample. That sample must involve the same or "\
330-
"more than that number of cards to be used.") \
328+
"Threshold for the number of cards when reporting remembered set "\
329+
"card cost related prediction samples. A sample must involve " \
330+
"the same or more than that number of cards to be used.") \
331+
\
332+
product(uint, G1NumCodeRootsCostSampleThreshold, 100, DIAGNOSTIC, \
333+
"Threshold for the number of code roots when reporting code root "\
334+
"scan cost related prediction samples. A sample must involve " \
335+
"the same or more than this number of code roots to be used.") \
331336
\
332337
GC_G1_EVACUATION_FAILURE_FLAGS(develop, \
333338
develop_pd, \

1 commit comments

Comments
 (1)

openjdk-notifier[bot] commented on Sep 19, 2023

@openjdk-notifier[bot]
Please sign in to comment.