/*
 * Copyright Amazon.com Inc. or its affiliates. All Rights Reserved.
 * Copyright (c) 2025, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 *
 */

#include "gc/shenandoah/heuristics/shenandoahOldHeuristics.hpp"
#include "gc/shenandoah/heuristics/shenandoahYoungHeuristics.hpp"
#include "gc/shenandoah/shenandoahCollectorPolicy.hpp"
#include "gc/shenandoah/shenandoahGenerationalHeap.hpp"
#include "gc/shenandoah/shenandoahHeapRegion.inline.hpp"
#include "gc/shenandoah/shenandoahOldGeneration.hpp"
#include "gc/shenandoah/shenandoahYoungGeneration.hpp"
#include "utilities/quickSort.hpp"

// Constructs the young-generation heuristics; the generation is simply forwarded to the
// ShenandoahGenerationalHeuristics base class.
ShenandoahYoungHeuristics::ShenandoahYoungHeuristics(ShenandoahYoungGeneration* generation)
    : ShenandoahGenerationalHeuristics(generation) {
}

// Builds the collection set from the candidate regions in data[0 .. size-1]:
//   1. sorts the candidates with compare_by_garbage,
//   2. adds the preselected regions (which yields the garbage already accounted for),
//   3. lets choose_young_collection_set() pick additional regions,
//   4. logs the resulting composition.
// actual_free is passed through unchanged to choose_young_collection_set().
void ShenandoahYoungHeuristics::choose_collection_set_from_regiondata(ShenandoahCollectionSet* cset,
                                                                      RegionData* data, size_t size,
                                                                      size_t actual_free) {
  // See comments in ShenandoahAdaptiveHeuristics::choose_collection_set_from_regiondata():
  // we do the same here, but with the following adjustments for generational mode:
  //
  // In generational mode, the sort order within the data array is not strictly descending amounts
  // of garbage. In particular, regions that have reached tenure age will be sorted into this
  // array before younger regions that typically contain more garbage. This is one reason why,
  // for example, we continue examining regions even after rejecting a region that has
  // more live data than we can evacuate.

  // Better select garbage-first regions
  QuickSort::sort(data, (int) size, compare_by_garbage);

  size_t cur_young_garbage = add_preselected_regions_to_collection_set(cset, data, size);

  choose_young_collection_set(cset, data, size, actual_free, cur_young_garbage);

  log_cset_composition(cset);
}

// Walks the candidate regions in array order and adds to cset every region that
//   - is not already preselected,
//   - has an age below the current tenuring threshold,
//   - keeps the accumulated live bytes of the regions added here within max_cset, and
//   - either holds more garbage than the ShenandoahGarbageThreshold percentage of a region, or
//     holds more than the ShenandoahIgnoreGarbageThreshold percentage while the accumulated
//     garbage is still below min_garbage.
//
// cur_young_garbage is the garbage already accounted for by the caller (the preselected
// regions); it is a by-value parameter, so the running total maintained here is local.
void ShenandoahYoungHeuristics::choose_young_collection_set(ShenandoahCollectionSet* cset,
                                                            const RegionData* data,
                                                            size_t size, size_t actual_free,
                                                            size_t cur_young_garbage) const {

  auto heap = ShenandoahGenerationalHeap::heap();

  size_t capacity = heap->young_generation()->max_capacity();
  size_t garbage_threshold = ShenandoahHeapRegion::region_size_bytes() * ShenandoahGarbageThreshold / 100;
  size_t ignore_threshold = ShenandoahHeapRegion::region_size_bytes() * ShenandoahIgnoreGarbageThreshold / 100;
  const uint tenuring_threshold = heap->age_census()->tenuring_threshold();

  // This is young-gen collection or a mixed evacuation.
  // If this is mixed evacuation, the old-gen candidate regions have already been added.
  size_t max_cset = (size_t) (heap->young_generation()->get_evacuation_reserve() / ShenandoahEvacWaste);
  size_t cur_cset = 0;
  size_t free_target = (capacity * ShenandoahMinFreeThreshold) / 100 + max_cset;
  // Garbage that must be reclaimed to reach free_target; zero when actual_free already meets it.
  size_t min_garbage = (free_target > actual_free) ? (free_target - actual_free) : 0;

  log_info(gc, ergo)(
          "Adaptive CSet Selection for YOUNG. Max Evacuation: %zu%s, Actual Free: %zu%s.",
          byte_size_in_proper_unit(max_cset), proper_unit_for_byte_size(max_cset),
          byte_size_in_proper_unit(actual_free), proper_unit_for_byte_size(actual_free));

  for (size_t idx = 0; idx < size; idx++) {
    ShenandoahHeapRegion* r = data[idx].get_region();
    if (cset->is_preselected(r->index())) {
      continue;
    }
    if (r->age() < tenuring_threshold) {
      size_t new_cset = cur_cset + r->get_live_data_bytes();
      size_t region_garbage = r->garbage();
      size_t new_garbage = cur_young_garbage + region_garbage;
      bool add_regardless = (region_garbage > ignore_threshold) && (new_garbage < min_garbage);
      assert(r->is_young(), "Only young candidates expected in the data array");
      if ((new_cset <= max_cset) && (add_regardless || (region_garbage > garbage_threshold))) {
        cur_cset = new_cset;
        cur_young_garbage = new_garbage;
        cset->add_region(r);
      }
    }
    // Note that we do not add aged regions if they were not pre-selected.  The reason they were not preselected
    // is because there is not sufficient room in old-gen to hold their to-be-promoted live objects or because
    // they are to be promoted in place.
  }
}

// Decides whether a young collection should start now. The checks run in this order:
//   1. return false while old-gen marking (preparing or in progress) has run for less than
//      ShenandoahMinimumOldTimeMs;
//   2. return true if the inherited ShenandoahAdaptiveHeuristics trigger fires;
//   3. return true (after accept_trigger()) if the old generation's promotion potential exceeds
//      the ShenandoahExpeditePromotionsThreshold percentage of young max capacity;
//   4. return true (after accept_trigger()) if more than ShenandoahExpediteMixedThreshold old
//      collection candidates are unprocessed and concurrent weak root processing is not in progress;
//   5. otherwise return false.
bool ShenandoahYoungHeuristics::should_start_gc() {
  auto heap = ShenandoahGenerationalHeap::heap();
  ShenandoahOldGeneration* old_generation = heap->old_generation();
  ShenandoahOldHeuristics* old_heuristics = old_generation->heuristics();

  // Checks that an old cycle has run for at least ShenandoahMinimumOldTimeMs before allowing a young cycle.
  if (ShenandoahMinimumOldTimeMs > 0) {
    if (old_generation->is_preparing_for_mark() || old_generation->is_concurrent_mark_in_progress()) {
      // The elapsed time is scaled by 1000 before being compared against the millisecond threshold.
      size_t old_time_elapsed = size_t(old_heuristics->elapsed_cycle_time() * 1000);
      if (old_time_elapsed < ShenandoahMinimumOldTimeMs) {
        // Do not decline_trigger() when waiting for minimum quantum of Old-gen marking.  It is not at our discretion
        // to trigger at this time.
        log_debug(gc)("Young heuristics declines to trigger because old_time_elapsed < ShenandoahMinimumOldTimeMs");
        return false;
      }
    }
  }

  // inherited triggers have already decided to start a cycle, so no further evaluation is required
  if (ShenandoahAdaptiveHeuristics::should_start_gc()) {
    return true;
  }

  // Get through promotions and mixed evacuations as quickly as possible.  These cycles sometimes require significantly
  // more time than traditional young-generation cycles so start them up as soon as possible.  This is a "mitigation"
  // for the reality that old-gen and young-gen activities are not truly "concurrent".  If there is old-gen work to
  // be done, we start up the young-gen GC threads so they can do some of this old-gen work.  As implemented, promotion
  // gets priority over old-gen marking.
  size_t promo_expedite_threshold = percent_of(heap->young_generation()->max_capacity(), ShenandoahExpeditePromotionsThreshold);
  size_t promo_potential = old_generation->get_promotion_potential();
  if (promo_potential > promo_expedite_threshold) {
    // Detect unsigned arithmetic underflow
    assert(promo_potential < heap->capacity(), "Sanity");
    log_trigger("Expedite promotion of " PROPERFMT, PROPERFMTARGS(promo_potential));
    accept_trigger();
    return true;
  }

  size_t mixed_candidates = old_heuristics->unprocessed_old_collection_candidates();
  if (mixed_candidates > ShenandoahExpediteMixedThreshold && !heap->is_concurrent_weak_root_in_progress()) {
    // We need to run young GC in order to open up some free heap regions so we can finish mixed evacuations.
    // If concurrent weak root processing is in progress, it means the old cycle has chosen mixed collection
    // candidates, but has not completed.  There is no point in trying to start the young cycle before the old
    // cycle completes.
    log_trigger("Expedite mixed evacuation of %zu regions", mixed_candidates);
    accept_trigger();
    return true;
  }

  // Don't decline_trigger() here.  That was done in ShenandoahAdaptiveHeuristics::should_start_gc()
  return false;
}

// Return a conservative estimate of how much memory can be allocated before we need to start GC. The estimate is based
// on memory that is currently available within young generation plus all of the memory that will be added to the young
// generation at the end of the current cycle (as represented by young_regions_to_be_reclaimed) and on the anticipated
// amount of time required to perform a GC.
//
// The result is the smallest of three non-negative slacks: the slack before the average-rate trigger, the slack
// before the spike trigger (equal to the average slack when the sampled rate is not spiking), and the slack
// above min_free_threshold().
size_t ShenandoahYoungHeuristics::bytes_of_allocation_runway_before_gc_trigger(size_t young_regions_to_be_reclaimed) {
  size_t capacity = _space_info->max_capacity();
  size_t usage = _space_info->used();
  size_t available = (capacity > usage)? capacity - usage: 0;
  size_t allocated = _space_info->bytes_allocated_since_gc_start();

  size_t available_young_collected = ShenandoahHeap::heap()->collection_set()->get_young_available_bytes_collected();

  // Saturate at zero instead of letting the unsigned subtraction wrap around: a wrapped value would look like
  // an enormous runway, which is the opposite of the conservative estimate this function promises.
  size_t gross_available = available + young_regions_to_be_reclaimed * ShenandoahHeapRegion::region_size_bytes();
  size_t anticipated_available =
          (gross_available > available_young_collected)? gross_available - available_young_collected: 0;

  size_t spike_headroom = capacity * ShenandoahAllocSpikeFactor / 100;
  size_t penalties      = capacity * _gc_time_penalties / 100;

  double rate = _allocation_rate.sample(allocated);

  // At what value of available, would avg and spike triggers occur?
  //  if allocation_headroom < avg_cycle_time * avg_alloc_rate, then we experience avg trigger
  //  if allocation_headroom < avg_cycle_time * rate, then we experience spike trigger if is_spiking
  //
  // allocation_headroom =
  //     0, if penalties > available or if penalties + spike_headroom > available
  //     available - penalties - spike_headroom, otherwise
  //
  // so we trigger if available - penalties - spike_headroom < avg_cycle_time * avg_alloc_rate, which is to say
  //                  available < avg_cycle_time * avg_alloc_rate + penalties + spike_headroom
  //            or if available < penalties + spike_headroom
  //
  // since avg_cycle_time * avg_alloc_rate > 0, the first test is sufficient to test both conditions
  //
  // thus, evac_slack_avg is MAX2(0, available - (avg_cycle_time * avg_alloc_rate + penalties + spike_headroom))
  //
  // similarly, evac_slack_spiking is MAX2(0, available - (avg_cycle_time * rate + penalties + spike_headroom))
  // but evac_slack_spiking is only relevant if is_spiking, as defined below.

  double avg_cycle_time = _gc_cycle_time_history->davg() + (_margin_of_error_sd * _gc_cycle_time_history->dsd());
  double avg_alloc_rate = _allocation_rate.upper_bound(_margin_of_error_sd);

  // Level of anticipated_available at or below which the average-rate trigger fires.
  const double avg_trigger_level = avg_cycle_time * avg_alloc_rate + penalties + spike_headroom;
  size_t evac_slack_avg;
  if (anticipated_available > avg_trigger_level) {
    evac_slack_avg = size_t(anticipated_available - avg_trigger_level);
  } else {
    // we have no slack because it's already time to trigger
    evac_slack_avg = 0;
  }

  bool is_spiking = _allocation_rate.is_spiking(rate, _spike_threshold_sd);
  size_t evac_slack_spiking;
  if (is_spiking) {
    // Level of anticipated_available at or below which the spike trigger fires.
    const double spike_trigger_level = avg_cycle_time * rate + penalties + spike_headroom;
    if (anticipated_available > spike_trigger_level) {
      evac_slack_spiking = size_t(anticipated_available - spike_trigger_level);
    } else {
      // we have no slack because it's already time to trigger
      evac_slack_spiking = 0;
    }
  } else {
    // Not spiking: the spike trigger imposes no tighter bound than the average trigger.
    evac_slack_spiking = evac_slack_avg;
  }

  size_t threshold = min_free_threshold();
  size_t evac_min_threshold = (anticipated_available > threshold)? anticipated_available - threshold: 0;
  return MIN3(evac_slack_spiking, evac_slack_avg, evac_min_threshold);
}