jdk/src/hotspot/share/gc/parallel/mutableNUMASpace.cpp

/*
* Copyright (c) 2006, 2026, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*
*/
#include "gc/parallel/mutableNUMASpace.hpp"
#include "gc/shared/collectedHeap.hpp"
#include "gc/shared/gc_globals.hpp"
#include "gc/shared/pretouchTask.hpp"
#include "gc/shared/spaceDecorator.hpp"
#include "gc/shared/workerThread.hpp"
#include "memory/allocation.inline.hpp"
#include "oops/oop.inline.hpp"
#include "oops/typeArrayOop.hpp"
#include "runtime/atomic.hpp"
#include "runtime/java.hpp"
#include "runtime/javaThread.hpp"
#include "runtime/os.inline.hpp"
#include "runtime/threadSMR.hpp"
#include "utilities/align.hpp"
#include "utilities/globalDefinitions.hpp"
MutableNUMASpace::MutableNUMASpace(size_t page_size) : MutableSpace(page_size) {
_lgrp_spaces = new (mtGC) GrowableArray<LGRPSpace*>(0, mtGC);
_adaptation_cycles = 0;
_samples_count = 0;
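// Create one chunk space per leaf locality group (NUMA node) reported by the OS.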
size_t lgrp_limit = os::numa_get_groups_num();
uint *lgrp_ids = NEW_C_HEAP_ARRAY(uint, lgrp_limit, mtGC);
size_t lgrp_num = os::numa_get_leaf_groups(lgrp_ids, lgrp_limit);
assert(lgrp_num > 0, "There should be at least one locality group");
lgrp_spaces()->reserve(checked_cast<int>(lgrp_num));
// Add new spaces for the new nodes
for (size_t i = 0; i < lgrp_num; i++) {
lgrp_spaces()->append(new LGRPSpace(lgrp_ids[i], page_size));
}
FREE_C_HEAP_ARRAY(uint, lgrp_ids);
}
MutableNUMASpace::~MutableNUMASpace() {
for (int i = 0; i < lgrp_spaces()->length(); i++) {
delete lgrp_spaces()->at(i);
}
delete lgrp_spaces();
}
#ifndef PRODUCT
void MutableNUMASpace::mangle_unused_area() {
// This method should do nothing.
// It can be called on a numa space during a full compaction.
}
void MutableNUMASpace::mangle_region(MemRegion mr) {
// This method should do nothing because numa spaces are not mangled.
}
#endif // NOT_PRODUCT
// There may be unallocated holes in the middle chunks
// that should be filled with dead objects to ensure parsability.
void MutableNUMASpace::ensure_parsability() {
for (int i = 0; i < lgrp_spaces()->length(); i++) {
LGRPSpace *ls = lgrp_spaces()->at(i);
MutableSpace *s = ls->space();
if (s->top() < top()) { // For all spaces preceding the one containing top()
size_t free_words = s->free_in_words();
if (free_words > 0) {
CollectedHeap::fill_with_objects(s->top(), free_words);
}
} else {
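// This chunk either contains top() or lies above it; nothing above top()
// needs a filler object, so we are done.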
return;
}
}
}
size_t MutableNUMASpace::used_in_words() const {
size_t s = 0;
for (LGRPSpace* ls : *lgrp_spaces()) {
s += ls->space()->used_in_words();
}
return s;
}
size_t MutableNUMASpace::free_in_words() const {
size_t s = 0;
for (LGRPSpace* ls : *lgrp_spaces()) {
s += ls->space()->free_in_words();
}
return s;
}
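// The TLAB queries below report per-lgrp averages: a thread allocates only from
// the chunk of its own locality group, so whole-space totals would overstate
// what a single thread can actually use.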
size_t MutableNUMASpace::tlab_capacity() const {
size_t s = 0;
for (LGRPSpace* ls : *lgrp_spaces()) {
s += ls->space()->capacity_in_bytes();
}
return s / (size_t)lgrp_spaces()->length();
}
size_t MutableNUMASpace::tlab_used() const {
size_t s = 0;
for (LGRPSpace* ls : *lgrp_spaces()) {
s += ls->space()->used_in_bytes();
}
return s / (size_t)lgrp_spaces()->length();
}
size_t MutableNUMASpace::unsafe_max_tlab_alloc() const {
size_t s = 0;
for (LGRPSpace* ls : *lgrp_spaces()) {
s += ls->space()->free_in_bytes();
}
size_t average_free_in_bytes = s / (size_t)lgrp_spaces()->length();
// free_in_bytes() is aligned to MinObjAlignmentInBytes, but averaging across
// all LGRPs can produce a non-aligned result. We align the value here because
// it may be used directly for TLAB allocation, which requires the allocation
// size to be properly aligned.
size_t aligned_average = align_down(average_free_in_bytes, MinObjAlignmentInBytes);
return aligned_average;
}
// Bias region towards the first-touching lgrp. Set the right page sizes.
void MutableNUMASpace::bias_region(MemRegion mr, uint lgrp_id) {
assert(is_aligned(mr.start(), page_size()), "precondition");
assert(is_aligned(mr.end(), page_size()), "precondition");
if (mr.is_empty()) {
return;
}
// First we tell the OS which page size we want in the given range. The underlying
// large page can be broken down if we require small pages.
os::realign_memory((char*) mr.start(), mr.byte_size(), page_size());
// Then we uncommit the pages in the range.
os::disclaim_memory((char*) mr.start(), mr.byte_size());
// And make them local/first-touch biased.
os::numa_make_local((char*)mr.start(), mr.byte_size(), checked_cast<int>(lgrp_id));
}
// Update space layout. Perform adaptation.
void MutableNUMASpace::update() {
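// Only re-layout if new allocation-rate samples have arrived since the last
// adaptation; initialize() records samples_count() into adaptation_cycles().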
if (UseAdaptiveNUMAChunkSizing && adaptation_cycles() < samples_count()) {
// A NUMA space is never mangled
initialize(region(),
SpaceDecorator::Clear,
SpaceDecorator::DontMangle);
}
}
// Accumulate statistics about the allocation rate of each lgrp.
void MutableNUMASpace::accumulate_statistics() {
if (UseAdaptiveNUMAChunkSizing) {
for (int i = 0; i < lgrp_spaces()->length(); i++) {
lgrp_spaces()->at(i)->sample();
}
increment_samples_count();
}
}
// Get the current size of a chunk.
// This function computes the size of the chunk based on the
// difference between chunk ends. This allows it to work correctly in
// case the whole space is resized and during the process of adaptive
// chunk resizing.
size_t MutableNUMASpace::current_chunk_size(int i) {
HeapWord *cur_end, *prev_end;
if (i == 0) {
prev_end = bottom();
} else {
prev_end = lgrp_spaces()->at(i - 1)->space()->end();
}
if (i == lgrp_spaces()->length() - 1) {
cur_end = end();
} else {
cur_end = lgrp_spaces()->at(i)->space()->end();
}
if (cur_end > prev_end) {
return pointer_delta(cur_end, prev_end, sizeof(char));
}
return 0;
}
// Return the default chunk size by equally dividing the space.
// page_size() aligned.
size_t MutableNUMASpace::default_chunk_size() {
// The number of pages may not be evenly divided.
return align_down(capacity_in_bytes() / lgrp_spaces()->length(), page_size());
}
// Produce a new chunk size. page_size() aligned.
// This function is expected to be called on a sequence of i's from 0 to
// lgrp_spaces()->length().
size_t MutableNUMASpace::adaptive_chunk_size(int i, size_t limit) {
size_t pages_available = capacity_in_bytes() / page_size();
for (int j = 0; j < i; j++) {
pages_available -= align_down(current_chunk_size(j), page_size()) / page_size();
}
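// Reserve at least one page for each of the chunks that follow this one.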
pages_available -= lgrp_spaces()->length() - i - 1;
assert(pages_available > 0, "No pages left");
float alloc_rate = 0;
for (int j = i; j < lgrp_spaces()->length(); j++) {
alloc_rate += lgrp_spaces()->at(j)->alloc_rate()->average();
}
size_t chunk_size = 0;
if (alloc_rate > 0) {
LGRPSpace *ls = lgrp_spaces()->at(i);
chunk_size = (size_t)(ls->alloc_rate()->average() / alloc_rate * pages_available) * page_size();
}
chunk_size = MAX2(chunk_size, page_size());
if (limit > 0) {
limit = align_down(limit, page_size());
if (chunk_size > current_chunk_size(i)) {
size_t upper_bound = pages_available * page_size();
if (upper_bound > limit &&
current_chunk_size(i) < upper_bound - limit) {
// The resulting upper bound should not exceed the available
// amount of memory (pages_available * page_size()).
upper_bound = current_chunk_size(i) + limit;
}
chunk_size = MIN2(chunk_size, upper_bound);
} else {
size_t lower_bound = page_size();
if (current_chunk_size(i) > limit) { // lower_bound shouldn't underflow.
lower_bound = current_chunk_size(i) - limit;
}
chunk_size = MAX2(chunk_size, lower_bound);
}
}
assert(chunk_size <= pages_available * page_size(), "Chunk size out of range");
return chunk_size;
}
// Return the bottom_region and the top_region. Align them to page_size() boundary.
// |------------------new_region---------------------------------|
// |----bottom_region--|---intersection---|------top_region------|
void MutableNUMASpace::select_tails(MemRegion new_region, MemRegion intersection,
MemRegion* bottom_region, MemRegion *top_region) {
assert(is_aligned(new_region.start(), page_size()), "precondition");
assert(is_aligned(new_region.end(), page_size()), "precondition");
assert(is_aligned(intersection.start(), page_size()), "precondition");
assert(is_aligned(intersection.end(), page_size()), "precondition");
// Is there bottom?
if (new_region.start() < intersection.start()) { // Yes
*bottom_region = MemRegion(new_region.start(), intersection.start());
} else {
*bottom_region = MemRegion();
}
// Is there top?
if (intersection.end() < new_region.end()) { // Yes
*top_region = MemRegion(intersection.end(), new_region.end());
} else {
*top_region = MemRegion();
}
}
void MutableNUMASpace::initialize(MemRegion mr,
bool clear_space,
bool mangle_space,
bool setup_pages,
WorkerThreads* pretouch_workers) {
assert(clear_space, "Reallocation will destroy data!");
assert(lgrp_spaces()->length() > 0, "There should be at least one space");
assert(is_aligned(mr.start(), page_size()), "precondition");
assert(is_aligned(mr.end(), page_size()), "precondition");
MemRegion old_region = region(), new_region;
set_bottom(mr.start());
set_end(mr.end());
// Must always clear the space
clear(SpaceDecorator::DontMangle);
size_t num_pages = mr.byte_size() / page_size();
if (num_pages < (size_t)lgrp_spaces()->length()) {
log_warning(gc)("Degraded NUMA config: #os-pages (%zu) < #CPU (%d); space-size: %zu, page-size: %zu",
num_pages, lgrp_spaces()->length(), mr.byte_size(), page_size());
// Keep only as many lgrp spaces as there are pages.
lgrp_spaces()->trunc_to((int)num_pages);
}
// Handle space resize
MemRegion top_region, bottom_region;
if (!old_region.equals(region())) {
new_region = mr;
MemRegion intersection = new_region.intersection(old_region);
if (intersection.is_empty()) {
intersection = MemRegion(new_region.start(), new_region.start());
}
select_tails(new_region, intersection, &bottom_region, &top_region);
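// Newly added head and tail pages will belong to the first and last chunks
// respectively, so bias them to those lgrps right away.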
bias_region(bottom_region, lgrp_spaces()->at(0)->lgrp_id());
bias_region(top_region, lgrp_spaces()->at(lgrp_spaces()->length() - 1)->lgrp_id());
}
// Check whether the space layout has changed significantly.
// This happens when the space has been resized so that either head or tail
// chunk became less than a page.
bool layout_valid = UseAdaptiveNUMAChunkSizing &&
current_chunk_size(0) > page_size() &&
current_chunk_size(lgrp_spaces()->length() - 1) > page_size();
for (int i = 0; i < lgrp_spaces()->length(); i++) {
LGRPSpace *ls = lgrp_spaces()->at(i);
MutableSpace *s = ls->space();
old_region = s->region();
size_t chunk_byte_size = 0;
if (i < lgrp_spaces()->length() - 1) {
if (!UseAdaptiveNUMAChunkSizing ||
NUMAChunkResizeWeight == 0 ||
samples_count() < AdaptiveSizePolicyReadyThreshold) {
// No adaptation. Divide the space equally.
chunk_byte_size = default_chunk_size();
} else if (!layout_valid || NUMASpaceResizeRate == 0) {
// Fast adaptation. If no space resize rate is set, resize
// the chunks instantly.
chunk_byte_size = adaptive_chunk_size(i, 0);
} else {
// Slow adaptation. Resize the chunks moving no more than
// NUMASpaceResizeRate bytes per collection.
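// The divisor is the triangular number 1 + 2 + ... + n (n = number of lgrps),
// and chunk i may move up to limit * (i + 1) bytes, so (ignoring the
// page_size() floor) the per-chunk limits sum to at most NUMASpaceResizeRate
// per collection. Illustrative example (not from the source): with 4 lgrps the
// divisor is 10, so chunk 0 may move at most NUMASpaceResizeRate/10 bytes and
// chunk 2 at most 3x that.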
size_t limit = NUMASpaceResizeRate /
(lgrp_spaces()->length() * (lgrp_spaces()->length() + 1) / 2);
chunk_byte_size = adaptive_chunk_size(i, MAX2(limit * (i + 1), page_size()));
}
assert(chunk_byte_size >= page_size(), "Chunk size too small");
assert(chunk_byte_size <= capacity_in_bytes(), "Sanity check");
}
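// Lay out this chunk's region. MemRegion is constructed here from a start
// address and a size in words, hence the byte-to-word shift below.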
if (i == 0) { // Bottom chunk
if (i != lgrp_spaces()->length() - 1) {
new_region = MemRegion(bottom(), chunk_byte_size >> LogHeapWordSize);
} else {
new_region = MemRegion(bottom(), end());
}
} else if (i < lgrp_spaces()->length() - 1) { // Middle chunks
MutableSpace* ps = lgrp_spaces()->at(i - 1)->space();
new_region = MemRegion(ps->end(),
chunk_byte_size >> LogHeapWordSize);
} else { // Top chunk
MutableSpace* ps = lgrp_spaces()->at(i - 1)->space();
new_region = MemRegion(ps->end(), end());
}
guarantee(region().contains(new_region), "Region invariant");
// The general case:
// |---------------------|--invalid---|--------------------------|
// |------------------new_region---------------------------------|
// |----bottom_region--|---intersection---|------top_region------|
// |----old_region----|
// The intersection part has all pages in place; we don't need to migrate them.
// Pages for the top and bottom part should be freed and then reallocated.
MemRegion intersection = old_region.intersection(new_region);
if (intersection.start() == nullptr || intersection.end() == nullptr) {
intersection = MemRegion(new_region.start(), new_region.start());
}
select_tails(new_region, intersection, &bottom_region, &top_region);
// In a system with static binding we have to change the bias whenever
// we reshape the heap.
bias_region(bottom_region, ls->lgrp_id());
bias_region(top_region, ls->lgrp_id());
if (AlwaysPreTouch) {
PretouchTask::pretouch("ParallelGC PreTouch bottom_region", (char*)bottom_region.start(), (char*)bottom_region.end(),
page_size(), pretouch_workers);
PretouchTask::pretouch("ParallelGC PreTouch top_region", (char*)top_region.start(), (char*)top_region.end(),
page_size(), pretouch_workers);
}
// Clear space (set top = bottom) but never mangle.
s->initialize(new_region, SpaceDecorator::Clear, SpaceDecorator::DontMangle, MutableSpace::DontSetupPages);
}
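// Record how many samples this layout reflects; update() compares this
// against samples_count() to decide when to adapt again.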
set_adaptation_cycles(samples_count());
}
// Set the top of the whole space.
// Mark the holes in chunks below the top() as invalid.
void MutableNUMASpace::set_top(HeapWord* value) {
bool found_top = false;
for (int i = 0; i < lgrp_spaces()->length();) {
LGRPSpace *ls = lgrp_spaces()->at(i);
MutableSpace *s = ls->space();
if (s->contains(value)) {
// Check if setting the chunk's top to a given value would create a hole less than
// a minimal object; assuming that's not the last chunk in which case we don't care.
if (i < lgrp_spaces()->length() - 1) {
size_t remainder = pointer_delta(s->end(), value);
const size_t min_fill_size = CollectedHeap::min_fill_size();
if (remainder < min_fill_size && remainder > 0) {
// Add a minimum size filler object; it will cross the chunk boundary.
CollectedHeap::fill_with_object(value, min_fill_size);
value += min_fill_size;
assert(!s->contains(value), "Should be in the next chunk");
// Restart the loop from the same chunk, since the value has moved
// to the next one.
continue;
}
}
s->set_top(value);
found_top = true;
} else {
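// Chunks after the one containing the new top become empty (top == bottom);
// chunks before it are considered full (top == end).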
if (found_top) {
s->set_top(s->bottom());
} else {
s->set_top(s->end());
}
}
i++;
}
MutableSpace::set_top(value);
}
void MutableNUMASpace::clear(bool mangle_space) {
MutableSpace::set_top(bottom());
for (int i = 0; i < lgrp_spaces()->length(); i++) {
// Never mangle NUMA spaces because the mangling will
// bind the memory to a possibly unwanted lgroup.
lgrp_spaces()->at(i)->space()->clear(SpaceDecorator::DontMangle);
}
}
MutableNUMASpace::LGRPSpace *MutableNUMASpace::lgrp_space_for_current_thread() const {
const int lgrp_id = os::numa_get_group_id();
int lgrp_spaces_index = lgrp_spaces()->find_if([&](LGRPSpace* space) {
return space->lgrp_id() == (uint)lgrp_id;
});
if (lgrp_spaces_index == -1) {
// Running on a CPU whose lgrp has no memory (no matching space); fall back to
// a space chosen by lgrp_id modulo the number of spaces.
lgrp_spaces_index = lgrp_id % lgrp_spaces()->length();
}
return lgrp_spaces()->at(lgrp_spaces_index);
}
HeapWord* MutableNUMASpace::cas_allocate(size_t size) {
LGRPSpace *ls = lgrp_space_for_current_thread();
MutableSpace *s = ls->space();
HeapWord *p = s->cas_allocate(size);
if (p != nullptr) {
size_t remainder = pointer_delta(s->end(), p + size);
if (remainder < CollectedHeap::min_fill_size() && remainder > 0) {
if (s->cas_deallocate(p, size)) {
// We were the last to allocate and created a fragment less than
// a minimal object.
p = nullptr;
} else {
guarantee(false, "Deallocation should always succeed");
}
}
}
if (p != nullptr) {
HeapWord* cur_top, *cur_chunk_top = p + size;
while ((cur_top = top()) < cur_chunk_top) { // Keep _top updated.
if (top_addr()->compare_set(cur_top, cur_chunk_top)) {
break;
}
}
}
if (p == nullptr) {
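// Remember the failure; the adaptive chunk sizing uses it (presumably via
// LGRPSpace::sample()) to treat this chunk as too small and grow it.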
ls->set_allocation_failed();
}
return p;
}
void MutableNUMASpace::print_short_on(outputStream* st) const {
MutableSpace::print_short_on(st);
st->print(" (");
for (int i = 0; i < lgrp_spaces()->length(); i++) {
st->print("lgrp %u: ", lgrp_spaces()->at(i)->lgrp_id());
lgrp_spaces()->at(i)->space()->print_short_on(st);
if (i < lgrp_spaces()->length() - 1) {
st->print(", ");
}
}
st->print(")");
}
void MutableNUMASpace::print_on(outputStream* st, const char* prefix) const {
MutableSpace::print_on(st, prefix);
StreamIndentor si(st, 1);
for (int i = 0; i < lgrp_spaces()->length(); i++) {
LGRPSpace *ls = lgrp_spaces()->at(i);
FormatBuffer<128> lgrp_message("lgrp %u ", ls->lgrp_id());
ls->space()->print_on(st, lgrp_message);
if (NUMAStats) {
StreamIndentor si2(st, 1);
for (int j = 0; j < lgrp_spaces()->length(); j++) {
lgrp_spaces()->at(j)->accumulate_statistics(page_size());
}
st->print("local/remote/unbiased/uncommitted: %zuK/"
"%zuK/%zuK/%zuK\n",
ls->space_stats()->_local_space / K,
ls->space_stats()->_remote_space / K,
ls->space_stats()->_unbiased_space / K,
ls->space_stats()->_uncommited_space / K);
}
}
}
void MutableNUMASpace::verify() {
// This can be called after setting an arbitrary value to the space's top,
// so an object can cross the chunk boundary. We ensure the parsability
// of the space and just walk the objects in linear fashion.
ensure_parsability();
MutableSpace::verify();
}
// Scan pages and gather stats about page placement and size.
void MutableNUMASpace::LGRPSpace::accumulate_statistics(size_t page_size) {
clear_space_stats();
char *start = (char*)align_up(space()->bottom(), page_size);
char* end = (char*)align_down(space()->end(), page_size);
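// Walk the space in batches of pages and query the NUMA node each page
// currently resides on.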
for (char *p = start; p < end; ) {
static const size_t PagesPerIteration = 128;
const void* pages[PagesPerIteration];
int lgrp_ids[PagesPerIteration];
size_t npages = 0;
for (; npages < PagesPerIteration && p < end; p += os::vm_page_size()) {
pages[npages++] = p;
}
if (os::numa_get_group_ids_for_range(pages, lgrp_ids, npages)) {
for (size_t i = 0; i < npages; i++) {
if (lgrp_ids[i] < 0) {
space_stats()->_uncommited_space += os::vm_page_size();
} else if (checked_cast<uint>(lgrp_ids[i]) == lgrp_id()) {
space_stats()->_local_space += os::vm_page_size();
} else {
space_stats()->_remote_space += os::vm_page_size();
}
}
}
}
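// Bytes outside the page-aligned [start, end) range could not be attributed
// to a node above; count those head and tail bytes as unbiased.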
space_stats()->_unbiased_space = pointer_delta(start, space()->bottom(), sizeof(char)) +
pointer_delta(space()->end(), end, sizeof(char));
}