Skip to content

Commit

Permalink
8260591: Shenandoah: improve parallelism for concurrent thread root scans
Browse files Browse the repository at this point in the history

Reviewed-by: zgu, rkennke
  • Loading branch information
shipilev committed Feb 1, 2021
1 parent cf94208 commit ab727f0
Show file tree
Hide file tree
Showing 3 changed files with 32 additions and 19 deletions.
6 changes: 3 additions & 3 deletions src/hotspot/share/gc/shenandoah/shenandoahConcurrentGC.cpp
Expand Up @@ -596,9 +596,9 @@ class ShenandoahConcurrentEvacUpdateThreadTask : public AbstractGangTask {
ShenandoahJavaThreadsIterator _java_threads;

public:
ShenandoahConcurrentEvacUpdateThreadTask() :
ShenandoahConcurrentEvacUpdateThreadTask(uint n_workers) :
AbstractGangTask("Shenandoah Evacuate/Update Concurrent Thread Roots"),
_java_threads(ShenandoahPhaseTimings::conc_thread_roots) {
_java_threads(ShenandoahPhaseTimings::conc_thread_roots, n_workers) {
}

void work(uint worker_id) {
Expand All @@ -614,7 +614,7 @@ void ShenandoahConcurrentGC::op_thread_roots() {
ShenandoahHeap* const heap = ShenandoahHeap::heap();
assert(heap->is_evacuation_in_progress(), "Checked by caller");
ShenandoahGCWorkerPhase worker_phase(ShenandoahPhaseTimings::conc_thread_roots);
ShenandoahConcurrentEvacUpdateThreadTask task;
ShenandoahConcurrentEvacUpdateThreadTask task(heap->workers()->active_workers());
heap->workers()->run_task(&task);
}

Expand Down
37 changes: 23 additions & 14 deletions src/hotspot/share/gc/shenandoah/shenandoahRootProcessor.cpp
Expand Up @@ -37,20 +37,24 @@
#include "runtime/stackWatermarkSet.inline.hpp"
#include "runtime/thread.hpp"

ShenandoahJavaThreadsIterator::ShenandoahJavaThreadsIterator(ShenandoahPhaseTimings::Phase phase) :
ShenandoahJavaThreadsIterator::ShenandoahJavaThreadsIterator(ShenandoahPhaseTimings::Phase phase, uint n_workers) :
_threads(),
_length(_threads.length()),
_stride(MAX2(1u, _length / n_workers / _chunks_per_worker)),
_claimed(0),
_phase(phase) {
}

uint ShenandoahJavaThreadsIterator::claim() {
return Atomic::fetch_and_add(&_claimed, 1u);
return Atomic::fetch_and_add(&_claimed, _stride);
}

void ShenandoahJavaThreadsIterator::threads_do(ThreadClosure* cl, uint worker_id) {
ShenandoahWorkerTimingsTracker timer(_phase, ShenandoahPhaseTimings::ThreadRoots, worker_id);
for (uint i = claim(); i < _threads.length(); i = claim()) {
cl->do_thread(_threads.thread_at(i));
for (uint i = claim(); i < _length; i = claim()) {
for (uint t = i; t < MIN2(_length, i + _stride); t++) {
cl->do_thread(thread_at(t));
}
}
}

Expand Down Expand Up @@ -206,7 +210,7 @@ void ShenandoahConcurrentMarkThreadClosure::do_thread(Thread* thread) {
ShenandoahConcurrentRootScanner::ShenandoahConcurrentRootScanner(uint n_workers,
ShenandoahPhaseTimings::Phase phase) :
ShenandoahRootProcessor(phase),
_java_threads(phase),
_java_threads(phase, n_workers),
_vm_roots(phase),
_cld_roots(phase, n_workers),
_codecache_snapshot(NULL),
Expand All @@ -230,19 +234,24 @@ void ShenandoahConcurrentRootScanner::roots_do(OopClosure* oops, uint worker_id)
ShenandoahHeap* const heap = ShenandoahHeap::heap();
CLDToOopClosure clds_cl(oops, ClassLoaderData::_claim_strong);

ShenandoahConcurrentMarkThreadClosure thr_cl(oops);
_java_threads.threads_do(&thr_cl, worker_id);

// Process light-weight/limited-parallelism roots first
_vm_roots.oops_do(oops, worker_id);

if (!heap->unload_classes()) {
_cld_roots.cld_do(&clds_cl, worker_id);
ShenandoahWorkerTimingsTracker timer(_phase, ShenandoahPhaseTimings::CodeCacheRoots, worker_id);
CodeBlobToOopClosure blobs(oops, !CodeBlobToOopClosure::FixRelocations);
_codecache_snapshot->parallel_blobs_do(&blobs);
} else {
if (heap->unload_classes()) {
_cld_roots.always_strong_cld_do(&clds_cl, worker_id);
} else {
_cld_roots.cld_do(&clds_cl, worker_id);

{
ShenandoahWorkerTimingsTracker timer(_phase, ShenandoahPhaseTimings::CodeCacheRoots, worker_id);
CodeBlobToOopClosure blobs(oops, !CodeBlobToOopClosure::FixRelocations);
_codecache_snapshot->parallel_blobs_do(&blobs);
}
}

// Process heavy-weight/fully parallel roots last
ShenandoahConcurrentMarkThreadClosure thr_cl(oops);
_java_threads.threads_do(&thr_cl, worker_id);
}

void ShenandoahConcurrentRootScanner::update_tlab_stats() {
Expand Down
8 changes: 6 additions & 2 deletions src/hotspot/share/gc/shenandoah/shenandoahRootProcessor.hpp
Expand Up @@ -67,16 +67,20 @@ class ShenandoahVMRoots {

class ShenandoahJavaThreadsIterator {
private:
static const uint _chunks_per_worker = 16; // educated guess

ThreadsListHandle _threads;
uint const _length;
uint const _stride;
volatile uint _claimed;
ShenandoahPhaseTimings::Phase _phase;

uint claim();
public:
ShenandoahJavaThreadsIterator(ShenandoahPhaseTimings::Phase phase);
ShenandoahJavaThreadsIterator(ShenandoahPhaseTimings::Phase phase, uint n_workers);
void threads_do(ThreadClosure* cl, uint worker_id);

uint length() const { return _threads.length(); }
uint length() const { return _length; }
Thread* thread_at(uint index) const { return _threads.thread_at(index); }
};

Expand Down

0 comments on commit ab727f0

Please sign in to comment.