comparison src/share/vm/gc_implementation/g1/concurrentG1Refine.cpp @ 889:15c5903cf9e1

6865703: G1: Parallelize hot card cache cleanup
Summary: Have the GC worker threads clear the hot card cache in parallel by having each worker thread claim a chunk of the card cache and process the cards in that chunk. The size of the chunks that each thread will claim is determined at VM initialization from the size of the card cache and the number of worker threads.
Reviewed-by: jmasa, tonyp
author johnc
date Mon, 03 Aug 2009 12:59:30 -0700
parents bd02caa94611
children 6cb8e9df7174
comparing 888:59726d16b30d with 889:15c5903cf9e1
@@ -55,12 +55,12 @@
   }
   return 0;
 }
 
 void ConcurrentG1Refine::init() {
+  G1CollectedHeap* g1h = G1CollectedHeap::heap();
   if (G1ConcRSLogCacheSize > 0 || G1ConcRSCountTraversals) {
-    G1CollectedHeap* g1h = G1CollectedHeap::heap();
     _n_card_counts =
       (unsigned) (g1h->g1_reserved_obj_bytes() >> CardTableModRefBS::card_shift);
     _card_counts = NEW_C_HEAP_ARRAY(unsigned char, _n_card_counts);
     for (size_t i = 0; i < _n_card_counts; i++) _card_counts[i] = 0;
     ModRefBarrierSet* bs = g1h->mr_bs();
@@ -81,10 +81,16 @@
     _use_cache = true;
     _hot_cache_size = (1 << G1ConcRSLogCacheSize);
     _hot_cache = NEW_C_HEAP_ARRAY(jbyte*, _hot_cache_size);
     _n_hot = 0;
     _hot_cache_idx = 0;
+
+    // For refining the cards in the hot cache in parallel
+    int n_workers = (ParallelGCThreads > 0 ?
+                     g1h->workers()->total_workers() : 1);
+    _hot_cache_par_chunk_size = MAX2(1, _hot_cache_size / n_workers);
+    _hot_cache_par_claimed_idx = 0;
   }
 }
 
 void ConcurrentG1Refine::stop() {
   if (_threads != NULL) {
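The hunk above sizes the per-worker chunk by dividing the hot cache evenly among the workers, with a floor of one card so the chunk size stays positive even when the cache is smaller than the worker count. A minimal standalone sketch of that computation; the MAX2 macro mirrors the HotSpot one, and the concrete values are illustrative examples, not defaults taken from the sources:

    #include <stdio.h>

    #define MAX2(a, b) ((a) > (b) ? (a) : (b))

    int main() {
      int log_cache_size = 10;                  // example stand-in for G1ConcRSLogCacheSize
      int hot_cache_size = 1 << log_cache_size; // 1024 cache entries
      int n_workers = 8;                        // example total GC worker threads
      // Floor of 1: never hand a worker an empty chunk.
      int chunk_size = MAX2(1, hot_cache_size / n_workers);
      printf("parallel chunk size = %d\n", chunk_size); // prints 128
      return 0;
    }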
@@ -159,21 +165,27 @@
 }
 
 
 void ConcurrentG1Refine::clean_up_cache(int worker_i, G1RemSet* g1rs) {
   assert(!use_cache(), "cache should be disabled");
-  int start_ind = _hot_cache_idx-1;
-  for (int i = 0; i < _n_hot; i++) {
-    int ind = start_ind - i;
-    if (ind < 0) ind = ind + _hot_cache_size;
-    jbyte* entry = _hot_cache[ind];
-    if (entry != NULL) {
-      g1rs->concurrentRefineOneCard(entry, worker_i);
+  int start_idx;
+
+  while ((start_idx = _hot_cache_par_claimed_idx) < _n_hot) { // read once
+    int end_idx = start_idx + _hot_cache_par_chunk_size;
+
+    if (start_idx ==
+        Atomic::cmpxchg(end_idx, &_hot_cache_par_claimed_idx, start_idx)) {
+      // The current worker has successfully claimed the chunk [start_idx..end_idx)
+      end_idx = MIN2(end_idx, _n_hot);
+      for (int i = start_idx; i < end_idx; i++) {
+        jbyte* entry = _hot_cache[i];
+        if (entry != NULL) {
+          g1rs->concurrentRefineOneCard(entry, worker_i);
+        }
+      }
     }
   }
-  _n_hot = 0;
-  _hot_cache_idx = 0;
 }
 
 void ConcurrentG1Refine::clear_and_record_card_counts() {
   if (G1ConcRSLogCacheSize == 0 && !G1ConcRSCountTraversals) return;
   _n_periods++;
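The claiming protocol in the new clean_up_cache() can be read in isolation: each worker snapshots the shared claim index, tries to advance it by one chunk with a compare-and-swap, and processes the claimed range only if its CAS wins. A simplified self-contained sketch of that pattern, using C++11 std::atomic in place of HotSpot's Atomic::cmpxchg (the original code predates C++11 atomics; all names below are illustrative stand-ins):

    #include <atomic>

    const int n_cards    = 1024;     // stands in for _n_hot
    const int chunk_size = 128;      // stands in for _hot_cache_par_chunk_size
    std::atomic<int> claimed_idx(0); // stands in for _hot_cache_par_claimed_idx

    // Run concurrently by every worker; each chunk [start_idx, end_idx)
    // is processed by exactly one thread, the one whose CAS succeeds.
    void clean_up_cache_sketch(void (*refine_one_card)(int card)) {
      int start_idx;
      while ((start_idx = claimed_idx.load()) < n_cards) {
        int end_idx = start_idx + chunk_size;
        // compare_exchange_strong plays the role of Atomic::cmpxchg: it
        // advances claimed_idx to end_idx only if it still equals start_idx.
        if (claimed_idx.compare_exchange_strong(start_idx, end_idx)) {
          if (end_idx > n_cards) end_idx = n_cards; // clip the final chunk
          for (int i = start_idx; i < end_idx; i++) {
            refine_one_card(i);
          }
        }
        // A failed CAS means another worker claimed this chunk; loop
        // around and re-read the updated index.
      }
    }

Because the claim index only ever moves forward, a worker that arrives after the index has reached the end of the cache simply falls out of the loop, so any number of workers can share the cleanup without further coordination.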