comparison src/share/vm/gc_implementation/concurrentMarkSweep/concurrentMarkSweepGeneration.cpp @ 2369:92da084fefc9

6668573: CMS: reference processing crash if ParallelCMSThreads > ParallelGCThreads
Summary: Use _max_num_q = max(discovery_degree, processing_degree), and let balance_queues() redistribute from discovery_degree to processing_degree of queues. This should also allow a more dynamic and flexible parallelism policy in the future.
Reviewed-by: jmasa, johnc
author ysr
date Thu, 17 Mar 2011 10:32:46 -0700
parents a181f3a124dd
children b099aaf51bf8
comparing revision 2368:dde920245681 with revision 2369:92da084fefc9
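The Summary above is terse, so here is a minimal standalone sketch of the sizing and balancing idea it describes. This is plain C++, not HotSpot code; DiscoveredLists and everything inside it are hypothetical names used only for illustration. The queue array is sized by max(discovery_degree, processing_degree) so that a discovering worker whose id is at least the processing degree can no longer index past the end of the array (the crash in the bug title), and a balance step then redistributes the discovered entries onto the processing_degree queues that will actually be drained.

// Illustrative sketch only, assuming the policy stated in the Summary.
#include <algorithm>
#include <cassert>
#include <cstddef>
#include <vector>

struct DiscoveredLists {
  size_t _processing_degree;                 // workers that will process later
  size_t _max_num_q;                         // queues actually allocated
  std::vector<std::vector<void*> > _queues;

  DiscoveredLists(size_t discovery_degree, size_t processing_degree)
    : _processing_degree(processing_degree),
      // Size by the larger of the two degrees, per the Summary.
      _max_num_q(std::max(discovery_degree, processing_degree)),
      _queues(_max_num_q) {}

  // Discovering workers are numbered 0 .. discovery_degree - 1, so with the
  // max() sizing above the index is always in bounds.
  void discover(size_t worker_id, void* ref) {
    assert(worker_id < _max_num_q);
    _queues[worker_id].push_back(ref);
  }

  // Analogue of balance_queues(): spread whatever discovery produced across
  // the first _processing_degree queues before processing starts.
  void balance_queues() {
    std::vector<void*> all;
    for (size_t i = 0; i < _max_num_q; ++i) {
      all.insert(all.end(), _queues[i].begin(), _queues[i].end());
      _queues[i].clear();
    }
    for (size_t i = 0; i < all.size(); ++i) {
      _queues[i % _processing_degree].push_back(all[i]);
    }
  }
};

The changeset below wires the same idea into the ReferenceProcessor constructor call and into the places that toggle MT discovery and MT processing.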
@@ -290,17 +290,19 @@
 }
 
 void CMSCollector::ref_processor_init() {
   if (_ref_processor == NULL) {
     // Allocate and initialize a reference processor
-    _ref_processor = ReferenceProcessor::create_ref_processor(
-                                    _span,                               // span
-                                    _cmsGen->refs_discovery_is_atomic(), // atomic_discovery
-                                    _cmsGen->refs_discovery_is_mt(),     // mt_discovery
-                                    &_is_alive_closure,
-                                    ParallelGCThreads,
-                                    ParallelRefProcEnabled);
+    _ref_processor =
+      new ReferenceProcessor(_span,                               // span
+                             (ParallelGCThreads > 1) && ParallelRefProcEnabled, // mt processing
+                             (int) ParallelGCThreads,             // mt processing degree
+                             _cmsGen->refs_discovery_is_mt(),     // mt discovery
+                             (int) MAX2(ConcGCThreads, ParallelGCThreads), // mt discovery degree
+                             _cmsGen->refs_discovery_is_atomic(), // discovery is not atomic
+                             &_is_alive_closure,                  // closure for liveness info
+                             false);                              // next field updates do not need write barrier
     // Initialize the _ref_processor field of CMSGen
     _cmsGen->set_ref_processor(_ref_processor);
 
     // Allocate a dummy ref processor for perm gen.
     ReferenceProcessor* rp2 = new ReferenceProcessor();
@@ -639,11 +641,11 @@
     warning("Failed to allocate CMS Revisit Stack");
     return;
   }
 
   // Support for multi-threaded concurrent phases
-  if (CollectedHeap::use_parallel_gc_threads() && CMSConcurrentMTEnabled) {
+  if (CMSConcurrentMTEnabled) {
     if (FLAG_IS_DEFAULT(ConcGCThreads)) {
       // just for now
       FLAG_SET_DEFAULT(ConcGCThreads, (ParallelGCThreads + 3)/4);
     }
     if (ConcGCThreads > 1) {
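A quick worked example of the ConcGCThreads default chosen in the hunk above: (ParallelGCThreads + 3)/4 is a ceiling division by four, so ParallelGCThreads = 13 gives (13 + 3)/4 = 4 concurrent marking threads, while any value from 1 through 4 gives 1.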
@@ -1988,21 +1990,20 @@
   }
 
   // Temporarily widen the span of the weak reference processing to
   // the entire heap.
   MemRegion new_span(GenCollectedHeap::heap()->reserved_region());
-  ReferenceProcessorSpanMutator x(ref_processor(), new_span);
-
+  ReferenceProcessorSpanMutator rp_mut_span(ref_processor(), new_span);
   // Temporarily, clear the "is_alive_non_header" field of the
   // reference processor.
-  ReferenceProcessorIsAliveMutator y(ref_processor(), NULL);
-
+  ReferenceProcessorIsAliveMutator rp_mut_closure(ref_processor(), NULL);
   // Temporarily make reference _processing_ single threaded (non-MT).
-  ReferenceProcessorMTProcMutator z(ref_processor(), false);
-
+  ReferenceProcessorMTProcMutator rp_mut_mt_processing(ref_processor(), false);
   // Temporarily make refs discovery atomic
-  ReferenceProcessorAtomicMutator w(ref_processor(), true);
+  ReferenceProcessorAtomicMutator rp_mut_atomic(ref_processor(), true);
+  // Temporarily make reference _discovery_ single threaded (non-MT)
+  ReferenceProcessorMTDiscoveryMutator rp_mut_discovery(ref_processor(), false);
 
   ref_processor()->set_enqueuing_is_done(false);
   ref_processor()->enable_discovery();
   ref_processor()->setup_policy(clear_all_soft_refs);
   // If an asynchronous collection finishes, the _modUnionTable is
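The rp_mut_* locals introduced above are scoped mutators: each one overrides a single ReferenceProcessor setting for the duration of the enclosing block and restores the previous value when it goes out of scope, so the collector cannot leave the processor in a temporary configuration on an early exit. A generic sketch of that save/restore idiom (ScopedFlagMutator is an illustrative name, not a HotSpot class):

// Illustrative only: records the old value in the constructor, installs the
// new one, and restores the old value in the destructor at scope exit.
class ScopedFlagMutator {
  bool* _flag;   // the setting being temporarily overridden
  bool  _saved;  // its value on entry
 public:
  ScopedFlagMutator(bool* flag, bool new_value)
    : _flag(flag), _saved(*flag) {
    *_flag = new_value;
  }
  ~ScopedFlagMutator() {
    *_flag = _saved;  // restored even on early return or exception
  }
};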
@@ -4263,13 +4264,11 @@
   cms_space ->initialize_sequential_subtasks_for_marking(num_workers);
   perm_space->initialize_sequential_subtasks_for_marking(num_workers);
 
   // Refs discovery is already non-atomic.
   assert(!ref_processor()->discovery_is_atomic(), "Should be non-atomic");
-  // Mutate the Refs discovery so it is MT during the
-  // multi-threaded marking phase.
-  ReferenceProcessorMTMutator mt(ref_processor(), num_workers > 1);
+  assert(ref_processor()->discovery_is_mt(), "Discovery should be MT");
   DEBUG_ONLY(RememberKlassesChecker cmx(should_unload_classes());)
   conc_workers()->start_task(&tsk);
   while (tsk.yielded()) {
     tsk.coordinator_yield();
     conc_workers()->continue_task(&tsk);
@@ -4318,10 +4317,12 @@
 
 bool CMSCollector::do_marking_st(bool asynch) {
   ResourceMark rm;
   HandleMark hm;
 
+  // Temporarily make refs discovery single threaded (non-MT)
+  ReferenceProcessorMTDiscoveryMutator rp_mut_discovery(ref_processor(), false);
   MarkFromRootsClosure markFromRootsClosure(this, _span, &_markBitMap,
     &_markStack, &_revisitStack, CMSYield && asynch);
   // the last argument to iterate indicates whether the iteration
   // should be incremental with periodic yields.
   _markBitMap.iterate(&markFromRootsClosure);
@@ -4356,14 +4357,10 @@
   assert(Thread::current()->is_ConcurrentGC_thread(), "Wrong thread");
   verify_work_stacks_empty();
   verify_overflow_empty();
   _abort_preclean = false;
   if (CMSPrecleaningEnabled) {
-    // Precleaning is currently not MT but the reference processor
-    // may be set for MT.  Disable it temporarily here.
-    ReferenceProcessor* rp = ref_processor();
-    ReferenceProcessorMTProcMutator z(rp, false);
     _eden_chunk_index = 0;
     size_t used = get_eden_used();
     size_t capacity = get_eden_capacity();
     // Don't start sampling unless we will get sufficiently
     // many samples.
@@ -4502,15 +4499,20 @@
 size_t CMSCollector::preclean_work(bool clean_refs, bool clean_survivor) {
   assert(_collectorState == Precleaning ||
          _collectorState == AbortablePreclean, "incorrect state");
   ResourceMark rm;
   HandleMark hm;
+
+  // Precleaning is currently not MT but the reference processor
+  // may be set for MT.  Disable it temporarily here.
+  ReferenceProcessor* rp = ref_processor();
+  ReferenceProcessorMTDiscoveryMutator rp_mut_discovery(rp, false);
+
   // Do one pass of scrubbing the discovered reference lists
   // to remove any reference objects with strongly-reachable
   // referents.
   if (clean_refs) {
-    ReferenceProcessor* rp = ref_processor();
     CMSPrecleanRefsYieldClosure yield_cl(this);
     assert(rp->span().equals(_span), "Spans should be equal");
     CMSKeepAliveClosure keep_alive(this, _span, &_markBitMap,
                                    &_markStack, &_revisitStack,
                                    true /* preclean */);
@@ -5576,12 +5578,14 @@
   // It turns out that even when we're using 1 thread, doing the work in a
   // separate thread causes wide variance in run times.  We can't help this
   // in the multi-threaded case, but we special-case n=1 here to get
   // repeatable measurements of the 1-thread overhead of the parallel code.
   if (n_workers > 1) {
-    // Make refs discovery MT-safe
-    ReferenceProcessorMTMutator mt(ref_processor(), true);
+    // Make refs discovery MT-safe, if it isn't already: it may not
+    // necessarily be so, since it's possible that we are doing
+    // ST marking.
+    ReferenceProcessorMTDiscoveryMutator mt(ref_processor(), true);
     GenCollectedHeap::StrongRootsScope srs(gch);
     workers->run_task(&tsk);
   } else {
     GenCollectedHeap::StrongRootsScope srs(gch);
     tsk.work(0);
@@ -5703,18 +5707,23 @@
     CMSCollector* collector,
     const MemRegion& span,
     CMSBitMap* mark_bit_map,
     AbstractWorkGang* workers,
     OopTaskQueueSet* task_queues):
+    // XXX Should superclass AGTWOQ also know about AWG since it knows
+    // about the task_queues used by the AWG? Then it could initialize
+    // the terminator() object.  See 6984287. The set_for_termination()
+    // below is a temporary band-aid for the regression in 6984287.
     AbstractGangTaskWOopQueues("Process referents by policy in parallel",
       task_queues),
     _task(task),
     _collector(collector), _span(span), _mark_bit_map(mark_bit_map)
   {
     assert(_collector->_span.equals(_span) && !_span.is_empty(),
            "Inconsistency in _span");
-  }
+    set_for_termination(workers->active_workers());
+  }
 
   OopTaskQueueSet* task_queues() { return queues(); }
 
   OopTaskQueue* work_queue(int i) { return task_queues()->queue(i); }
 
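The set_for_termination(workers->active_workers()) call added above feeds the number of active workers into the task's termination protocol, which the XXX comment flags as a stop-gap for 6984287. The count matters because a work-stealing phase can only be declared finished once every active worker has reported that it found no more work. A sketch of such a protocol (illustrative only; this is not HotSpot's ParallelTaskTerminator):

// Illustrative termination protocol: the phase is over only when all
// n_workers have offered termination, so the count must match the gang.
#include <atomic>

class SimpleTerminator {
  const unsigned        _n_workers;
  std::atomic<unsigned> _idle_count;
 public:
  explicit SimpleTerminator(unsigned n_workers)
    : _n_workers(n_workers), _idle_count(0) {}

  // Called by a worker whose local queue is empty and whose steal attempts
  // have failed; returns true once every worker is idle.
  bool offer_termination() {
    return _idle_count.fetch_add(1) + 1 == _n_workers;
  }

  // If the worker later finds more work, it withdraws its offer.
  void retract() {
    _idle_count.fetch_sub(1);
  }
};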
@@ -5872,12 +5881,11 @@
     // may have been a different number of threads doing the discovery
     // and a different number of discovered lists may have Ref objects.
     // That is OK as long as the Reference lists are balanced (see
     // balance_all_queues() and balance_queues()).
 
-
-    rp->set_mt_degree(ParallelGCThreads);
+    rp->set_active_mt_degree(ParallelGCThreads);
     CMSRefProcTaskExecutor task_executor(*this);
     rp->process_discovered_references(&_is_alive_closure,
                                       &cmsKeepAliveClosure,
                                       &cmsDrainMarkingStackClosure,
                                       &task_executor);
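To make the comment at the top of this hunk concrete: per the Summary, discovery and processing may run at different degrees. If, say, the discovery degree is 4 while ParallelGCThreads is 2 (the ParallelCMSThreads > ParallelGCThreads shape from the bug title), discovered Refs can sit on any of four lists, yet only two queues are processed here; balance_queues() redistributes the contents of the four lists over those two queues so each processing worker ends up with a comparable share, which is why the imbalance noted in the comment is harmless.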