| /* |
| * Copyright (C) 2014 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #include "concurrent_copying.h" |
| |
| #include "art_field-inl.h" |
| #include "barrier.h" |
| #include "base/enums.h" |
| #include "base/file_utils.h" |
| #include "base/histogram-inl.h" |
| #include "base/quasi_atomic.h" |
| #include "base/stl_util.h" |
| #include "base/systrace.h" |
| #include "class_root-inl.h" |
| #include "debugger.h" |
| #include "gc/accounting/atomic_stack.h" |
| #include "gc/accounting/heap_bitmap-inl.h" |
| #include "gc/accounting/mod_union_table-inl.h" |
| #include "gc/accounting/read_barrier_table.h" |
| #include "gc/accounting/space_bitmap-inl.h" |
| #include "gc/gc_pause_listener.h" |
| #include "gc/reference_processor.h" |
| #include "gc/space/image_space.h" |
| #include "gc/space/space-inl.h" |
| #include "gc/verification.h" |
| #include "image-inl.h" |
| #include "intern_table.h" |
| #include "mirror/class-inl.h" |
| #include "mirror/object-inl.h" |
| #include "mirror/object-refvisitor-inl.h" |
| #include "mirror/object_reference.h" |
| #include "scoped_thread_state_change-inl.h" |
| #include "thread-inl.h" |
| #include "thread_list.h" |
| #include "well_known_classes.h" |
| |
| namespace art { |
| namespace gc { |
| namespace collector { |
| |
| static constexpr size_t kDefaultGcMarkStackSize = 2 * MB; |
| // If kFilterModUnionCards then we attempt to filter cards that don't need to be dirty in the mod |
| // union table. Disabled since it does not seem to help the pause much. |
| static constexpr bool kFilterModUnionCards = kIsDebugBuild; |
| // If kDisallowReadBarrierDuringScan is true then the GC aborts if there are any read barrier that |
| // occur during ConcurrentCopying::Scan in GC thread. May be used to diagnose possibly unnecessary |
| // read barriers. Only enabled for kIsDebugBuild to avoid performance hit. |
| static constexpr bool kDisallowReadBarrierDuringScan = kIsDebugBuild; |
| // Slow path mark stack size, increase this if the stack is getting full and it is causing |
| // performance problems. |
| static constexpr size_t kReadBarrierMarkStackSize = 512 * KB; |
| // Size (in the number of objects) of the sweep array free buffer. |
| static constexpr size_t kSweepArrayChunkFreeSize = 1024; |
| // Verify that there are no missing card marks. |
| static constexpr bool kVerifyNoMissingCardMarks = kIsDebugBuild; |
| |
| ConcurrentCopying::ConcurrentCopying(Heap* heap, |
| bool young_gen, |
| bool use_generational_cc, |
| const std::string& name_prefix, |
| bool measure_read_barrier_slow_path) |
| : GarbageCollector(heap, |
| name_prefix + (name_prefix.empty() ? "" : " ") + |
| "concurrent copying"), |
| region_space_(nullptr), |
| gc_barrier_(new Barrier(0)), |
| gc_mark_stack_(accounting::ObjectStack::Create("concurrent copying gc mark stack", |
| kDefaultGcMarkStackSize, |
| kDefaultGcMarkStackSize)), |
| use_generational_cc_(use_generational_cc), |
| young_gen_(young_gen), |
| rb_mark_bit_stack_(accounting::ObjectStack::Create("rb copying gc mark stack", |
| kReadBarrierMarkStackSize, |
| kReadBarrierMarkStackSize)), |
| rb_mark_bit_stack_full_(false), |
| mark_stack_lock_("concurrent copying mark stack lock", kMarkSweepMarkStackLock), |
| thread_running_gc_(nullptr), |
| is_marking_(false), |
| is_using_read_barrier_entrypoints_(false), |
| is_active_(false), |
| is_asserting_to_space_invariant_(false), |
| region_space_bitmap_(nullptr), |
| heap_mark_bitmap_(nullptr), |
| live_stack_freeze_size_(0), |
| from_space_num_objects_at_first_pause_(0), |
| from_space_num_bytes_at_first_pause_(0), |
| mark_stack_mode_(kMarkStackModeOff), |
| weak_ref_access_enabled_(true), |
| copied_live_bytes_ratio_sum_(0.f), |
| gc_count_(0), |
| reclaimed_bytes_ratio_sum_(0.f), |
| cumulative_bytes_moved_(0), |
| cumulative_objects_moved_(0), |
| skipped_blocks_lock_("concurrent copying bytes blocks lock", kMarkSweepMarkStackLock), |
| measure_read_barrier_slow_path_(measure_read_barrier_slow_path), |
| mark_from_read_barrier_measurements_(false), |
| rb_slow_path_ns_(0), |
| rb_slow_path_count_(0), |
| rb_slow_path_count_gc_(0), |
| rb_slow_path_histogram_lock_("Read barrier histogram lock"), |
| rb_slow_path_time_histogram_("Mutator time in read barrier slow path", 500, 32), |
| rb_slow_path_count_total_(0), |
| rb_slow_path_count_gc_total_(0), |
| rb_table_(heap_->GetReadBarrierTable()), |
| force_evacuate_all_(false), |
| gc_grays_immune_objects_(false), |
| immune_gray_stack_lock_("concurrent copying immune gray stack lock", |
| kMarkSweepMarkStackLock), |
| num_bytes_allocated_before_gc_(0) { |
| static_assert(space::RegionSpace::kRegionSize == accounting::ReadBarrierTable::kRegionSize, |
| "The region space size and the read barrier table region size must match"); |
| CHECK(use_generational_cc_ || !young_gen_); |
| Thread* self = Thread::Current(); |
| { |
| ReaderMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| // Cache this so that we won't have to lock heap_bitmap_lock_ in |
| // Mark() which could cause a nested lock on heap_bitmap_lock_ |
| // when GC causes a RB while doing GC or a lock order violation |
| // (class_linker_lock_ and heap_bitmap_lock_). |
| heap_mark_bitmap_ = heap->GetMarkBitmap(); |
| } |
| { |
| MutexLock mu(self, mark_stack_lock_); |
| for (size_t i = 0; i < kMarkStackPoolSize; ++i) { |
| accounting::AtomicStack<mirror::Object>* mark_stack = |
| accounting::AtomicStack<mirror::Object>::Create( |
| "thread local mark stack", kMarkStackSize, kMarkStackSize); |
| pooled_mark_stacks_.push_back(mark_stack); |
| } |
| } |
| if (use_generational_cc_) { |
| // Allocate sweep array free buffer. |
| std::string error_msg; |
| sweep_array_free_buffer_mem_map_ = MemMap::MapAnonymous( |
| "concurrent copying sweep array free buffer", |
| RoundUp(kSweepArrayChunkFreeSize * sizeof(mirror::Object*), kPageSize), |
| PROT_READ | PROT_WRITE, |
| /*low_4gb=*/ false, |
| &error_msg); |
| CHECK(sweep_array_free_buffer_mem_map_.IsValid()) |
| << "Couldn't allocate sweep array free buffer: " << error_msg; |
| } |
| // Return type of these functions are different. And even though the base class |
| // is same, using ternary operator complains. |
| metrics::ArtMetrics* metrics = GetMetrics(); |
| are_metrics_initialized_ = true; |
| if (young_gen_) { |
| gc_time_histogram_ = metrics->YoungGcCollectionTime(); |
| metrics_gc_count_ = metrics->YoungGcCount(); |
| metrics_gc_count_delta_ = metrics->YoungGcCountDelta(); |
| gc_throughput_histogram_ = metrics->YoungGcThroughput(); |
| gc_tracing_throughput_hist_ = metrics->YoungGcTracingThroughput(); |
| gc_throughput_avg_ = metrics->YoungGcThroughputAvg(); |
| gc_tracing_throughput_avg_ = metrics->YoungGcTracingThroughputAvg(); |
| gc_scanned_bytes_ = metrics->YoungGcScannedBytes(); |
| gc_scanned_bytes_delta_ = metrics->YoungGcScannedBytesDelta(); |
| gc_freed_bytes_ = metrics->YoungGcFreedBytes(); |
| gc_freed_bytes_delta_ = metrics->YoungGcFreedBytesDelta(); |
| gc_duration_ = metrics->YoungGcDuration(); |
| gc_duration_delta_ = metrics->YoungGcDurationDelta(); |
| } else { |
| gc_time_histogram_ = metrics->FullGcCollectionTime(); |
| metrics_gc_count_ = metrics->FullGcCount(); |
| metrics_gc_count_delta_ = metrics->FullGcCountDelta(); |
| gc_throughput_histogram_ = metrics->FullGcThroughput(); |
| gc_tracing_throughput_hist_ = metrics->FullGcTracingThroughput(); |
| gc_throughput_avg_ = metrics->FullGcThroughputAvg(); |
| gc_tracing_throughput_avg_ = metrics->FullGcTracingThroughputAvg(); |
| gc_scanned_bytes_ = metrics->FullGcScannedBytes(); |
| gc_scanned_bytes_delta_ = metrics->FullGcScannedBytesDelta(); |
| gc_freed_bytes_ = metrics->FullGcFreedBytes(); |
| gc_freed_bytes_delta_ = metrics->FullGcFreedBytesDelta(); |
| gc_duration_ = metrics->FullGcDuration(); |
| gc_duration_delta_ = metrics->FullGcDurationDelta(); |
| } |
| } |
| |
| void ConcurrentCopying::MarkHeapReference(mirror::HeapReference<mirror::Object>* field, |
| bool do_atomic_update) { |
| Thread* const self = Thread::Current(); |
| if (UNLIKELY(do_atomic_update)) { |
| // Used to mark the referent in DelayReferenceReferent in transaction mode. |
| mirror::Object* from_ref = field->AsMirrorPtr(); |
| if (from_ref == nullptr) { |
| return; |
| } |
| mirror::Object* to_ref = Mark(self, from_ref); |
| if (from_ref != to_ref) { |
| do { |
| if (field->AsMirrorPtr() != from_ref) { |
| // Concurrently overwritten by a mutator. |
| break; |
| } |
| } while (!field->CasWeakRelaxed(from_ref, to_ref)); |
| } |
| } else { |
| // Used for preserving soft references, should be OK to not have a CAS here since there should be |
| // no other threads which can trigger read barriers on the same referent during reference |
| // processing. |
| field->Assign(Mark(self, field->AsMirrorPtr())); |
| } |
| } |
| |
| ConcurrentCopying::~ConcurrentCopying() { |
| STLDeleteElements(&pooled_mark_stacks_); |
| } |
| |
| void ConcurrentCopying::RunPhases() { |
| CHECK(kUseBakerReadBarrier || kUseTableLookupReadBarrier); |
| CHECK(!is_active_); |
| is_active_ = true; |
| Thread* self = Thread::Current(); |
| thread_running_gc_ = self; |
| Locks::mutator_lock_->AssertNotHeld(self); |
| { |
| ReaderMutexLock mu(self, *Locks::mutator_lock_); |
| InitializePhase(); |
| // In case of forced evacuation, all regions are evacuated and hence no |
| // need to compute live_bytes. |
| if (use_generational_cc_ && !young_gen_ && !force_evacuate_all_) { |
| MarkingPhase(); |
| } |
| } |
| if (kUseBakerReadBarrier && kGrayDirtyImmuneObjects) { |
| // Switch to read barrier mark entrypoints before we gray the objects. This is required in case |
| // a mutator sees a gray bit and dispatches on the entrypoint. (b/37876887). |
| ActivateReadBarrierEntrypoints(); |
| // Gray dirty immune objects concurrently to reduce GC pause times. We re-process gray cards in |
| // the pause. |
| ReaderMutexLock mu(self, *Locks::mutator_lock_); |
| GrayAllDirtyImmuneObjects(); |
| } |
| FlipThreadRoots(); |
| { |
| ReaderMutexLock mu(self, *Locks::mutator_lock_); |
| CopyingPhase(); |
| } |
| // Verify no from space refs. This causes a pause. |
| if (kEnableNoFromSpaceRefsVerification) { |
| TimingLogger::ScopedTiming split("(Paused)VerifyNoFromSpaceReferences", GetTimings()); |
| ScopedPause pause(this, false); |
| CheckEmptyMarkStack(); |
| if (kVerboseMode) { |
| LOG(INFO) << "Verifying no from-space refs"; |
| } |
| VerifyNoFromSpaceReferences(); |
| if (kVerboseMode) { |
| LOG(INFO) << "Done verifying no from-space refs"; |
| } |
| CheckEmptyMarkStack(); |
| } |
| { |
| ReaderMutexLock mu(self, *Locks::mutator_lock_); |
| ReclaimPhase(); |
| } |
| FinishPhase(); |
| CHECK(is_active_); |
| is_active_ = false; |
| thread_running_gc_ = nullptr; |
| } |
| |
| class ConcurrentCopying::ActivateReadBarrierEntrypointsCheckpoint : public Closure { |
| public: |
| explicit ActivateReadBarrierEntrypointsCheckpoint(ConcurrentCopying* concurrent_copying) |
| : concurrent_copying_(concurrent_copying) {} |
| |
| void Run(Thread* thread) override NO_THREAD_SAFETY_ANALYSIS { |
| // Note: self is not necessarily equal to thread since thread may be suspended. |
| Thread* self = Thread::Current(); |
| DCHECK(thread == self || |
| thread->IsSuspended() || |
| thread->GetState() == ThreadState::kWaitingPerformingGc) |
| << thread->GetState() << " thread " << thread << " self " << self; |
| // Switch to the read barrier entrypoints. |
| thread->SetReadBarrierEntrypoints(); |
| // If thread is a running mutator, then act on behalf of the garbage collector. |
| // See the code in ThreadList::RunCheckpoint. |
| concurrent_copying_->GetBarrier().Pass(self); |
| } |
| |
| private: |
| ConcurrentCopying* const concurrent_copying_; |
| }; |
| |
| class ConcurrentCopying::ActivateReadBarrierEntrypointsCallback : public Closure { |
| public: |
| explicit ActivateReadBarrierEntrypointsCallback(ConcurrentCopying* concurrent_copying) |
| : concurrent_copying_(concurrent_copying) {} |
| |
| void Run(Thread* self ATTRIBUTE_UNUSED) override REQUIRES(Locks::thread_list_lock_) { |
| // This needs to run under the thread_list_lock_ critical section in ThreadList::RunCheckpoint() |
| // to avoid a race with ThreadList::Register(). |
| CHECK(!concurrent_copying_->is_using_read_barrier_entrypoints_); |
| concurrent_copying_->is_using_read_barrier_entrypoints_ = true; |
| } |
| |
| private: |
| ConcurrentCopying* const concurrent_copying_; |
| }; |
| |
| void ConcurrentCopying::ActivateReadBarrierEntrypoints() { |
| Thread* const self = Thread::Current(); |
| ActivateReadBarrierEntrypointsCheckpoint checkpoint(this); |
| ThreadList* thread_list = Runtime::Current()->GetThreadList(); |
| gc_barrier_->Init(self, 0); |
| ActivateReadBarrierEntrypointsCallback callback(this); |
| const size_t barrier_count = thread_list->RunCheckpoint(&checkpoint, &callback); |
| // If there are no threads to wait which implies that all the checkpoint functions are finished, |
| // then no need to release the mutator lock. |
| if (barrier_count == 0) { |
| return; |
| } |
| ScopedThreadStateChange tsc(self, ThreadState::kWaitingForCheckPointsToRun); |
| gc_barrier_->Increment(self, barrier_count); |
| } |
| |
| void ConcurrentCopying::CreateInterRegionRefBitmaps() { |
| DCHECK(use_generational_cc_); |
| DCHECK(!region_space_inter_region_bitmap_.IsValid()); |
| DCHECK(!non_moving_space_inter_region_bitmap_.IsValid()); |
| DCHECK(region_space_ != nullptr); |
| DCHECK(heap_->non_moving_space_ != nullptr); |
| // Region-space |
| region_space_inter_region_bitmap_ = accounting::ContinuousSpaceBitmap::Create( |
| "region-space inter region ref bitmap", |
| reinterpret_cast<uint8_t*>(region_space_->Begin()), |
| region_space_->Limit() - region_space_->Begin()); |
| CHECK(region_space_inter_region_bitmap_.IsValid()) |
| << "Couldn't allocate region-space inter region ref bitmap"; |
| |
| // non-moving-space |
| non_moving_space_inter_region_bitmap_ = accounting::ContinuousSpaceBitmap::Create( |
| "non-moving-space inter region ref bitmap", |
| reinterpret_cast<uint8_t*>(heap_->non_moving_space_->Begin()), |
| heap_->non_moving_space_->Limit() - heap_->non_moving_space_->Begin()); |
| CHECK(non_moving_space_inter_region_bitmap_.IsValid()) |
| << "Couldn't allocate non-moving-space inter region ref bitmap"; |
| } |
| |
| void ConcurrentCopying::BindBitmaps() { |
| Thread* self = Thread::Current(); |
| WriterMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| // Mark all of the spaces we never collect as immune. |
| for (const auto& space : heap_->GetContinuousSpaces()) { |
| if (space->GetGcRetentionPolicy() == space::kGcRetentionPolicyNeverCollect || |
| space->GetGcRetentionPolicy() == space::kGcRetentionPolicyFullCollect) { |
| CHECK(space->IsZygoteSpace() || space->IsImageSpace()); |
| immune_spaces_.AddSpace(space); |
| } else { |
| CHECK(!space->IsZygoteSpace()); |
| CHECK(!space->IsImageSpace()); |
| CHECK(space == region_space_ || space == heap_->non_moving_space_); |
| if (use_generational_cc_) { |
| if (space == region_space_) { |
| region_space_bitmap_ = region_space_->GetMarkBitmap(); |
| } else if (young_gen_ && space->IsContinuousMemMapAllocSpace()) { |
| DCHECK_EQ(space->GetGcRetentionPolicy(), space::kGcRetentionPolicyAlwaysCollect); |
| space->AsContinuousMemMapAllocSpace()->BindLiveToMarkBitmap(); |
| } |
| if (young_gen_) { |
| // Age all of the cards for the region space so that we know which evac regions to scan. |
| heap_->GetCardTable()->ModifyCardsAtomic(space->Begin(), |
| space->End(), |
| AgeCardVisitor(), |
| VoidFunctor()); |
| } else { |
| // In a full-heap GC cycle, the card-table corresponding to region-space and |
| // non-moving space can be cleared, because this cycle only needs to |
| // capture writes during the marking phase of this cycle to catch |
| // objects that skipped marking due to heap mutation. Furthermore, |
| // if the next GC is a young-gen cycle, then it only needs writes to |
| // be captured after the thread-flip of this GC cycle, as that is when |
| // the young-gen for the next GC cycle starts getting populated. |
| heap_->GetCardTable()->ClearCardRange(space->Begin(), space->Limit()); |
| } |
| } else { |
| if (space == region_space_) { |
| // It is OK to clear the bitmap with mutators running since the only place it is read is |
| // VisitObjects which has exclusion with CC. |
| region_space_bitmap_ = region_space_->GetMarkBitmap(); |
| region_space_bitmap_->Clear(); |
| } |
| } |
| } |
| } |
| if (use_generational_cc_ && young_gen_) { |
| for (const auto& space : GetHeap()->GetDiscontinuousSpaces()) { |
| CHECK(space->IsLargeObjectSpace()); |
| space->AsLargeObjectSpace()->CopyLiveToMarked(); |
| } |
| } |
| } |
| |
| void ConcurrentCopying::InitializePhase() { |
| TimingLogger::ScopedTiming split("InitializePhase", GetTimings()); |
| num_bytes_allocated_before_gc_ = static_cast<int64_t>(heap_->GetBytesAllocated()); |
| if (kVerboseMode) { |
| LOG(INFO) << "GC InitializePhase"; |
| LOG(INFO) << "Region-space : " << reinterpret_cast<void*>(region_space_->Begin()) << "-" |
| << reinterpret_cast<void*>(region_space_->Limit()); |
| } |
| CheckEmptyMarkStack(); |
| rb_mark_bit_stack_full_ = false; |
| mark_from_read_barrier_measurements_ = measure_read_barrier_slow_path_; |
| if (measure_read_barrier_slow_path_) { |
| rb_slow_path_ns_.store(0, std::memory_order_relaxed); |
| rb_slow_path_count_.store(0, std::memory_order_relaxed); |
| rb_slow_path_count_gc_.store(0, std::memory_order_relaxed); |
| } |
| |
| immune_spaces_.Reset(); |
| bytes_moved_.store(0, std::memory_order_relaxed); |
| objects_moved_.store(0, std::memory_order_relaxed); |
| bytes_moved_gc_thread_ = 0; |
| objects_moved_gc_thread_ = 0; |
| bytes_scanned_ = 0; |
| GcCause gc_cause = GetCurrentIteration()->GetGcCause(); |
| |
| force_evacuate_all_ = false; |
| if (!use_generational_cc_ || !young_gen_) { |
| if (gc_cause == kGcCauseExplicit || |
| gc_cause == kGcCauseCollectorTransition || |
| GetCurrentIteration()->GetClearSoftReferences()) { |
| force_evacuate_all_ = true; |
| } |
| } |
| if (kUseBakerReadBarrier) { |
| updated_all_immune_objects_.store(false, std::memory_order_relaxed); |
| // GC may gray immune objects in the thread flip. |
| gc_grays_immune_objects_ = true; |
| if (kIsDebugBuild) { |
| MutexLock mu(Thread::Current(), immune_gray_stack_lock_); |
| DCHECK(immune_gray_stack_.empty()); |
| } |
| } |
| if (use_generational_cc_) { |
| done_scanning_.store(false, std::memory_order_release); |
| } |
| BindBitmaps(); |
| if (kVerboseMode) { |
| LOG(INFO) << "young_gen=" << std::boolalpha << young_gen_ << std::noboolalpha; |
| LOG(INFO) << "force_evacuate_all=" << std::boolalpha << force_evacuate_all_ << std::noboolalpha; |
| LOG(INFO) << "Largest immune region: " << immune_spaces_.GetLargestImmuneRegion().Begin() |
| << "-" << immune_spaces_.GetLargestImmuneRegion().End(); |
| for (space::ContinuousSpace* space : immune_spaces_.GetSpaces()) { |
| LOG(INFO) << "Immune space: " << *space; |
| } |
| LOG(INFO) << "GC end of InitializePhase"; |
| } |
| if (use_generational_cc_ && !young_gen_) { |
| region_space_bitmap_->Clear(); |
| } |
| mark_stack_mode_.store(ConcurrentCopying::kMarkStackModeThreadLocal, std::memory_order_relaxed); |
| // Mark all of the zygote large objects without graying them. |
| MarkZygoteLargeObjects(); |
| } |
| |
| // Used to switch the thread roots of a thread from from-space refs to to-space refs. |
| class ConcurrentCopying::ThreadFlipVisitor : public Closure, public RootVisitor { |
| public: |
| ThreadFlipVisitor(ConcurrentCopying* concurrent_copying, bool use_tlab) |
| : concurrent_copying_(concurrent_copying), use_tlab_(use_tlab) { |
| } |
| |
| void Run(Thread* thread) override REQUIRES_SHARED(Locks::mutator_lock_) { |
| // Note: self is not necessarily equal to thread since thread may be suspended. |
| Thread* self = Thread::Current(); |
| CHECK(thread == self || |
| thread->IsSuspended() || |
| thread->GetState() == ThreadState::kWaitingPerformingGc) |
| << thread->GetState() << " thread " << thread << " self " << self; |
| thread->SetIsGcMarkingAndUpdateEntrypoints(true); |
| if (use_tlab_ && thread->HasTlab()) { |
| // We should not reuse the partially utilized TLABs revoked here as they |
| // are going to be part of from-space. |
| if (ConcurrentCopying::kEnableFromSpaceAccountingCheck) { |
| // This must come before the revoke. |
| size_t thread_local_objects = thread->GetThreadLocalObjectsAllocated(); |
| concurrent_copying_->region_space_->RevokeThreadLocalBuffers(thread, /*reuse=*/ false); |
| reinterpret_cast<Atomic<size_t>*>( |
| &concurrent_copying_->from_space_num_objects_at_first_pause_)-> |
| fetch_add(thread_local_objects, std::memory_order_relaxed); |
| } else { |
| concurrent_copying_->region_space_->RevokeThreadLocalBuffers(thread, /*reuse=*/ false); |
| } |
| } |
| if (kUseThreadLocalAllocationStack) { |
| thread->RevokeThreadLocalAllocationStack(); |
| } |
| ReaderMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| // We can use the non-CAS VisitRoots functions below because we update thread-local GC roots |
| // only. |
| thread->VisitRoots(this, kVisitRootFlagAllRoots); |
| concurrent_copying_->GetBarrier().Pass(self); |
| } |
| |
| void VisitRoots(mirror::Object*** roots, |
| size_t count, |
| const RootInfo& info ATTRIBUTE_UNUSED) override |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| Thread* self = Thread::Current(); |
| for (size_t i = 0; i < count; ++i) { |
| mirror::Object** root = roots[i]; |
| mirror::Object* ref = *root; |
| if (ref != nullptr) { |
| mirror::Object* to_ref = concurrent_copying_->Mark(self, ref); |
| if (to_ref != ref) { |
| *root = to_ref; |
| } |
| } |
| } |
| } |
| |
| void VisitRoots(mirror::CompressedReference<mirror::Object>** roots, |
| size_t count, |
| const RootInfo& info ATTRIBUTE_UNUSED) override |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| Thread* self = Thread::Current(); |
| for (size_t i = 0; i < count; ++i) { |
| mirror::CompressedReference<mirror::Object>* const root = roots[i]; |
| if (!root->IsNull()) { |
| mirror::Object* ref = root->AsMirrorPtr(); |
| mirror::Object* to_ref = concurrent_copying_->Mark(self, ref); |
| if (to_ref != ref) { |
| root->Assign(to_ref); |
| } |
| } |
| } |
| } |
| |
| private: |
| ConcurrentCopying* const concurrent_copying_; |
| const bool use_tlab_; |
| }; |
| |
| // Called back from Runtime::FlipThreadRoots() during a pause. |
| class ConcurrentCopying::FlipCallback : public Closure { |
| public: |
| explicit FlipCallback(ConcurrentCopying* concurrent_copying) |
| : concurrent_copying_(concurrent_copying) { |
| } |
| |
| void Run(Thread* thread) override REQUIRES(Locks::mutator_lock_) { |
| ConcurrentCopying* cc = concurrent_copying_; |
| TimingLogger::ScopedTiming split("(Paused)FlipCallback", cc->GetTimings()); |
| // Note: self is not necessarily equal to thread since thread may be suspended. |
| Thread* self = Thread::Current(); |
| if (kVerifyNoMissingCardMarks && cc->young_gen_) { |
| cc->VerifyNoMissingCardMarks(); |
| } |
| CHECK_EQ(thread, self); |
| Locks::mutator_lock_->AssertExclusiveHeld(self); |
| space::RegionSpace::EvacMode evac_mode = space::RegionSpace::kEvacModeLivePercentNewlyAllocated; |
| if (cc->young_gen_) { |
| CHECK(!cc->force_evacuate_all_); |
| evac_mode = space::RegionSpace::kEvacModeNewlyAllocated; |
| } else if (cc->force_evacuate_all_) { |
| evac_mode = space::RegionSpace::kEvacModeForceAll; |
| } |
| { |
| TimingLogger::ScopedTiming split2("(Paused)SetFromSpace", cc->GetTimings()); |
| // Only change live bytes for 1-phase full heap CC, that is if we are either not running in |
| // generational-mode, or it's an 'evacuate-all' mode GC. |
| cc->region_space_->SetFromSpace( |
| cc->rb_table_, |
| evac_mode, |
| /*clear_live_bytes=*/ !cc->use_generational_cc_ || cc->force_evacuate_all_); |
| } |
| cc->SwapStacks(); |
| if (ConcurrentCopying::kEnableFromSpaceAccountingCheck) { |
| cc->RecordLiveStackFreezeSize(self); |
| cc->from_space_num_objects_at_first_pause_ = cc->region_space_->GetObjectsAllocated(); |
| cc->from_space_num_bytes_at_first_pause_ = cc->region_space_->GetBytesAllocated(); |
| } |
| cc->is_marking_ = true; |
| if (kIsDebugBuild && !cc->use_generational_cc_) { |
| cc->region_space_->AssertAllRegionLiveBytesZeroOrCleared(); |
| } |
| Runtime* runtime = Runtime::Current(); |
| if (UNLIKELY(runtime->IsActiveTransaction())) { |
| CHECK(runtime->IsAotCompiler()); |
| TimingLogger::ScopedTiming split3("(Paused)VisitTransactionRoots", cc->GetTimings()); |
| runtime->VisitTransactionRoots(cc); |
| } |
| if (kUseBakerReadBarrier && kGrayDirtyImmuneObjects) { |
| cc->GrayAllNewlyDirtyImmuneObjects(); |
| if (kIsDebugBuild) { |
| // Check that all non-gray immune objects only reference immune objects. |
| cc->VerifyGrayImmuneObjects(); |
| } |
| } |
| ObjPtr<mirror::Class> java_lang_Object = |
| GetClassRoot<mirror::Object, kWithoutReadBarrier>(runtime->GetClassLinker()); |
| DCHECK(java_lang_Object != nullptr); |
| cc->java_lang_Object_ = down_cast<mirror::Class*>(cc->Mark(thread, java_lang_Object.Ptr())); |
| } |
| |
| private: |
| ConcurrentCopying* const concurrent_copying_; |
| }; |
| |
| class ConcurrentCopying::VerifyGrayImmuneObjectsVisitor { |
| public: |
| explicit VerifyGrayImmuneObjectsVisitor(ConcurrentCopying* collector) |
| : collector_(collector) {} |
| |
| void operator()(ObjPtr<mirror::Object> obj, MemberOffset offset, bool /* is_static */) |
| const ALWAYS_INLINE REQUIRES_SHARED(Locks::mutator_lock_) |
| REQUIRES_SHARED(Locks::heap_bitmap_lock_) { |
| CheckReference(obj->GetFieldObject<mirror::Object, kVerifyNone, kWithoutReadBarrier>(offset), |
| obj, offset); |
| } |
| |
| void operator()(ObjPtr<mirror::Class> klass, ObjPtr<mirror::Reference> ref) const |
| REQUIRES_SHARED(Locks::mutator_lock_) ALWAYS_INLINE { |
| CHECK(klass->IsTypeOfReferenceClass()); |
| CheckReference(ref->GetReferent<kWithoutReadBarrier>(), |
| ref, |
| mirror::Reference::ReferentOffset()); |
| } |
| |
| void VisitRootIfNonNull(mirror::CompressedReference<mirror::Object>* root) const |
| ALWAYS_INLINE |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (!root->IsNull()) { |
| VisitRoot(root); |
| } |
| } |
| |
| void VisitRoot(mirror::CompressedReference<mirror::Object>* root) const |
| ALWAYS_INLINE |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| CheckReference(root->AsMirrorPtr(), nullptr, MemberOffset(0)); |
| } |
| |
| private: |
| ConcurrentCopying* const collector_; |
| |
| void CheckReference(ObjPtr<mirror::Object> ref, |
| ObjPtr<mirror::Object> holder, |
| MemberOffset offset) const |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (ref != nullptr) { |
| if (!collector_->immune_spaces_.ContainsObject(ref.Ptr())) { |
| // Not immune, must be a zygote large object. |
| space::LargeObjectSpace* large_object_space = |
| Runtime::Current()->GetHeap()->GetLargeObjectsSpace(); |
| CHECK(large_object_space->Contains(ref.Ptr()) && |
| large_object_space->IsZygoteLargeObject(Thread::Current(), ref.Ptr())) |
| << "Non gray object references non immune, non zygote large object "<< ref << " " |
| << mirror::Object::PrettyTypeOf(ref) << " in holder " << holder << " " |
| << mirror::Object::PrettyTypeOf(holder) << " offset=" << offset.Uint32Value(); |
| } else { |
| // Make sure the large object class is immune since we will never scan the large object. |
| CHECK(collector_->immune_spaces_.ContainsObject( |
| ref->GetClass<kVerifyNone, kWithoutReadBarrier>())); |
| } |
| } |
| } |
| }; |
| |
| void ConcurrentCopying::VerifyGrayImmuneObjects() { |
| TimingLogger::ScopedTiming split(__FUNCTION__, GetTimings()); |
| for (auto& space : immune_spaces_.GetSpaces()) { |
| DCHECK(space->IsImageSpace() || space->IsZygoteSpace()); |
| accounting::ContinuousSpaceBitmap* live_bitmap = space->GetLiveBitmap(); |
| VerifyGrayImmuneObjectsVisitor visitor(this); |
| live_bitmap->VisitMarkedRange(reinterpret_cast<uintptr_t>(space->Begin()), |
| reinterpret_cast<uintptr_t>(space->Limit()), |
| [&visitor](mirror::Object* obj) |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| // If an object is not gray, it should only have references to things in the immune spaces. |
| if (obj->GetReadBarrierState() != ReadBarrier::GrayState()) { |
| obj->VisitReferences</*kVisitNativeRoots=*/true, |
| kDefaultVerifyFlags, |
| kWithoutReadBarrier>(visitor, visitor); |
| } |
| }); |
| } |
| } |
| |
| class ConcurrentCopying::VerifyNoMissingCardMarkVisitor { |
| public: |
| VerifyNoMissingCardMarkVisitor(ConcurrentCopying* cc, ObjPtr<mirror::Object> holder) |
| : cc_(cc), |
| holder_(holder) {} |
| |
| void operator()(ObjPtr<mirror::Object> obj, |
| MemberOffset offset, |
| bool is_static ATTRIBUTE_UNUSED) const |
| REQUIRES_SHARED(Locks::mutator_lock_) ALWAYS_INLINE { |
| if (offset.Uint32Value() != mirror::Object::ClassOffset().Uint32Value()) { |
| CheckReference(obj->GetFieldObject<mirror::Object, kDefaultVerifyFlags, kWithoutReadBarrier>( |
| offset), offset.Uint32Value()); |
| } |
| } |
| void operator()(ObjPtr<mirror::Class> klass, |
| ObjPtr<mirror::Reference> ref) const |
| REQUIRES_SHARED(Locks::mutator_lock_) ALWAYS_INLINE { |
| CHECK(klass->IsTypeOfReferenceClass()); |
| this->operator()(ref, mirror::Reference::ReferentOffset(), false); |
| } |
| |
| void VisitRootIfNonNull(mirror::CompressedReference<mirror::Object>* root) const |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (!root->IsNull()) { |
| VisitRoot(root); |
| } |
| } |
| |
| void VisitRoot(mirror::CompressedReference<mirror::Object>* root) const |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| CheckReference(root->AsMirrorPtr()); |
| } |
| |
| void CheckReference(mirror::Object* ref, int32_t offset = -1) const |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (ref != nullptr && cc_->region_space_->IsInNewlyAllocatedRegion(ref)) { |
| LOG(FATAL_WITHOUT_ABORT) |
| << holder_->PrettyTypeOf() << "(" << holder_.Ptr() << ") references object " |
| << ref->PrettyTypeOf() << "(" << ref << ") in newly allocated region at offset=" << offset; |
| LOG(FATAL_WITHOUT_ABORT) << "time=" << cc_->region_space_->Time(); |
| constexpr const char* kIndent = " "; |
| LOG(FATAL_WITHOUT_ABORT) << cc_->DumpReferenceInfo(holder_.Ptr(), "holder_", kIndent); |
| LOG(FATAL_WITHOUT_ABORT) << cc_->DumpReferenceInfo(ref, "ref", kIndent); |
| LOG(FATAL) << "Unexpected reference to newly allocated region."; |
| } |
| } |
| |
| private: |
| ConcurrentCopying* const cc_; |
| const ObjPtr<mirror::Object> holder_; |
| }; |
| |
| void ConcurrentCopying::VerifyNoMissingCardMarks() { |
| auto visitor = [&](mirror::Object* obj) |
| REQUIRES(Locks::mutator_lock_) |
| REQUIRES(!mark_stack_lock_) { |
| // Objects on clean cards should never have references to newly allocated regions. Note |
| // that aged cards are also not clean. |
| if (heap_->GetCardTable()->GetCard(obj) == gc::accounting::CardTable::kCardClean) { |
| VerifyNoMissingCardMarkVisitor internal_visitor(this, /*holder=*/ obj); |
| obj->VisitReferences</*kVisitNativeRoots=*/true, kVerifyNone, kWithoutReadBarrier>( |
| internal_visitor, internal_visitor); |
| } |
| }; |
| TimingLogger::ScopedTiming split(__FUNCTION__, GetTimings()); |
| region_space_->Walk(visitor); |
| { |
| ReaderMutexLock rmu(Thread::Current(), *Locks::heap_bitmap_lock_); |
| heap_->GetLiveBitmap()->Visit(visitor); |
| } |
| } |
| |
| // Switch threads that from from-space to to-space refs. Forward/mark the thread roots. |
| void ConcurrentCopying::FlipThreadRoots() { |
| TimingLogger::ScopedTiming split("FlipThreadRoots", GetTimings()); |
| if (kVerboseMode || heap_->dump_region_info_before_gc_) { |
| LOG(INFO) << "time=" << region_space_->Time(); |
| region_space_->DumpNonFreeRegions(LOG_STREAM(INFO)); |
| } |
| Thread* self = Thread::Current(); |
| Locks::mutator_lock_->AssertNotHeld(self); |
| gc_barrier_->Init(self, 0); |
| ThreadFlipVisitor thread_flip_visitor(this, heap_->use_tlab_); |
| FlipCallback flip_callback(this); |
| |
| size_t barrier_count = Runtime::Current()->GetThreadList()->FlipThreadRoots( |
| &thread_flip_visitor, &flip_callback, this, GetHeap()->GetGcPauseListener()); |
| |
| { |
| ScopedThreadStateChange tsc(self, ThreadState::kWaitingForCheckPointsToRun); |
| gc_barrier_->Increment(self, barrier_count); |
| } |
| is_asserting_to_space_invariant_ = true; |
| QuasiAtomic::ThreadFenceForConstructor(); |
| if (kVerboseMode) { |
| LOG(INFO) << "time=" << region_space_->Time(); |
| region_space_->DumpNonFreeRegions(LOG_STREAM(INFO)); |
| LOG(INFO) << "GC end of FlipThreadRoots"; |
| } |
| } |
| |
| template <bool kConcurrent> |
| class ConcurrentCopying::GrayImmuneObjectVisitor { |
| public: |
| explicit GrayImmuneObjectVisitor(Thread* self) : self_(self) {} |
| |
| ALWAYS_INLINE void operator()(mirror::Object* obj) const REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (kUseBakerReadBarrier && obj->GetReadBarrierState() == ReadBarrier::NonGrayState()) { |
| if (kConcurrent) { |
| Locks::mutator_lock_->AssertSharedHeld(self_); |
| obj->AtomicSetReadBarrierState(ReadBarrier::NonGrayState(), ReadBarrier::GrayState()); |
| // Mod union table VisitObjects may visit the same object multiple times so we can't check |
| // the result of the atomic set. |
| } else { |
| Locks::mutator_lock_->AssertExclusiveHeld(self_); |
| obj->SetReadBarrierState(ReadBarrier::GrayState()); |
| } |
| } |
| } |
| |
| static void Callback(mirror::Object* obj, void* arg) REQUIRES_SHARED(Locks::mutator_lock_) { |
| reinterpret_cast<GrayImmuneObjectVisitor<kConcurrent>*>(arg)->operator()(obj); |
| } |
| |
| private: |
| Thread* const self_; |
| }; |
| |
| void ConcurrentCopying::GrayAllDirtyImmuneObjects() { |
| TimingLogger::ScopedTiming split("GrayAllDirtyImmuneObjects", GetTimings()); |
| accounting::CardTable* const card_table = heap_->GetCardTable(); |
| Thread* const self = Thread::Current(); |
| using VisitorType = GrayImmuneObjectVisitor</* kIsConcurrent= */ true>; |
| VisitorType visitor(self); |
| WriterMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| for (space::ContinuousSpace* space : immune_spaces_.GetSpaces()) { |
| DCHECK(space->IsImageSpace() || space->IsZygoteSpace()); |
| accounting::ModUnionTable* table = heap_->FindModUnionTableFromSpace(space); |
| // Mark all the objects on dirty cards since these may point to objects in other space. |
| // Once these are marked, the GC will eventually clear them later. |
| // Table is non null for boot image and zygote spaces. It is only null for application image |
| // spaces. |
| if (table != nullptr) { |
| table->ProcessCards(); |
| table->VisitObjects(&VisitorType::Callback, &visitor); |
| // Don't clear cards here since we need to rescan in the pause. If we cleared the cards here, |
| // there would be races with the mutator marking new cards. |
| } else { |
| // Keep cards aged if we don't have a mod-union table since we may need to scan them in future |
| // GCs. This case is for app images. |
| card_table->ModifyCardsAtomic( |
| space->Begin(), |
| space->End(), |
| [](uint8_t card) { |
| return (card != gc::accounting::CardTable::kCardClean) |
| ? gc::accounting::CardTable::kCardAged |
| : card; |
| }, |
| /* card modified visitor */ VoidFunctor()); |
| card_table->Scan</*kClearCard=*/ false>(space->GetMarkBitmap(), |
| space->Begin(), |
| space->End(), |
| visitor, |
| gc::accounting::CardTable::kCardAged); |
| } |
| } |
| } |
| |
| void ConcurrentCopying::GrayAllNewlyDirtyImmuneObjects() { |
| TimingLogger::ScopedTiming split("(Paused)GrayAllNewlyDirtyImmuneObjects", GetTimings()); |
| accounting::CardTable* const card_table = heap_->GetCardTable(); |
| using VisitorType = GrayImmuneObjectVisitor</* kIsConcurrent= */ false>; |
| Thread* const self = Thread::Current(); |
| VisitorType visitor(self); |
| WriterMutexLock mu(Thread::Current(), *Locks::heap_bitmap_lock_); |
| for (space::ContinuousSpace* space : immune_spaces_.GetSpaces()) { |
| DCHECK(space->IsImageSpace() || space->IsZygoteSpace()); |
| accounting::ModUnionTable* table = heap_->FindModUnionTableFromSpace(space); |
| |
| // Don't need to scan aged cards since we did these before the pause. Note that scanning cards |
| // also handles the mod-union table cards. |
| card_table->Scan</*kClearCard=*/ false>(space->GetMarkBitmap(), |
| space->Begin(), |
| space->End(), |
| visitor, |
| gc::accounting::CardTable::kCardDirty); |
| if (table != nullptr) { |
| // Add the cards to the mod-union table so that we can clear cards to save RAM. |
| table->ProcessCards(); |
| TimingLogger::ScopedTiming split2("(Paused)ClearCards", GetTimings()); |
| card_table->ClearCardRange(space->Begin(), |
| AlignDown(space->End(), accounting::CardTable::kCardSize)); |
| } |
| } |
| // Since all of the objects that may point to other spaces are gray, we can avoid all the read |
| // barriers in the immune spaces. |
| updated_all_immune_objects_.store(true, std::memory_order_relaxed); |
| } |
| |
| void ConcurrentCopying::SwapStacks() { |
| heap_->SwapStacks(); |
| } |
| |
| void ConcurrentCopying::RecordLiveStackFreezeSize(Thread* self) { |
| WriterMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| live_stack_freeze_size_ = heap_->GetLiveStack()->Size(); |
| } |
| |
| // Used to visit objects in the immune spaces. |
| inline void ConcurrentCopying::ScanImmuneObject(mirror::Object* obj) { |
| DCHECK(obj != nullptr); |
| DCHECK(immune_spaces_.ContainsObject(obj)); |
| // Update the fields without graying it or pushing it onto the mark stack. |
| if (use_generational_cc_ && young_gen_) { |
| // Young GC does not care about references to unevac space. It is safe to not gray these as |
| // long as scan immune objects happens after scanning the dirty cards. |
| Scan<true>(obj); |
| } else { |
| Scan<false>(obj); |
| } |
| } |
| |
| class ConcurrentCopying::ImmuneSpaceScanObjVisitor { |
| public: |
| explicit ImmuneSpaceScanObjVisitor(ConcurrentCopying* cc) |
| : collector_(cc) {} |
| |
| ALWAYS_INLINE void operator()(mirror::Object* obj) const REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (kUseBakerReadBarrier && kGrayDirtyImmuneObjects) { |
| // Only need to scan gray objects. |
| if (obj->GetReadBarrierState() == ReadBarrier::GrayState()) { |
| collector_->ScanImmuneObject(obj); |
| // Done scanning the object, go back to black (non-gray). |
| bool success = obj->AtomicSetReadBarrierState(ReadBarrier::GrayState(), |
| ReadBarrier::NonGrayState()); |
| CHECK(success) |
| << Runtime::Current()->GetHeap()->GetVerification()->DumpObjectInfo(obj, "failed CAS"); |
| } |
| } else { |
| collector_->ScanImmuneObject(obj); |
| } |
| } |
| |
| static void Callback(mirror::Object* obj, void* arg) REQUIRES_SHARED(Locks::mutator_lock_) { |
| reinterpret_cast<ImmuneSpaceScanObjVisitor*>(arg)->operator()(obj); |
| } |
| |
| private: |
| ConcurrentCopying* const collector_; |
| }; |
| |
| template <bool kAtomicTestAndSet> |
| class ConcurrentCopying::CaptureRootsForMarkingVisitor : public RootVisitor { |
| public: |
| explicit CaptureRootsForMarkingVisitor(ConcurrentCopying* cc, Thread* self) |
| : collector_(cc), self_(self) {} |
| |
| void VisitRoots(mirror::Object*** roots, |
| size_t count, |
| const RootInfo& info ATTRIBUTE_UNUSED) override |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| for (size_t i = 0; i < count; ++i) { |
| mirror::Object** root = roots[i]; |
| mirror::Object* ref = *root; |
| if (ref != nullptr && !collector_->TestAndSetMarkBitForRef<kAtomicTestAndSet>(ref)) { |
| collector_->PushOntoMarkStack(self_, ref); |
| } |
| } |
| } |
| |
| void VisitRoots(mirror::CompressedReference<mirror::Object>** roots, |
| size_t count, |
| const RootInfo& info ATTRIBUTE_UNUSED) override |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| for (size_t i = 0; i < count; ++i) { |
| mirror::CompressedReference<mirror::Object>* const root = roots[i]; |
| if (!root->IsNull()) { |
| mirror::Object* ref = root->AsMirrorPtr(); |
| if (!collector_->TestAndSetMarkBitForRef<kAtomicTestAndSet>(ref)) { |
| collector_->PushOntoMarkStack(self_, ref); |
| } |
| } |
| } |
| } |
| |
| private: |
| ConcurrentCopying* const collector_; |
| Thread* const self_; |
| }; |
| |
| class ConcurrentCopying::RevokeThreadLocalMarkStackCheckpoint : public Closure { |
| public: |
| RevokeThreadLocalMarkStackCheckpoint(ConcurrentCopying* concurrent_copying, |
| bool disable_weak_ref_access) |
| : concurrent_copying_(concurrent_copying), |
| disable_weak_ref_access_(disable_weak_ref_access) { |
| } |
| |
| void Run(Thread* thread) override NO_THREAD_SAFETY_ANALYSIS { |
| // Note: self is not necessarily equal to thread since thread may be suspended. |
| Thread* const self = Thread::Current(); |
| CHECK(thread == self || |
| thread->IsSuspended() || |
| thread->GetState() == ThreadState::kWaitingPerformingGc) |
| << thread->GetState() << " thread " << thread << " self " << self; |
| // Revoke thread local mark stacks. |
| { |
| MutexLock mu(self, concurrent_copying_->mark_stack_lock_); |
| accounting::AtomicStack<mirror::Object>* tl_mark_stack = thread->GetThreadLocalMarkStack(); |
| if (tl_mark_stack != nullptr) { |
| concurrent_copying_->revoked_mark_stacks_.push_back(tl_mark_stack); |
| thread->SetThreadLocalMarkStack(nullptr); |
| } |
| } |
| // Disable weak ref access. |
| if (disable_weak_ref_access_) { |
| thread->SetWeakRefAccessEnabled(false); |
| } |
| // If thread is a running mutator, then act on behalf of the garbage collector. |
| // See the code in ThreadList::RunCheckpoint. |
| concurrent_copying_->GetBarrier().Pass(self); |
| } |
| |
| protected: |
| ConcurrentCopying* const concurrent_copying_; |
| |
| private: |
| const bool disable_weak_ref_access_; |
| }; |
| |
| class ConcurrentCopying::CaptureThreadRootsForMarkingAndCheckpoint : |
| public RevokeThreadLocalMarkStackCheckpoint { |
| public: |
| explicit CaptureThreadRootsForMarkingAndCheckpoint(ConcurrentCopying* cc) : |
| RevokeThreadLocalMarkStackCheckpoint(cc, /* disable_weak_ref_access */ false) {} |
| |
| void Run(Thread* thread) override |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| Thread* const self = Thread::Current(); |
| ReaderMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| // We can use the non-CAS VisitRoots functions below because we update thread-local GC roots |
| // only. |
| CaptureRootsForMarkingVisitor</*kAtomicTestAndSet*/ true> visitor(concurrent_copying_, self); |
| thread->VisitRoots(&visitor, kVisitRootFlagAllRoots); |
| // If thread_running_gc_ performed the root visit then its thread-local |
| // mark-stack should be null as we directly push to gc_mark_stack_. |
| CHECK(self == thread || self->GetThreadLocalMarkStack() == nullptr); |
| // Barrier handling is done in the base class' Run() below. |
| RevokeThreadLocalMarkStackCheckpoint::Run(thread); |
| } |
| }; |
| |
| void ConcurrentCopying::CaptureThreadRootsForMarking() { |
| TimingLogger::ScopedTiming split("CaptureThreadRootsForMarking", GetTimings()); |
| if (kVerboseMode) { |
| LOG(INFO) << "time=" << region_space_->Time(); |
| region_space_->DumpNonFreeRegions(LOG_STREAM(INFO)); |
| } |
| Thread* const self = Thread::Current(); |
| CaptureThreadRootsForMarkingAndCheckpoint check_point(this); |
| ThreadList* thread_list = Runtime::Current()->GetThreadList(); |
| gc_barrier_->Init(self, 0); |
| size_t barrier_count = thread_list->RunCheckpoint(&check_point, /* callback */ nullptr); |
| // If there are no threads to wait which implys that all the checkpoint functions are finished, |
| // then no need to release the mutator lock. |
| if (barrier_count == 0) { |
| return; |
| } |
| Locks::mutator_lock_->SharedUnlock(self); |
| { |
| ScopedThreadStateChange tsc(self, ThreadState::kWaitingForCheckPointsToRun); |
| gc_barrier_->Increment(self, barrier_count); |
| } |
| Locks::mutator_lock_->SharedLock(self); |
| if (kVerboseMode) { |
| LOG(INFO) << "time=" << region_space_->Time(); |
| region_space_->DumpNonFreeRegions(LOG_STREAM(INFO)); |
| LOG(INFO) << "GC end of CaptureThreadRootsForMarking"; |
| } |
| } |
| |
| // Used to scan ref fields of an object. |
| template <bool kHandleInterRegionRefs> |
| class ConcurrentCopying::ComputeLiveBytesAndMarkRefFieldsVisitor { |
| public: |
| explicit ComputeLiveBytesAndMarkRefFieldsVisitor(ConcurrentCopying* collector, |
| size_t obj_region_idx) |
| : collector_(collector), |
| obj_region_idx_(obj_region_idx), |
| contains_inter_region_idx_(false) {} |
| |
| void operator()(mirror::Object* obj, MemberOffset offset, bool /* is_static */) const |
| ALWAYS_INLINE |
| REQUIRES_SHARED(Locks::mutator_lock_) |
| REQUIRES_SHARED(Locks::heap_bitmap_lock_) { |
| DCHECK_EQ(collector_->RegionSpace()->RegionIdxForRef(obj), obj_region_idx_); |
| DCHECK(kHandleInterRegionRefs || collector_->immune_spaces_.ContainsObject(obj)); |
| mirror::Object* ref = |
| obj->GetFieldObject<mirror::Object, kVerifyNone, kWithoutReadBarrier>(offset); |
| // TODO(lokeshgidra): Remove the following condition once b/173676071 is fixed. |
| if (UNLIKELY(ref == nullptr && offset == mirror::Object::ClassOffset())) { |
| // It has been verified as a race condition (see b/173676071)! After a small |
| // wait when we reload the class pointer, it turns out to be a valid class |
| // object. So as a workaround, we can continue execution and log an error |
| // that this happened. |
| for (size_t i = 0; i < 1000; i++) { |
| // Wait for 1ms at a time. Don't wait for more than 1 second in total. |
| usleep(1000); |
| ref = obj->GetClass<kVerifyNone, kWithoutReadBarrier>(); |
| if (ref != nullptr) { |
| LOG(ERROR) << "klass pointer for obj: " |
| << obj << " (" << mirror::Object::PrettyTypeOf(obj) |
| << ") found to be null first. Reloading after a small wait fetched klass: " |
| << ref << " (" << mirror::Object::PrettyTypeOf(ref) << ")"; |
| break; |
| } |
| } |
| |
| if (UNLIKELY(ref == nullptr)) { |
| // It must be heap corruption. Remove memory protection and dump data. |
| collector_->region_space_->Unprotect(); |
| LOG(FATAL_WITHOUT_ABORT) << "klass pointer for ref: " << obj << " found to be null."; |
| collector_->heap_->GetVerification()->LogHeapCorruption(obj, offset, ref, /* fatal */ true); |
| } |
| } |
| CheckReference(ref); |
| } |
| |
| void operator()(ObjPtr<mirror::Class> klass, ObjPtr<mirror::Reference> ref) const |
| REQUIRES_SHARED(Locks::mutator_lock_) ALWAYS_INLINE { |
| DCHECK(klass->IsTypeOfReferenceClass()); |
| // If the referent is not null, then we must re-visit the object during |
| // copying phase to enqueue it for delayed processing and setting |
| // read-barrier state to gray to ensure that call to GetReferent() triggers |
| // the read-barrier. We use same data structure that is used to remember |
| // objects with inter-region refs for this purpose too. |
| if (kHandleInterRegionRefs |
| && !contains_inter_region_idx_ |
| && ref->AsReference()->GetReferent<kWithoutReadBarrier>() != nullptr) { |
| contains_inter_region_idx_ = true; |
| } |
| } |
| |
| void VisitRootIfNonNull(mirror::CompressedReference<mirror::Object>* root) const |
| ALWAYS_INLINE |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (!root->IsNull()) { |
| VisitRoot(root); |
| } |
| } |
| |
| void VisitRoot(mirror::CompressedReference<mirror::Object>* root) const |
| ALWAYS_INLINE |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| CheckReference(root->AsMirrorPtr()); |
| } |
| |
| bool ContainsInterRegionRefs() const ALWAYS_INLINE REQUIRES_SHARED(Locks::mutator_lock_) { |
| return contains_inter_region_idx_; |
| } |
| |
| private: |
| void CheckReference(mirror::Object* ref) const |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (ref == nullptr) { |
| // Nothing to do. |
| return; |
| } |
| if (!collector_->TestAndSetMarkBitForRef(ref)) { |
| collector_->PushOntoLocalMarkStack(ref); |
| } |
| if (kHandleInterRegionRefs && !contains_inter_region_idx_) { |
| size_t ref_region_idx = collector_->RegionSpace()->RegionIdxForRef(ref); |
| // If a region-space object refers to an outside object, we will have a |
| // mismatch of region idx, but the object need not be re-visited in |
| // copying phase. |
| if (ref_region_idx != static_cast<size_t>(-1) && obj_region_idx_ != ref_region_idx) { |
| contains_inter_region_idx_ = true; |
| } |
| } |
| } |
| |
| ConcurrentCopying* const collector_; |
| const size_t obj_region_idx_; |
| mutable bool contains_inter_region_idx_; |
| }; |
| |
| void ConcurrentCopying::AddLiveBytesAndScanRef(mirror::Object* ref) { |
| DCHECK(ref != nullptr); |
| DCHECK(!immune_spaces_.ContainsObject(ref)); |
| DCHECK(TestMarkBitmapForRef(ref)); |
| size_t obj_region_idx = static_cast<size_t>(-1); |
| if (LIKELY(region_space_->HasAddress(ref))) { |
| obj_region_idx = region_space_->RegionIdxForRefUnchecked(ref); |
| // Add live bytes to the corresponding region |
| if (!region_space_->IsRegionNewlyAllocated(obj_region_idx)) { |
| // Newly Allocated regions are always chosen for evacuation. So no need |
| // to update live_bytes_. |
| size_t obj_size = ref->SizeOf<kDefaultVerifyFlags>(); |
| size_t alloc_size = RoundUp(obj_size, space::RegionSpace::kAlignment); |
| region_space_->AddLiveBytes(ref, alloc_size); |
| } |
| } |
| ComputeLiveBytesAndMarkRefFieldsVisitor</*kHandleInterRegionRefs*/ true> |
| visitor(this, obj_region_idx); |
| ref->VisitReferences</*kVisitNativeRoots=*/ true, kDefaultVerifyFlags, kWithoutReadBarrier>( |
| visitor, visitor); |
| // Mark the corresponding card dirty if the object contains any |
| // inter-region reference. |
| if (visitor.ContainsInterRegionRefs()) { |
| if (obj_region_idx == static_cast<size_t>(-1)) { |
| // If an inter-region ref has been found in a non-region-space, then it |
| // must be non-moving-space. This is because this function cannot be |
| // called on a immune-space object, and a large-object-space object has |
| // only class object reference, which is either in some immune-space, or |
| // in non-moving-space. |
| DCHECK(heap_->non_moving_space_->HasAddress(ref)); |
| non_moving_space_inter_region_bitmap_.Set(ref); |
| } else { |
| region_space_inter_region_bitmap_.Set(ref); |
| } |
| } |
| } |
| |
| template <bool kAtomic> |
| bool ConcurrentCopying::TestAndSetMarkBitForRef(mirror::Object* ref) { |
| accounting::ContinuousSpaceBitmap* bitmap = nullptr; |
| accounting::LargeObjectBitmap* los_bitmap = nullptr; |
| if (LIKELY(region_space_->HasAddress(ref))) { |
| bitmap = region_space_bitmap_; |
| } else if (heap_->GetNonMovingSpace()->HasAddress(ref)) { |
| bitmap = heap_->GetNonMovingSpace()->GetMarkBitmap(); |
| } else if (immune_spaces_.ContainsObject(ref)) { |
| // References to immune space objects are always live. |
| DCHECK(heap_mark_bitmap_->GetContinuousSpaceBitmap(ref)->Test(ref)); |
| return true; |
| } else { |
| // Should be a large object. Must be page aligned and the LOS must exist. |
| if (kIsDebugBuild |
| && (!IsAligned<kPageSize>(ref) || heap_->GetLargeObjectsSpace() == nullptr)) { |
| // It must be heap corruption. Remove memory protection and dump data. |
| region_space_->Unprotect(); |
| heap_->GetVerification()->LogHeapCorruption(/* obj */ nullptr, |
| MemberOffset(0), |
| ref, |
| /* fatal */ true); |
| } |
| los_bitmap = heap_->GetLargeObjectsSpace()->GetMarkBitmap(); |
| } |
| if (kAtomic) { |
| return (bitmap != nullptr) ? bitmap->AtomicTestAndSet(ref) : los_bitmap->AtomicTestAndSet(ref); |
| } else { |
| return (bitmap != nullptr) ? bitmap->Set(ref) : los_bitmap->Set(ref); |
| } |
| } |
| |
| bool ConcurrentCopying::TestMarkBitmapForRef(mirror::Object* ref) { |
| if (LIKELY(region_space_->HasAddress(ref))) { |
| return region_space_bitmap_->Test(ref); |
| } else if (heap_->GetNonMovingSpace()->HasAddress(ref)) { |
| return heap_->GetNonMovingSpace()->GetMarkBitmap()->Test(ref); |
| } else if (immune_spaces_.ContainsObject(ref)) { |
| // References to immune space objects are always live. |
| DCHECK(heap_mark_bitmap_->GetContinuousSpaceBitmap(ref)->Test(ref)); |
| return true; |
| } else { |
| // Should be a large object. Must be page aligned and the LOS must exist. |
| if (kIsDebugBuild |
| && (!IsAligned<kPageSize>(ref) || heap_->GetLargeObjectsSpace() == nullptr)) { |
| // It must be heap corruption. Remove memory protection and dump data. |
| region_space_->Unprotect(); |
| heap_->GetVerification()->LogHeapCorruption(/* obj */ nullptr, |
| MemberOffset(0), |
| ref, |
| /* fatal */ true); |
| } |
| return heap_->GetLargeObjectsSpace()->GetMarkBitmap()->Test(ref); |
| } |
| } |
| |
| void ConcurrentCopying::PushOntoLocalMarkStack(mirror::Object* ref) { |
| if (kIsDebugBuild) { |
| Thread *self = Thread::Current(); |
| DCHECK_EQ(thread_running_gc_, self); |
| DCHECK(self->GetThreadLocalMarkStack() == nullptr); |
| } |
| DCHECK_EQ(mark_stack_mode_.load(std::memory_order_relaxed), kMarkStackModeThreadLocal); |
| if (UNLIKELY(gc_mark_stack_->IsFull())) { |
| ExpandGcMarkStack(); |
| } |
| gc_mark_stack_->PushBack(ref); |
| } |
| |
| void ConcurrentCopying::ProcessMarkStackForMarkingAndComputeLiveBytes() { |
| // Process thread-local mark stack containing thread roots |
| ProcessThreadLocalMarkStacks(/* disable_weak_ref_access */ false, |
| /* checkpoint_callback */ nullptr, |
| [this] (mirror::Object* ref) |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| AddLiveBytesAndScanRef(ref); |
| }); |
| { |
| MutexLock mu(thread_running_gc_, mark_stack_lock_); |
| CHECK(revoked_mark_stacks_.empty()); |
| CHECK_EQ(pooled_mark_stacks_.size(), kMarkStackPoolSize); |
| } |
| |
| while (!gc_mark_stack_->IsEmpty()) { |
| mirror::Object* ref = gc_mark_stack_->PopBack(); |
| AddLiveBytesAndScanRef(ref); |
| } |
| } |
| |
| class ConcurrentCopying::ImmuneSpaceCaptureRefsVisitor { |
| public: |
| explicit ImmuneSpaceCaptureRefsVisitor(ConcurrentCopying* cc) : collector_(cc) {} |
| |
| ALWAYS_INLINE void operator()(mirror::Object* obj) const REQUIRES_SHARED(Locks::mutator_lock_) { |
| ComputeLiveBytesAndMarkRefFieldsVisitor</*kHandleInterRegionRefs*/ false> |
| visitor(collector_, /*obj_region_idx*/ static_cast<size_t>(-1)); |
| obj->VisitReferences</*kVisitNativeRoots=*/true, kDefaultVerifyFlags, kWithoutReadBarrier>( |
| visitor, visitor); |
| } |
| |
| static void Callback(mirror::Object* obj, void* arg) REQUIRES_SHARED(Locks::mutator_lock_) { |
| reinterpret_cast<ImmuneSpaceCaptureRefsVisitor*>(arg)->operator()(obj); |
| } |
| |
| private: |
| ConcurrentCopying* const collector_; |
| }; |
| |
| /* Invariants for two-phase CC |
| * =========================== |
| * A) Definitions |
| * --------------- |
| * 1) Black: marked in bitmap, rb_state is non-gray, and not in mark stack |
| * 2) Black-clean: marked in bitmap, and corresponding card is clean/aged |
| * 3) Black-dirty: marked in bitmap, and corresponding card is dirty |
| * 4) Gray: marked in bitmap, and exists in mark stack |
| * 5) Gray-dirty: marked in bitmap, rb_state is gray, corresponding card is |
| * dirty, and exists in mark stack |
| * 6) White: unmarked in bitmap, rb_state is non-gray, and not in mark stack |
| * |
| * B) Before marking phase |
| * ----------------------- |
| * 1) All objects are white |
| * 2) Cards are either clean or aged (cannot be asserted without a STW pause) |
| * 3) Mark bitmap is cleared |
| * 4) Mark stack is empty |
| * |
| * C) During marking phase |
| * ------------------------ |
| * 1) If a black object holds an inter-region or white reference, then its |
| * corresponding card is dirty. In other words, it changes from being |
| * black-clean to black-dirty |
| * 2) No black-clean object points to a white object |
| * |
| * D) After marking phase |
| * ----------------------- |
| * 1) There are no gray objects |
| * 2) All newly allocated objects are in from space |
| * 3) No white object can be reachable, directly or otherwise, from a |
| * black-clean object |
| * |
| * E) During copying phase |
| * ------------------------ |
| * 1) Mutators cannot observe white and black-dirty objects |
| * 2) New allocations are in to-space (newly allocated regions are part of to-space) |
| * 3) An object in mark stack must have its rb_state = Gray |
| * |
| * F) During card table scan |
| * -------------------------- |
| * 1) Referents corresponding to root references are gray or in to-space |
| * 2) Every path from an object that is read or written by a mutator during |
| * this period to a dirty black object goes through some gray object. |
| * Mutators preserve this by graying black objects as needed during this |
| * period. Ensures that a mutator never encounters a black dirty object. |
| * |
| * G) After card table scan |
| * ------------------------ |
| * 1) There are no black-dirty objects |
| * 2) Referents corresponding to root references are gray, black-clean or in |
| * to-space |
| * |
| * H) After copying phase |
| * ----------------------- |
| * 1) Mark stack is empty |
| * 2) No references into evacuated from-space |
| * 3) No reference to an object which is unmarked and is also not in newly |
| * allocated region. In other words, no reference to white objects. |
| */ |
| |
| void ConcurrentCopying::MarkingPhase() { |
| TimingLogger::ScopedTiming split("MarkingPhase", GetTimings()); |
| if (kVerboseMode) { |
| LOG(INFO) << "GC MarkingPhase"; |
| } |
| accounting::CardTable* const card_table = heap_->GetCardTable(); |
| Thread* const self = Thread::Current(); |
| CHECK_EQ(self, thread_running_gc_); |
| // Clear live_bytes_ of every non-free region, except the ones that are newly |
| // allocated. |
| region_space_->SetAllRegionLiveBytesZero(); |
| if (kIsDebugBuild) { |
| region_space_->AssertAllRegionLiveBytesZeroOrCleared(); |
| } |
| // Scan immune spaces |
| { |
| TimingLogger::ScopedTiming split2("ScanImmuneSpaces", GetTimings()); |
| for (auto& space : immune_spaces_.GetSpaces()) { |
| DCHECK(space->IsImageSpace() || space->IsZygoteSpace()); |
| accounting::ContinuousSpaceBitmap* live_bitmap = space->GetLiveBitmap(); |
| accounting::ModUnionTable* table = heap_->FindModUnionTableFromSpace(space); |
| ImmuneSpaceCaptureRefsVisitor visitor(this); |
| if (table != nullptr) { |
| table->VisitObjects(ImmuneSpaceCaptureRefsVisitor::Callback, &visitor); |
| } else { |
| WriterMutexLock rmu(Thread::Current(), *Locks::heap_bitmap_lock_); |
| card_table->Scan<false>( |
| live_bitmap, |
| space->Begin(), |
| space->Limit(), |
| visitor, |
| accounting::CardTable::kCardDirty - 1); |
| } |
| } |
| } |
| // Scan runtime roots |
| { |
| TimingLogger::ScopedTiming split2("VisitConcurrentRoots", GetTimings()); |
| CaptureRootsForMarkingVisitor visitor(this, self); |
| Runtime::Current()->VisitConcurrentRoots(&visitor, kVisitRootFlagAllRoots); |
| } |
| { |
| // TODO: don't visit the transaction roots if it's not active. |
| TimingLogger::ScopedTiming split2("VisitNonThreadRoots", GetTimings()); |
| CaptureRootsForMarkingVisitor visitor(this, self); |
| Runtime::Current()->VisitNonThreadRoots(&visitor); |
| } |
| // Capture thread roots |
| CaptureThreadRootsForMarking(); |
| // Process mark stack |
| ProcessMarkStackForMarkingAndComputeLiveBytes(); |
| |
| if (kVerboseMode) { |
| LOG(INFO) << "GC end of MarkingPhase"; |
| } |
| } |
| |
| template <bool kNoUnEvac> |
| void ConcurrentCopying::ScanDirtyObject(mirror::Object* obj) { |
| Scan<kNoUnEvac>(obj); |
| // Set the read-barrier state of a reference-type object to gray if its |
| // referent is not marked yet. This is to ensure that if GetReferent() is |
| // called, it triggers the read-barrier to process the referent before use. |
| if (UNLIKELY((obj->GetClass<kVerifyNone, kWithoutReadBarrier>()->IsTypeOfReferenceClass()))) { |
| mirror::Object* referent = |
| obj->AsReference<kVerifyNone, kWithoutReadBarrier>()->GetReferent<kWithoutReadBarrier>(); |
| if (referent != nullptr && !IsInToSpace(referent)) { |
| obj->AtomicSetReadBarrierState(ReadBarrier::NonGrayState(), ReadBarrier::GrayState()); |
| } |
| } |
| } |
| |
| // Concurrently mark roots that are guarded by read barriers and process the mark stack. |
| void ConcurrentCopying::CopyingPhase() { |
| TimingLogger::ScopedTiming split("CopyingPhase", GetTimings()); |
| if (kVerboseMode) { |
| LOG(INFO) << "GC CopyingPhase"; |
| } |
| Thread* self = Thread::Current(); |
| accounting::CardTable* const card_table = heap_->GetCardTable(); |
| if (kIsDebugBuild) { |
| MutexLock mu(self, *Locks::thread_list_lock_); |
| CHECK(weak_ref_access_enabled_); |
| } |
| |
| // Scan immune spaces. |
| // Update all the fields in the immune spaces first without graying the objects so that we |
| // minimize dirty pages in the immune spaces. Note mutators can concurrently access and gray some |
| // of the objects. |
| if (kUseBakerReadBarrier) { |
| gc_grays_immune_objects_ = false; |
| } |
| if (use_generational_cc_) { |
| if (kVerboseMode) { |
| LOG(INFO) << "GC ScanCardsForSpace"; |
| } |
| TimingLogger::ScopedTiming split2("ScanCardsForSpace", GetTimings()); |
| WriterMutexLock rmu(Thread::Current(), *Locks::heap_bitmap_lock_); |
| CHECK(!done_scanning_.load(std::memory_order_relaxed)); |
| if (kIsDebugBuild) { |
| // Leave some time for mutators to race ahead to try and find races between the GC card |
| // scanning and mutators reading references. |
| usleep(10 * 1000); |
| } |
| for (space::ContinuousSpace* space : GetHeap()->GetContinuousSpaces()) { |
| if (space->IsImageSpace() || space->IsZygoteSpace()) { |
| // Image and zygote spaces are already handled since we gray the objects in the pause. |
| continue; |
| } |
| // Scan all of the objects on dirty cards in unevac from space, and non moving space. These |
| // are from previous GCs (or from marking phase of 2-phase full GC) and may reference things |
| // in the from space. |
| // |
| // Note that we do not need to process the large-object space (the only discontinuous space) |
| // as it contains only large string objects and large primitive array objects, that have no |
| // reference to other objects, except their class. There is no need to scan these large |
| // objects, as the String class and the primitive array classes are expected to never move |
| // during a collection: |
| // - In the case where we run with a boot image, these classes are part of the image space, |
| // which is an immune space. |
| // - In the case where we run without a boot image, these classes are allocated in the |
| // non-moving space (see art::ClassLinker::InitWithoutImage). |
| card_table->Scan<false>( |
| space->GetMarkBitmap(), |
| space->Begin(), |
| space->End(), |
| [this, space](mirror::Object* obj) |
| REQUIRES(Locks::heap_bitmap_lock_) |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| // TODO: This code may be refactored to avoid scanning object while |
| // done_scanning_ is false by setting rb_state to gray, and pushing the |
| // object on mark stack. However, it will also require clearing the |
| // corresponding mark-bit and, for region space objects, |
| // decrementing the object's size from the corresponding region's |
| // live_bytes. |
| if (young_gen_) { |
| // Don't push or gray unevac refs. |
| if (kIsDebugBuild && space == region_space_) { |
| // We may get unevac large objects. |
| if (!region_space_->IsInUnevacFromSpace(obj)) { |
| CHECK(region_space_bitmap_->Test(obj)); |
| region_space_->DumpRegionForObject(LOG_STREAM(FATAL_WITHOUT_ABORT), obj); |
| LOG(FATAL) << "Scanning " << obj << " not in unevac space"; |
| } |
| } |
| ScanDirtyObject</*kNoUnEvac*/ true>(obj); |
| } else if (space != region_space_) { |
| DCHECK(space == heap_->non_moving_space_); |
| // We need to process un-evac references as they may be unprocessed, |
| // if they skipped the marking phase due to heap mutation. |
| ScanDirtyObject</*kNoUnEvac*/ false>(obj); |
| non_moving_space_inter_region_bitmap_.Clear(obj); |
| } else if (region_space_->IsInUnevacFromSpace(obj)) { |
| ScanDirtyObject</*kNoUnEvac*/ false>(obj); |
| region_space_inter_region_bitmap_.Clear(obj); |
| } |
| }, |
| accounting::CardTable::kCardAged); |
| |
| if (!young_gen_) { |
| auto visitor = [this](mirror::Object* obj) REQUIRES_SHARED(Locks::mutator_lock_) { |
| // We don't need to process un-evac references as any unprocessed |
| // ones will be taken care of in the card-table scan above. |
| ScanDirtyObject</*kNoUnEvac*/ true>(obj); |
| }; |
| if (space == region_space_) { |
| region_space_->ScanUnevacFromSpace(®ion_space_inter_region_bitmap_, visitor); |
| } else { |
| DCHECK(space == heap_->non_moving_space_); |
| non_moving_space_inter_region_bitmap_.VisitMarkedRange( |
| reinterpret_cast<uintptr_t>(space->Begin()), |
| reinterpret_cast<uintptr_t>(space->End()), |
| visitor); |
| } |
| } |
| } |
| // Done scanning unevac space. |
| done_scanning_.store(true, std::memory_order_release); |
| // NOTE: inter-region-ref bitmaps can be cleared here to release memory, if needed. |
| // Currently we do it in ReclaimPhase(). |
| if (kVerboseMode) { |
| LOG(INFO) << "GC end of ScanCardsForSpace"; |
| } |
| } |
| { |
| // For a sticky-bit collection, this phase needs to be after the card scanning since the |
| // mutator may read an unevac space object out of an image object. If the image object is no |
| // longer gray it will trigger a read barrier for the unevac space object. |
| TimingLogger::ScopedTiming split2("ScanImmuneSpaces", GetTimings()); |
| for (auto& space : immune_spaces_.GetSpaces()) { |
| DCHECK(space->IsImageSpace() || space->IsZygoteSpace()); |
| accounting::ContinuousSpaceBitmap* live_bitmap = space->GetLiveBitmap(); |
| accounting::ModUnionTable* table = heap_->FindModUnionTableFromSpace(space); |
| ImmuneSpaceScanObjVisitor visitor(this); |
| if (kUseBakerReadBarrier && kGrayDirtyImmuneObjects && table != nullptr) { |
| table->VisitObjects(ImmuneSpaceScanObjVisitor::Callback, &visitor); |
| } else { |
| WriterMutexLock rmu(Thread::Current(), *Locks::heap_bitmap_lock_); |
| card_table->Scan<false>( |
| live_bitmap, |
| space->Begin(), |
| space->Limit(), |
| visitor, |
| accounting::CardTable::kCardDirty - 1); |
| } |
| } |
| } |
| if (kUseBakerReadBarrier) { |
| // This release fence makes the field updates in the above loop visible before allowing mutator |
| // getting access to immune objects without graying it first. |
| updated_all_immune_objects_.store(true, std::memory_order_release); |
| // Now "un-gray" (conceptually blacken) immune objects concurrently accessed and grayed by |
| // mutators. We can't do this in the above loop because we would incorrectly disable the read |
| // barrier by un-graying (conceptually blackening) an object which may point to an unscanned, |
| // white object, breaking the to-space invariant (a mutator shall never observe a from-space |
| // (white) object). |
| // |
| // Make sure no mutators are in the middle of marking an immune object before un-graying |
| // (blackening) immune objects. |
| IssueEmptyCheckpoint(); |
| MutexLock mu(Thread::Current(), immune_gray_stack_lock_); |
| if (kVerboseMode) { |
| LOG(INFO) << "immune gray stack size=" << immune_gray_stack_.size(); |
| } |
| for (mirror::Object* obj : immune_gray_stack_) { |
| DCHECK_EQ(obj->GetReadBarrierState(), ReadBarrier::GrayState()); |
| bool success = obj->AtomicSetReadBarrierState(ReadBarrier::GrayState(), |
| ReadBarrier::NonGrayState()); |
| DCHECK(success); |
| } |
| immune_gray_stack_.clear(); |
| } |
| |
| { |
| TimingLogger::ScopedTiming split2("VisitConcurrentRoots", GetTimings()); |
| Runtime::Current()->VisitConcurrentRoots(this, kVisitRootFlagAllRoots); |
| } |
| { |
| // TODO: don't visit the transaction roots if it's not active. |
| TimingLogger::ScopedTiming split5("VisitNonThreadRoots", GetTimings()); |
| Runtime::Current()->VisitNonThreadRoots(this); |
| } |
| |
| { |
| TimingLogger::ScopedTiming split7("Process mark stacks and References", GetTimings()); |
| |
| // Process the mark stack once in the thread local stack mode. This marks most of the live |
| // objects, aside from weak ref accesses with read barriers (Reference::GetReferent() and |
| // system weaks) that may happen concurrently while we are processing the mark stack and newly |
| // mark/gray objects and push refs on the mark stack. |
| ProcessMarkStack(); |
| |
| ReferenceProcessor* rp = GetHeap()->GetReferenceProcessor(); |
| bool clear_soft_references = GetCurrentIteration()->GetClearSoftReferences(); |
| rp->Setup(self, this, /*concurrent=*/ true, clear_soft_references); |
| if (!clear_soft_references) { |
| // Forward as many SoftReferences as possible before inhibiting reference access. |
| rp->ForwardSoftReferences(GetTimings()); |
| } |
| |
| // We transition through three mark stack modes (thread-local, shared, GC-exclusive). The |
| // primary reasons are that we need to use a checkpoint to process thread-local mark |
| // stacks, but after we disable weak refs accesses, we can't use a checkpoint due to a deadlock |
| // issue because running threads potentially blocking at WaitHoldingLocks, and that once we |
| // reach the point where we process weak references, we can avoid using a lock when accessing |
| // the GC mark stack, which makes mark stack processing more efficient. |
| |
| // Switch to the shared mark stack mode. That is, revoke and process thread-local mark stacks |
| // for the last time before transitioning to the shared mark stack mode, which would process new |
| // refs that may have been concurrently pushed onto the mark stack during the ProcessMarkStack() |
| // call above. At the same time, disable weak ref accesses using a per-thread flag. It's |
| // important to do these together so that we can ensure that mutators won't |
| // newly gray objects and push new refs onto the mark stack due to weak ref accesses and |
| // mutators safely transition to the shared mark stack mode (without leaving unprocessed refs on |
| // the thread-local mark stacks), without a race. This is why we use a thread-local weak ref |
| // access flag Thread::tls32_.weak_ref_access_enabled_ instead of the global ones. |
| // We must use a stop-the-world pause to disable weak ref access. A checkpoint may lead to a |
| // deadlock if one mutator acquires a low-level mutex and then gets blocked while accessing |
| // a weak-ref (after participating in the checkpoint), and another mutator indefinitely waits |
| // for the mutex before it participates in the checkpoint. Consequently, the gc-thread blocks |
| // forever as the checkpoint never finishes (See runtime/mutator_gc_coord.md). |
| SwitchToSharedMarkStackMode(); |
| CHECK(!self->GetWeakRefAccessEnabled()); |
| |
| // Now that weak refs accesses are disabled, once we exhaust the shared mark stack again here |
| // (which may be non-empty if there were refs found on thread-local mark stacks during the above |
| // SwitchToSharedMarkStackMode() call), we won't have new refs to process, that is, mutators |
| // (via read barriers) have no way to produce any more refs to process. Marking converges once |
| // before we process weak refs below. |
| ProcessMarkStack(); |
| CheckEmptyMarkStack(); |
| |
| // Switch to the GC exclusive mark stack mode so that we can process the mark stack without a |
| // lock from this point on. |
| SwitchToGcExclusiveMarkStackMode(); |
| CheckEmptyMarkStack(); |
| if (kVerboseMode) { |
| LOG(INFO) << "ProcessReferences"; |
| } |
| // Process weak references. This also marks through finalizers. Although |
| // reference processing is "disabled", some accesses will proceed once we've ensured that |
| // objects directly reachable by the mutator are marked, i.e. before we mark through |
| // finalizers. |
| ProcessReferences(self); |
| CheckEmptyMarkStack(); |
| // JNI WeakGlobalRefs and most other system weaks cannot be processed until we're done marking |
| // through finalizers, since such references to finalizer-reachable objects must be preserved. |
| if (kVerboseMode) { |
| LOG(INFO) << "SweepSystemWeaks"; |
| } |
| SweepSystemWeaks(self); |
| CheckEmptyMarkStack(); |
| ReenableWeakRefAccess(self); |
| if (kVerboseMode) { |
| LOG(INFO) << "SweepSystemWeaks done"; |
| } |
| // Marking is done. Disable marking. |
| DisableMarking(); |
| CheckEmptyMarkStack(); |
| } |
| |
| if (kIsDebugBuild) { |
| MutexLock mu(self, *Locks::thread_list_lock_); |
| CHECK(weak_ref_access_enabled_); |
| } |
| if (kVerboseMode) { |
| LOG(INFO) << "GC end of CopyingPhase"; |
| } |
| } |
| |
| void ConcurrentCopying::ReenableWeakRefAccess(Thread* self) { |
| if (kVerboseMode) { |
| LOG(INFO) << "ReenableWeakRefAccess"; |
| } |
| // Iterate all threads (don't need to or can't use a checkpoint) and re-enable weak ref access. |
| { |
| MutexLock mu(self, *Locks::thread_list_lock_); |
| weak_ref_access_enabled_ = true; // This is for new threads. |
| std::list<Thread*> thread_list = Runtime::Current()->GetThreadList()->GetList(); |
| for (Thread* thread : thread_list) { |
| thread->SetWeakRefAccessEnabled(true); |
| } |
| } |
| // Unblock blocking threads. |
| GetHeap()->GetReferenceProcessor()->BroadcastForSlowPath(self); |
| Runtime::Current()->BroadcastForNewSystemWeaks(); |
| } |
| |
| class ConcurrentCopying::DisableMarkingCheckpoint : public Closure { |
| public: |
| explicit DisableMarkingCheckpoint(ConcurrentCopying* concurrent_copying) |
| : concurrent_copying_(concurrent_copying) { |
| } |
| |
| void Run(Thread* thread) override NO_THREAD_SAFETY_ANALYSIS { |
| // Note: self is not necessarily equal to thread since thread may be suspended. |
| Thread* self = Thread::Current(); |
| DCHECK(thread == self || |
| thread->IsSuspended() || |
| thread->GetState() == ThreadState::kWaitingPerformingGc) |
| << thread->GetState() << " thread " << thread << " self " << self; |
| // We sweep interpreter caches here so that it can be done after all |
| // reachable objects are marked and the mutators can sweep their caches |
| // without synchronization. |
| thread->SweepInterpreterCache(concurrent_copying_); |
| // Disable the thread-local is_gc_marking flag. |
| // Note a thread that has just started right before this checkpoint may have already this flag |
| // set to false, which is ok. |
| thread->SetIsGcMarkingAndUpdateEntrypoints(false); |
| // If thread is a running mutator, then act on behalf of the garbage collector. |
| // See the code in ThreadList::RunCheckpoint. |
| concurrent_copying_->GetBarrier().Pass(self); |
| } |
| |
| private: |
| ConcurrentCopying* const concurrent_copying_; |
| }; |
| |
| class ConcurrentCopying::DisableMarkingCallback : public Closure { |
| public: |
| explicit DisableMarkingCallback(ConcurrentCopying* concurrent_copying) |
| : concurrent_copying_(concurrent_copying) { |
| } |
| |
| void Run(Thread* self ATTRIBUTE_UNUSED) override REQUIRES(Locks::thread_list_lock_) { |
| // This needs to run under the thread_list_lock_ critical section in ThreadList::RunCheckpoint() |
| // to avoid a race with ThreadList::Register(). |
| CHECK(concurrent_copying_->is_marking_); |
| concurrent_copying_->is_marking_ = false; |
| if (kUseBakerReadBarrier && kGrayDirtyImmuneObjects) { |
| CHECK(concurrent_copying_->is_using_read_barrier_entrypoints_); |
| concurrent_copying_->is_using_read_barrier_entrypoints_ = false; |
| } else { |
| CHECK(!concurrent_copying_->is_using_read_barrier_entrypoints_); |
| } |
| } |
| |
| private: |
| ConcurrentCopying* const concurrent_copying_; |
| }; |
| |
| void ConcurrentCopying::IssueDisableMarkingCheckpoint() { |
| Thread* self = Thread::Current(); |
| DisableMarkingCheckpoint check_point(this); |
| ThreadList* thread_list = Runtime::Current()->GetThreadList(); |
| gc_barrier_->Init(self, 0); |
| DisableMarkingCallback dmc(this); |
| size_t barrier_count = thread_list->RunCheckpoint(&check_point, &dmc); |
| // If there are no threads to wait which implies that all the checkpoint functions are finished, |
| // then no need to release the mutator lock. |
| if (barrier_count == 0) { |
| return; |
| } |
| // Release locks then wait for all mutator threads to pass the barrier. |
| Locks::mutator_lock_->SharedUnlock(self); |
| { |
| ScopedThreadStateChange tsc(self, ThreadState::kWaitingForCheckPointsToRun); |
| gc_barrier_->Increment(self, barrier_count); |
| } |
| Locks::mutator_lock_->SharedLock(self); |
| } |
| |
| void ConcurrentCopying::DisableMarking() { |
| // Use a checkpoint to turn off the global is_marking and the thread-local is_gc_marking flags and |
| // to ensure no threads are still in the middle of a read barrier which may have a from-space ref |
| // cached in a local variable. |
| IssueDisableMarkingCheckpoint(); |
| if (kUseTableLookupReadBarrier) { |
| heap_->rb_table_->ClearAll(); |
| DCHECK(heap_->rb_table_->IsAllCleared()); |
| } |
| is_mark_stack_push_disallowed_.store(1, std::memory_order_seq_cst); |
| mark_stack_mode_.store(kMarkStackModeOff, std::memory_order_seq_cst); |
| } |
| |
| void ConcurrentCopying::IssueEmptyCheckpoint() { |
| Thread* self = Thread::Current(); |
| ThreadList* thread_list = Runtime::Current()->GetThreadList(); |
| // Release locks then wait for all mutator threads to pass the barrier. |
| Locks::mutator_lock_->SharedUnlock(self); |
| thread_list->RunEmptyCheckpoint(); |
| Locks::mutator_lock_->SharedLock(self); |
| } |
| |
| void ConcurrentCopying::ExpandGcMarkStack() { |
| DCHECK(gc_mark_stack_->IsFull()); |
| const size_t new_size = gc_mark_stack_->Capacity() * 2; |
| std::vector<StackReference<mirror::Object>> temp(gc_mark_stack_->Begin(), |
| gc_mark_stack_->End()); |
| gc_mark_stack_->Resize(new_size); |
| for (auto& ref : temp) { |
| gc_mark_stack_->PushBack(ref.AsMirrorPtr()); |
| } |
| DCHECK(!gc_mark_stack_->IsFull()); |
| } |
| |
| void ConcurrentCopying::PushOntoMarkStack(Thread* const self, mirror::Object* to_ref) { |
| CHECK_EQ(is_mark_stack_push_disallowed_.load(std::memory_order_relaxed), 0) |
| << " " << to_ref << " " << mirror::Object::PrettyTypeOf(to_ref); |
| CHECK(thread_running_gc_ != nullptr); |
| MarkStackMode mark_stack_mode = mark_stack_mode_.load(std::memory_order_relaxed); |
| if (LIKELY(mark_stack_mode == kMarkStackModeThreadLocal)) { |
| if (LIKELY(self == thread_running_gc_)) { |
| // If GC-running thread, use the GC mark stack instead of a thread-local mark stack. |
| CHECK(self->GetThreadLocalMarkStack() == nullptr); |
| if (UNLIKELY(gc_mark_stack_->IsFull())) { |
| ExpandGcMarkStack(); |
| } |
| gc_mark_stack_->PushBack(to_ref); |
| } else { |
| // Otherwise, use a thread-local mark stack. |
| accounting::AtomicStack<mirror::Object>* tl_mark_stack = self->GetThreadLocalMarkStack(); |
| if (UNLIKELY(tl_mark_stack == nullptr || tl_mark_stack->IsFull())) { |
| MutexLock mu(self, mark_stack_lock_); |
| // Get a new thread local mark stack. |
| accounting::AtomicStack<mirror::Object>* new_tl_mark_stack; |
| if (!pooled_mark_stacks_.empty()) { |
| // Use a pooled mark stack. |
| new_tl_mark_stack = pooled_mark_stacks_.back(); |
| pooled_mark_stacks_.pop_back(); |
| } else { |
| // None pooled. Create a new one. |
| new_tl_mark_stack = |
| accounting::AtomicStack<mirror::Object>::Create( |
| "thread local mark stack", 4 * KB, 4 * KB); |
| } |
| DCHECK(new_tl_mark_stack != nullptr); |
| DCHECK(new_tl_mark_stack->IsEmpty()); |
| new_tl_mark_stack->PushBack(to_ref); |
| self->SetThreadLocalMarkStack(new_tl_mark_stack); |
| if (tl_mark_stack != nullptr) { |
| // Store the old full stack into a vector. |
| revoked_mark_stacks_.push_back(tl_mark_stack); |
| } |
| } else { |
| tl_mark_stack->PushBack(to_ref); |
| } |
| } |
| } else if (mark_stack_mode == kMarkStackModeShared) { |
| // Access the shared GC mark stack with a lock. |
| MutexLock mu(self, mark_stack_lock_); |
| if (UNLIKELY(gc_mark_stack_->IsFull())) { |
| ExpandGcMarkStack(); |
| } |
| gc_mark_stack_->PushBack(to_ref); |
| } else { |
| CHECK_EQ(static_cast<uint32_t>(mark_stack_mode), |
| static_cast<uint32_t>(kMarkStackModeGcExclusive)) |
| << "ref=" << to_ref |
| << " self->gc_marking=" << self->GetIsGcMarking() |
| << " cc->is_marking=" << is_marking_; |
| CHECK(self == thread_running_gc_) |
| << "Only GC-running thread should access the mark stack " |
| << "in the GC exclusive mark stack mode. " |
| << "ref=" << to_ref |
| << " self->gc_marking=" << self->GetIsGcMarking() |
| << " cc->is_marking=" << is_marking_; |
| // Access the GC mark stack without a lock. |
| if (UNLIKELY(gc_mark_stack_->IsFull())) { |
| ExpandGcMarkStack(); |
| } |
| gc_mark_stack_->PushBack(to_ref); |
| } |
| } |
| |
| accounting::ObjectStack* ConcurrentCopying::GetAllocationStack() { |
| return heap_->allocation_stack_.get(); |
| } |
| |
| accounting::ObjectStack* ConcurrentCopying::GetLiveStack() { |
| return heap_->live_stack_.get(); |
| } |
| |
| // The following visitors are used to verify that there's no references to the from-space left after |
| // marking. |
| class ConcurrentCopying::VerifyNoFromSpaceRefsVisitor : public SingleRootVisitor { |
| public: |
| explicit VerifyNoFromSpaceRefsVisitor(ConcurrentCopying* collector) |
| : collector_(collector) {} |
| |
| void operator()(mirror::Object* ref, |
| MemberOffset offset = MemberOffset(0), |
| mirror::Object* holder = nullptr) const |
| REQUIRES_SHARED(Locks::mutator_lock_) ALWAYS_INLINE { |
| if (ref == nullptr) { |
| // OK. |
| return; |
| } |
| collector_->AssertToSpaceInvariant(holder, offset, ref); |
| if (kUseBakerReadBarrier) { |
| CHECK_EQ(ref->GetReadBarrierState(), ReadBarrier::NonGrayState()) |
| << "Ref " << ref << " " << ref->PrettyTypeOf() << " has gray rb_state"; |
| } |
| } |
| |
| void VisitRoot(mirror::Object* root, const RootInfo& info ATTRIBUTE_UNUSED) |
| override REQUIRES_SHARED(Locks::mutator_lock_) { |
| DCHECK(root != nullptr); |
| operator()(root); |
| } |
| |
| private: |
| ConcurrentCopying* const collector_; |
| }; |
| |
| class ConcurrentCopying::VerifyNoFromSpaceRefsFieldVisitor { |
| public: |
| explicit VerifyNoFromSpaceRefsFieldVisitor(ConcurrentCopying* collector) |
| : collector_(collector) {} |
| |
| void operator()(ObjPtr<mirror::Object> obj, |
| MemberOffset offset, |
| bool is_static ATTRIBUTE_UNUSED) const |
| REQUIRES_SHARED(Locks::mutator_lock_) ALWAYS_INLINE { |
| mirror::Object* ref = |
| obj->GetFieldObject<mirror::Object, kDefaultVerifyFlags, kWithoutReadBarrier>(offset); |
| VerifyNoFromSpaceRefsVisitor visitor(collector_); |
| visitor(ref, offset, obj.Ptr()); |
| } |
| void operator()(ObjPtr<mirror::Class> klass, |
| ObjPtr<mirror::Reference> ref) const |
| REQUIRES_SHARED(Locks::mutator_lock_) ALWAYS_INLINE { |
| CHECK(klass->IsTypeOfReferenceClass()); |
| this->operator()(ref, mirror::Reference::ReferentOffset(), false); |
| } |
| |
| void VisitRootIfNonNull(mirror::CompressedReference<mirror::Object>* root) const |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (!root->IsNull()) { |
| VisitRoot(root); |
| } |
| } |
| |
| void VisitRoot(mirror::CompressedReference<mirror::Object>* root) const |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| VerifyNoFromSpaceRefsVisitor visitor(collector_); |
| visitor(root->AsMirrorPtr()); |
| } |
| |
| private: |
| ConcurrentCopying* const collector_; |
| }; |
| |
| // Verify there's no from-space references left after the marking phase. |
| void ConcurrentCopying::VerifyNoFromSpaceReferences() { |
| Thread* self = Thread::Current(); |
| DCHECK(Locks::mutator_lock_->IsExclusiveHeld(self)); |
| // Verify all threads have is_gc_marking to be false |
| { |
| MutexLock mu(self, *Locks::thread_list_lock_); |
| std::list<Thread*> thread_list = Runtime::Current()->GetThreadList()->GetList(); |
| for (Thread* thread : thread_list) { |
| CHECK(!thread->GetIsGcMarking()); |
| } |
| } |
| |
| auto verify_no_from_space_refs_visitor = [&](mirror::Object* obj) |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| CHECK(obj != nullptr); |
| space::RegionSpace* region_space = RegionSpace(); |
| CHECK(!region_space->IsInFromSpace(obj)) << "Scanning object " << obj << " in from space"; |
| VerifyNoFromSpaceRefsFieldVisitor visitor(this); |
| obj->VisitReferences</*kVisitNativeRoots=*/true, kDefaultVerifyFlags, kWithoutReadBarrier>( |
| visitor, |
| visitor); |
| if (kUseBakerReadBarrier) { |
| CHECK_EQ(obj->GetReadBarrierState(), ReadBarrier::NonGrayState()) |
| << "obj=" << obj << " has gray rb_state " << obj->GetReadBarrierState(); |
| } |
| }; |
| // Roots. |
| { |
| ReaderMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| VerifyNoFromSpaceRefsVisitor ref_visitor(this); |
| Runtime::Current()->VisitRoots(&ref_visitor); |
| } |
| // The to-space. |
| region_space_->WalkToSpace(verify_no_from_space_refs_visitor); |
| // Non-moving spaces. |
| { |
| WriterMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| heap_->GetMarkBitmap()->Visit(verify_no_from_space_refs_visitor); |
| } |
| // The alloc stack. |
| { |
| VerifyNoFromSpaceRefsVisitor ref_visitor(this); |
| for (auto* it = heap_->allocation_stack_->Begin(), *end = heap_->allocation_stack_->End(); |
| it < end; ++it) { |
| mirror::Object* const obj = it->AsMirrorPtr(); |
| if (obj != nullptr && obj->GetClass() != nullptr) { |
| // TODO: need to call this only if obj is alive? |
| ref_visitor(obj); |
| verify_no_from_space_refs_visitor(obj); |
| } |
| } |
| } |
| // TODO: LOS. But only refs in LOS are classes. |
| } |
| |
| // The following visitors are used to assert the to-space invariant. |
| class ConcurrentCopying::AssertToSpaceInvariantFieldVisitor { |
| public: |
| explicit AssertToSpaceInvariantFieldVisitor(ConcurrentCopying* collector) |
| : collector_(collector) {} |
| |
| void operator()(ObjPtr<mirror::Object> obj, |
| MemberOffset offset, |
| bool is_static ATTRIBUTE_UNUSED) const |
| REQUIRES_SHARED(Locks::mutator_lock_) ALWAYS_INLINE { |
| mirror::Object* ref = |
| obj->GetFieldObject<mirror::Object, kDefaultVerifyFlags, kWithoutReadBarrier>(offset); |
| collector_->AssertToSpaceInvariant(obj.Ptr(), offset, ref); |
| } |
| void operator()(ObjPtr<mirror::Class> klass, ObjPtr<mirror::Reference> ref ATTRIBUTE_UNUSED) const |
| REQUIRES_SHARED(Locks::mutator_lock_) ALWAYS_INLINE { |
| CHECK(klass->IsTypeOfReferenceClass()); |
| } |
| |
| void VisitRootIfNonNull(mirror::CompressedReference<mirror::Object>* root) const |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (!root->IsNull()) { |
| VisitRoot(root); |
| } |
| } |
| |
| void VisitRoot(mirror::CompressedReference<mirror::Object>* root) const |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| mirror::Object* ref = root->AsMirrorPtr(); |
| collector_->AssertToSpaceInvariant(/* obj */ nullptr, MemberOffset(0), ref); |
| } |
| |
| private: |
| ConcurrentCopying* const collector_; |
| }; |
| |
| void ConcurrentCopying::RevokeThreadLocalMarkStacks(bool disable_weak_ref_access, |
| Closure* checkpoint_callback) { |
| Thread* self = Thread::Current(); |
| Locks::mutator_lock_->AssertSharedHeld(self); |
| ThreadList* thread_list = Runtime::Current()->GetThreadList(); |
| RevokeThreadLocalMarkStackCheckpoint check_point(this, disable_weak_ref_access); |
| if (disable_weak_ref_access) { |
| // We're the only thread that could possibly ask for exclusive access here. |
| Locks::mutator_lock_->SharedUnlock(self); |
| { |
| ScopedPause pause(this); |
| MutexLock mu(self, *Locks::thread_list_lock_); |
| checkpoint_callback->Run(self); |
| for (Thread* thread : thread_list->GetList()) { |
| check_point.Run(thread); |
| } |
| } |
| Locks::mutator_lock_->SharedLock(self); |
| } else { |
| gc_barrier_->Init(self, 0); |
| size_t barrier_count = thread_list->RunCheckpoint(&check_point, checkpoint_callback); |
| // If there are no threads to wait which implys that all the checkpoint functions are finished, |
| // then no need to release the mutator lock. |
| if (barrier_count == 0) { |
| return; |
| } |
| Locks::mutator_lock_->SharedUnlock(self); |
| { |
| ScopedThreadStateChange tsc(self, ThreadState::kWaitingForCheckPointsToRun); |
| gc_barrier_->Increment(self, barrier_count); |
| } |
| Locks::mutator_lock_->SharedLock(self); |
| } |
| } |
| |
| void ConcurrentCopying::RevokeThreadLocalMarkStack(Thread* thread) { |
| Thread* self = Thread::Current(); |
| CHECK_EQ(self, thread); |
| MutexLock mu(self, mark_stack_lock_); |
| accounting::AtomicStack<mirror::Object>* tl_mark_stack = thread->GetThreadLocalMarkStack(); |
| if (tl_mark_stack != nullptr) { |
| CHECK(is_marking_); |
| revoked_mark_stacks_.push_back(tl_mark_stack); |
| thread->SetThreadLocalMarkStack(nullptr); |
| } |
| } |
| |
| void ConcurrentCopying::ProcessMarkStack() { |
| if (kVerboseMode) { |
| LOG(INFO) << "ProcessMarkStack. "; |
| } |
| bool empty_prev = false; |
| while (true) { |
| bool empty = ProcessMarkStackOnce(); |
| if (empty_prev && empty) { |
| // Saw empty mark stack for a second time, done. |
| break; |
| } |
| empty_prev = empty; |
| } |
| } |
| |
| bool ConcurrentCopying::ProcessMarkStackOnce() { |
| DCHECK(thread_running_gc_ != nullptr); |
| Thread* const self = Thread::Current(); |
| DCHECK(self == thread_running_gc_); |
| DCHECK(thread_running_gc_->GetThreadLocalMarkStack() == nullptr); |
| size_t count = 0; |
| MarkStackMode mark_stack_mode = mark_stack_mode_.load(std::memory_order_relaxed); |
| if (mark_stack_mode == kMarkStackModeThreadLocal) { |
| // Process the thread-local mark stacks and the GC mark stack. |
| count += ProcessThreadLocalMarkStacks(/* disable_weak_ref_access= */ false, |
| /* checkpoint_callback= */ nullptr, |
| [this] (mirror::Object* ref) |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| ProcessMarkStackRef(ref); |
| }); |
| while (!gc_mark_stack_->IsEmpty()) { |
| mirror::Object* to_ref = gc_mark_stack_->PopBack(); |
| ProcessMarkStackRef(to_ref); |
| ++count; |
| } |
| gc_mark_stack_->Reset(); |
| } else if (mark_stack_mode == kMarkStackModeShared) { |
| // Do an empty checkpoint to avoid a race with a mutator preempted in the middle of a read |
| // barrier but before pushing onto the mark stack. b/32508093. Note the weak ref access is |
| // disabled at this point. |
| IssueEmptyCheckpoint(); |
| // Process the shared GC mark stack with a lock. |
| { |
| MutexLock mu(thread_running_gc_, mark_stack_lock_); |
| CHECK(revoked_mark_stacks_.empty()); |
| CHECK_EQ(pooled_mark_stacks_.size(), kMarkStackPoolSize); |
| } |
| while (true) { |
| std::vector<mirror::Object*> refs; |
| { |
| // Copy refs with lock. Note the number of refs should be small. |
| MutexLock mu(thread_running_gc_, mark_stack_lock_); |
| if (gc_mark_stack_->IsEmpty()) { |
| break; |
| } |
| for (StackReference<mirror::Object>* p = gc_mark_stack_->Begin(); |
| p != gc_mark_stack_->End(); ++p) { |
| refs.push_back(p->AsMirrorPtr()); |
| } |
| gc_mark_stack_->Reset(); |
| } |
| for (mirror::Object* ref : refs) { |
| ProcessMarkStackRef(ref); |
| ++count; |
| } |
| } |
| } else { |
| CHECK_EQ(static_cast<uint32_t>(mark_stack_mode), |
| static_cast<uint32_t>(kMarkStackModeGcExclusive)); |
| { |
| MutexLock mu(thread_running_gc_, mark_stack_lock_); |
| CHECK(revoked_mark_stacks_.empty()); |
| CHECK_EQ(pooled_mark_stacks_.size(), kMarkStackPoolSize); |
| } |
| // Process the GC mark stack in the exclusive mode. No need to take the lock. |
| while (!gc_mark_stack_->IsEmpty()) { |
| mirror::Object* to_ref = gc_mark_stack_->PopBack(); |
| ProcessMarkStackRef(to_ref); |
| ++count; |
| } |
| gc_mark_stack_->Reset(); |
| } |
| |
| // Return true if the stack was empty. |
| return count == 0; |
| } |
| |
| template <typename Processor> |
| size_t ConcurrentCopying::ProcessThreadLocalMarkStacks(bool disable_weak_ref_access, |
| Closure* checkpoint_callback, |
| const Processor& processor) { |
| // Run a checkpoint to collect all thread local mark stacks and iterate over them all. |
| RevokeThreadLocalMarkStacks(disable_weak_ref_access, checkpoint_callback); |
| if (disable_weak_ref_access) { |
| CHECK_EQ(static_cast<uint32_t>(mark_stack_mode_.load(std::memory_order_relaxed)), |
| static_cast<uint32_t>(kMarkStackModeShared)); |
| } |
| size_t count = 0; |
| std::vector<accounting::AtomicStack<mirror::Object>*> mark_stacks; |
| { |
| MutexLock mu(thread_running_gc_, mark_stack_lock_); |
| // Make a copy of the mark stack vector. |
| mark_stacks = revoked_mark_stacks_; |
| revoked_mark_stacks_.clear(); |
| } |
| for (accounting::AtomicStack<mirror::Object>* mark_stack : mark_stacks) { |
| for (StackReference<mirror::Object>* p = mark_stack->Begin(); p != mark_stack->End(); ++p) { |
| mirror::Object* to_ref = p->AsMirrorPtr(); |
| processor(to_ref); |
| ++count; |
| } |
| { |
| MutexLock mu(thread_running_gc_, mark_stack_lock_); |
| if (pooled_mark_stacks_.size() >= kMarkStackPoolSize) { |
| // The pool has enough. Delete it. |
| delete mark_stack; |
| } else { |
| // Otherwise, put it into the pool for later reuse. |
| mark_stack->Reset(); |
| pooled_mark_stacks_.push_back(mark_stack); |
| } |
| } |
| } |
| if (disable_weak_ref_access) { |
| MutexLock mu(thread_running_gc_, mark_stack_lock_); |
| CHECK(revoked_mark_stacks_.empty()); |
| CHECK_EQ(pooled_mark_stacks_.size(), kMarkStackPoolSize); |
| } |
| return count; |
| } |
| |
| inline void ConcurrentCopying::ProcessMarkStackRef(mirror::Object* to_ref) { |
| DCHECK(!region_space_->IsInFromSpace(to_ref)); |
| size_t obj_size = 0; |
| space::RegionSpace::RegionType rtype = region_space_->GetRegionType(to_ref); |
| if (kUseBakerReadBarrier) { |
| DCHECK(to_ref->GetReadBarrierState() == ReadBarrier::GrayState()) |
| << " to_ref=" << to_ref |
| << " rb_state=" << to_ref->GetReadBarrierState() |
| << " is_marked=" << IsMarked(to_ref) |
| << " type=" << to_ref->PrettyTypeOf() |
| << " young_gen=" << std::boolalpha << young_gen_ << std::noboolalpha |
| << " space=" << heap_->DumpSpaceNameFromAddress(to_ref) |
| << " region_type=" << rtype; |
| } |
| bool add_to_live_bytes = false; |
| // Invariant: There should be no object from a newly-allocated |
| // region (either large or non-large) on the mark stack. |
| DCHECK(!region_space_->IsInNewlyAllocatedRegion(to_ref)) << to_ref; |
| bool perform_scan = false; |
| switch (rtype) { |
| case space::RegionSpace::RegionType::kRegionTypeUnevacFromSpace: |
| // Mark the bitmap only in the GC thread here so that we don't need a CAS. |
| if (!kUseBakerReadBarrier || !region_space_bitmap_->Set(to_ref)) { |
| // It may be already marked if we accidentally pushed the same object twice due to the racy |
| // bitmap read in MarkUnevacFromSpaceRegion. |
| if (use_generational_cc_ && young_gen_) { |
| CHECK(region_space_->IsLargeObject(to_ref)); |
| region_space_->ZeroLiveBytesForLargeObject(to_ref); |
| } |
| perform_scan = true; |
| // Only add to the live bytes if the object was not already marked and we are not the young |
| // GC. |
| // Why add live bytes even after 2-phase GC? |
| // We need to ensure that if there is a unevac region with any live |
| // objects, then its live_bytes must be non-zero. Otherwise, |
| // ClearFromSpace() will clear the region. Considering, that we may skip |
| // live objects during marking phase of 2-phase GC, we have to take care |
| // of such objects here. |
| add_to_live_bytes = true; |
| } |
| break; |
| case space::RegionSpace::RegionType::kRegionTypeToSpace: |
| if (use_generational_cc_) { |
| // Copied to to-space, set the bit so that the next GC can scan objects. |
| region_space_bitmap_->Set(to_ref); |
| } |
| perform_scan = true; |
| break; |
| default: |
| DCHECK(!region_space_->HasAddress(to_ref)) << to_ref; |
| DCHECK(!immune_spaces_.ContainsObject(to_ref)); |
| // Non-moving or large-object space. |
| if (kUseBakerReadBarrier) { |
| accounting::ContinuousSpaceBitmap* mark_bitmap = |
| heap_->GetNonMovingSpace()->GetMarkBitmap(); |
| const bool is_los = !mark_bitmap->HasAddress(to_ref); |
| if (is_los) { |
| if (!IsAligned<kPageSize>(to_ref)) { |
| // Ref is a large object that is not aligned, it must be heap |
| // corruption. Remove memory protection and dump data before |
| // AtomicSetReadBarrierState since it will fault if the address is not |
| // valid. |
| region_space_->Unprotect(); |
| heap_->GetVerification()->LogHeapCorruption(/* obj */ nullptr, |
| MemberOffset(0), |
| to_ref, |
| /* fatal */ true); |
| } |
| DCHECK(heap_->GetLargeObjectsSpace()) |
| << "ref=" << to_ref |
| << " doesn't belong to non-moving space and large object space doesn't exist"; |
| accounting::LargeObjectBitmap* los_bitmap = |
| heap_->GetLargeObjectsSpace()->GetMarkBitmap(); |
| DCHECK(los_bitmap->HasAddress(to_ref)); |
| // Only the GC thread could be setting the LOS bit map hence doesn't |
| // need to be atomically done. |
| perform_scan = !los_bitmap->Set(to_ref); |
| } else { |
| // Only the GC thread could be setting the non-moving space bit map |
| // hence doesn't need to be atomically done. |
| perform_scan = !mark_bitmap->Set(to_ref); |
| } |
| } else { |
| perform_scan = true; |
| } |
| } |
| if (perform_scan) { |
| obj_size = to_ref->SizeOf<kDefaultVerifyFlags>(); |
| if (use_generational_cc_ && young_gen_) { |
| Scan<true>(to_ref, obj_size); |
| } else { |
| Scan<false>(to_ref, obj_size); |
| } |
| } |
| if (kUseBakerReadBarrier) { |
| DCHECK(to_ref->GetReadBarrierState() == ReadBarrier::GrayState()) |
| << " to_ref=" << to_ref |
| << " rb_state=" << to_ref->GetReadBarrierState() |
| << " is_marked=" << IsMarked(to_ref) |
| << " type=" << to_ref->PrettyTypeOf() |
| << " young_gen=" << std::boolalpha << young_gen_ << std::noboolalpha |
| << " space=" << heap_->DumpSpaceNameFromAddress(to_ref) |
| << " region_type=" << rtype |
| // TODO: Temporary; remove this when this is no longer needed (b/116087961). |
| << " runtime->sentinel=" << Runtime::Current()->GetSentinel().Read<kWithoutReadBarrier>(); |
| } |
| #ifdef USE_BAKER_READ_BARRIER |
| mirror::Object* referent = nullptr; |
| if (UNLIKELY((to_ref->GetClass<kVerifyNone, kWithoutReadBarrier>()->IsTypeOfReferenceClass() && |
| (referent = to_ref->AsReference()->GetReferent<kWithoutReadBarrier>()) != nullptr && |
| !IsInToSpace(referent)))) { |
| // Leave this reference gray in the queue so that GetReferent() will trigger a read barrier. We |
| // will change it to non-gray later in ReferenceQueue::DisableReadBarrierForReference. |
| DCHECK(to_ref->AsReference()->GetPendingNext() != nullptr) |
| << "Left unenqueued ref gray " << to_ref; |
| } else { |
| // We may occasionally leave a reference non-gray in the queue if its referent happens to be |
| // concurrently marked after the Scan() call above has enqueued the Reference, in which case the |
| // above IsInToSpace() evaluates to true and we change the color from gray to non-gray here in |
| // this else block. |
| if (kUseBakerReadBarrier) { |
| bool success = to_ref->AtomicSetReadBarrierState<std::memory_order_release>( |
| ReadBarrier::GrayState(), |
| ReadBarrier::NonGrayState()); |
| DCHECK(success) << "Must succeed as we won the race."; |
| } |
| } |
| #else |
| DCHECK(!kUseBakerReadBarrier); |
| #endif |
| |
| if (add_to_live_bytes) { |
| // Add to the live bytes per unevacuated from-space. Note this code is always run by the |
| // GC-running thread (no synchronization required). |
| DCHECK(region_space_bitmap_->Test(to_ref)); |
| if (obj_size == 0) { |
| obj_size = to_ref->SizeOf<kDefaultVerifyFlags>(); |
| } |
| region_space_->AddLiveBytes(to_ref, RoundUp(obj_size, space::RegionSpace::kAlignment)); |
| } |
| if (ReadBarrier::kEnableToSpaceInvariantChecks) { |
| CHECK(to_ref != nullptr); |
| space::RegionSpace* region_space = RegionSpace(); |
| CHECK(!region_space->IsInFromSpace(to_ref)) << "Scanning object " << to_ref << " in from space"; |
| AssertToSpaceInvariant(nullptr, MemberOffset(0), to_ref); |
| AssertToSpaceInvariantFieldVisitor visitor(this); |
| to_ref->VisitReferences</*kVisitNativeRoots=*/true, kDefaultVerifyFlags, kWithoutReadBarrier>( |
| visitor, |
| visitor); |
| } |
| } |
| |
| class ConcurrentCopying::DisableWeakRefAccessCallback : public Closure { |
| public: |
| explicit DisableWeakRefAccessCallback(ConcurrentCopying* concurrent_copying) |
| : concurrent_copying_(concurrent_copying) { |
| } |
| |
| void Run(Thread* self ATTRIBUTE_UNUSED) override REQUIRES(Locks::thread_list_lock_) { |
| // This needs to run under the thread_list_lock_ critical section in ThreadList::RunCheckpoint() |
| // to avoid a deadlock b/31500969. |
| CHECK(concurrent_copying_->weak_ref_access_enabled_); |
| concurrent_copying_->weak_ref_access_enabled_ = false; |
| } |
| |
| private: |
| ConcurrentCopying* const concurrent_copying_; |
| }; |
| |
| void ConcurrentCopying::SwitchToSharedMarkStackMode() { |
| Thread* self = Thread::Current(); |
| DCHECK(thread_running_gc_ != nullptr); |
| DCHECK(self == thread_running_gc_); |
| DCHECK(thread_running_gc_->GetThreadLocalMarkStack() == nullptr); |
| MarkStackMode before_mark_stack_mode = mark_stack_mode_.load(std::memory_order_relaxed); |
| CHECK_EQ(static_cast<uint32_t>(before_mark_stack_mode), |
| static_cast<uint32_t>(kMarkStackModeThreadLocal)); |
| mark_stack_mode_.store(kMarkStackModeShared, std::memory_order_relaxed); |
| DisableWeakRefAccessCallback dwrac(this); |
| // Process the thread local mark stacks one last time after switching to the shared mark stack |
| // mode and disable weak ref accesses. |
| ProcessThreadLocalMarkStacks(/* disable_weak_ref_access= */ true, |
| &dwrac, |
| [this] (mirror::Object* ref) |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| ProcessMarkStackRef(ref); |
| }); |
| if (kVerboseMode) { |
| LOG(INFO) << "Switched to shared mark stack mode and disabled weak ref access"; |
| } |
| } |
| |
| void ConcurrentCopying::SwitchToGcExclusiveMarkStackMode() { |
| Thread* self = Thread::Current(); |
| DCHECK(thread_running_gc_ != nullptr); |
| DCHECK(self == thread_running_gc_); |
| DCHECK(thread_running_gc_->GetThreadLocalMarkStack() == nullptr); |
| MarkStackMode before_mark_stack_mode = mark_stack_mode_.load(std::memory_order_relaxed); |
| CHECK_EQ(static_cast<uint32_t>(before_mark_stack_mode), |
| static_cast<uint32_t>(kMarkStackModeShared)); |
| mark_stack_mode_.store(kMarkStackModeGcExclusive, std::memory_order_relaxed); |
| QuasiAtomic::ThreadFenceForConstructor(); |
| if (kVerboseMode) { |
| LOG(INFO) << "Switched to GC exclusive mark stack mode"; |
| } |
| } |
| |
| void ConcurrentCopying::CheckEmptyMarkStack() { |
| Thread* self = Thread::Current(); |
| DCHECK(thread_running_gc_ != nullptr); |
| DCHECK(self == thread_running_gc_); |
| DCHECK(thread_running_gc_->GetThreadLocalMarkStack() == nullptr); |
| MarkStackMode mark_stack_mode = mark_stack_mode_.load(std::memory_order_relaxed); |
| if (mark_stack_mode == kMarkStackModeThreadLocal) { |
| // Thread-local mark stack mode. |
| RevokeThreadLocalMarkStacks(false, nullptr); |
| MutexLock mu(thread_running_gc_, mark_stack_lock_); |
| if (!revoked_mark_stacks_.empty()) { |
| for (accounting::AtomicStack<mirror::Object>* mark_stack : revoked_mark_stacks_) { |
| while (!mark_stack->IsEmpty()) { |
| mirror::Object* obj = mark_stack->PopBack(); |
| if (kUseBakerReadBarrier) { |
| uint32_t rb_state = obj->GetReadBarrierState(); |
| LOG(INFO) << "On mark queue : " << obj << " " << obj->PrettyTypeOf() << " rb_state=" |
| << rb_state << " is_marked=" << IsMarked(obj); |
| } else { |
| LOG(INFO) << "On mark queue : " << obj << " " << obj->PrettyTypeOf() |
| << " is_marked=" << IsMarked(obj); |
| } |
| } |
| } |
| LOG(FATAL) << "mark stack is not empty"; |
| } |
| } else { |
| // Shared, GC-exclusive, or off. |
| MutexLock mu(thread_running_gc_, mark_stack_lock_); |
| CHECK(gc_mark_stack_->IsEmpty()); |
| CHECK(revoked_mark_stacks_.empty()); |
| CHECK_EQ(pooled_mark_stacks_.size(), kMarkStackPoolSize); |
| } |
| } |
| |
| void ConcurrentCopying::SweepSystemWeaks(Thread* self) { |
| TimingLogger::ScopedTiming split("SweepSystemWeaks", GetTimings()); |
| ReaderMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| Runtime::Current()->SweepSystemWeaks(this); |
| } |
| |
| void ConcurrentCopying::Sweep(bool swap_bitmaps) { |
| if (use_generational_cc_ && young_gen_) { |
| // Only sweep objects on the live stack. |
| SweepArray(heap_->GetLiveStack(), /* swap_bitmaps= */ false); |
| } else { |
| { |
| TimingLogger::ScopedTiming t("MarkStackAsLive", GetTimings()); |
| accounting::ObjectStack* live_stack = heap_->GetLiveStack(); |
| if (kEnableFromSpaceAccountingCheck) { |
| // Ensure that nobody inserted items in the live stack after we swapped the stacks. |
| CHECK_GE(live_stack_freeze_size_, live_stack->Size()); |
| } |
| heap_->MarkAllocStackAsLive(live_stack); |
| live_stack->Reset(); |
| } |
| CheckEmptyMarkStack(); |
| TimingLogger::ScopedTiming split("Sweep", GetTimings()); |
| for (const auto& space : GetHeap()->GetContinuousSpaces()) { |
| if (space->IsContinuousMemMapAllocSpace() && space != region_space_ |
| && !immune_spaces_.ContainsSpace(space)) { |
| space::ContinuousMemMapAllocSpace* alloc_space = space->AsContinuousMemMapAllocSpace(); |
| TimingLogger::ScopedTiming split2( |
| alloc_space->IsZygoteSpace() ? "SweepZygoteSpace" : "SweepAllocSpace", GetTimings()); |
| RecordFree(alloc_space->Sweep(swap_bitmaps)); |
| } |
| } |
| SweepLargeObjects(swap_bitmaps); |
| } |
| } |
| |
| // Copied and adapted from MarkSweep::SweepArray. |
| void ConcurrentCopying::SweepArray(accounting::ObjectStack* allocations, bool swap_bitmaps) { |
| // This method is only used when Generational CC collection is enabled. |
| DCHECK(use_generational_cc_); |
| CheckEmptyMarkStack(); |
| TimingLogger::ScopedTiming t("SweepArray", GetTimings()); |
| Thread* self = Thread::Current(); |
| mirror::Object** chunk_free_buffer = reinterpret_cast<mirror::Object**>( |
| sweep_array_free_buffer_mem_map_.BaseBegin()); |
| size_t chunk_free_pos = 0; |
| ObjectBytePair freed; |
| ObjectBytePair freed_los; |
| // How many objects are left in the array, modified after each space is swept. |
| StackReference<mirror::Object>* objects = allocations->Begin(); |
| size_t count = allocations->Size(); |
| // Start by sweeping the continuous spaces. |
| for (space::ContinuousSpace* space : heap_->GetContinuousSpaces()) { |
| if (!space->IsAllocSpace() || |
| space == region_space_ || |
| immune_spaces_.ContainsSpace(space) || |
| space->GetLiveBitmap() == nullptr) { |
| continue; |
| } |
| space::AllocSpace* alloc_space = space->AsAllocSpace(); |
| accounting::ContinuousSpaceBitmap* live_bitmap = space->GetLiveBitmap(); |
| accounting::ContinuousSpaceBitmap* mark_bitmap = space->GetMarkBitmap(); |
| if (swap_bitmaps) { |
| std::swap(live_bitmap, mark_bitmap); |
| } |
| StackReference<mirror::Object>* out = objects; |
| for (size_t i = 0; i < count; ++i) { |
| mirror::Object* const obj = objects[i].AsMirrorPtr(); |
| if (kUseThreadLocalAllocationStack && obj == nullptr) { |
| continue; |
| } |
| if (space->HasAddress(obj)) { |
| // This object is in the space, remove it from the array and add it to the sweep buffer |
| // if needed. |
| if (!mark_bitmap->Test(obj)) { |
| if (chunk_free_pos >= kSweepArrayChunkFreeSize) { |
| TimingLogger::ScopedTiming t2("FreeList", GetTimings()); |
| freed.objects += chunk_free_pos; |
| freed.bytes += alloc_space->FreeList(self, chunk_free_pos, chunk_free_buffer); |
| chunk_free_pos = 0; |
| } |
| chunk_free_buffer[chunk_free_pos++] = obj; |
| } |
| } else { |
| (out++)->Assign(obj); |
| } |
| } |
| if (chunk_free_pos > 0) { |
| TimingLogger::ScopedTiming t2("FreeList", GetTimings()); |
| freed.objects += chunk_free_pos; |
| freed.bytes += alloc_space->FreeList(self, chunk_free_pos, chunk_free_buffer); |
| chunk_free_pos = 0; |
| } |
| // All of the references which space contained are no longer in the allocation stack, update |
| // the count. |
| count = out - objects; |
| } |
| // Handle the large object space. |
| space::LargeObjectSpace* large_object_space = GetHeap()->GetLargeObjectsSpace(); |
| if (large_object_space != nullptr) { |
| accounting::LargeObjectBitmap* large_live_objects = large_object_space->GetLiveBitmap(); |
| accounting::LargeObjectBitmap* large_mark_objects = large_object_space->GetMarkBitmap(); |
| if (swap_bitmaps) { |
| std::swap(large_live_objects, large_mark_objects); |
| } |
| for (size_t i = 0; i < count; ++i) { |
| mirror::Object* const obj = objects[i].AsMirrorPtr(); |
| // Handle large objects. |
| if (kUseThreadLocalAllocationStack && obj == nullptr) { |
| continue; |
| } |
| if (!large_mark_objects->Test(obj)) { |
| ++freed_los.objects; |
| freed_los.bytes += large_object_space->Free(self, obj); |
| } |
| } |
| } |
| { |
| TimingLogger::ScopedTiming t2("RecordFree", GetTimings()); |
| RecordFree(freed); |
| RecordFreeLOS(freed_los); |
| t2.NewTiming("ResetStack"); |
| allocations->Reset(); |
| } |
| sweep_array_free_buffer_mem_map_.MadviseDontNeedAndZero(); |
| } |
| |
| void ConcurrentCopying::MarkZygoteLargeObjects() { |
| TimingLogger::ScopedTiming split(__FUNCTION__, GetTimings()); |
| Thread* const self = Thread::Current(); |
| WriterMutexLock rmu(self, *Locks::heap_bitmap_lock_); |
| space::LargeObjectSpace* const los = heap_->GetLargeObjectsSpace(); |
| if (los != nullptr) { |
| // Pick the current live bitmap (mark bitmap if swapped). |
| accounting::LargeObjectBitmap* const live_bitmap = los->GetLiveBitmap(); |
| accounting::LargeObjectBitmap* const mark_bitmap = los->GetMarkBitmap(); |
| // Walk through all of the objects and explicitly mark the zygote ones so they don't get swept. |
| std::pair<uint8_t*, uint8_t*> range = los->GetBeginEndAtomic(); |
| live_bitmap->VisitMarkedRange(reinterpret_cast<uintptr_t>(range.first), |
| reinterpret_cast<uintptr_t>(range.second), |
| [mark_bitmap, los, self](mirror::Object* obj) |
| REQUIRES(Locks::heap_bitmap_lock_) |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (los->IsZygoteLargeObject(self, obj)) { |
| mark_bitmap->Set(obj); |
| } |
| }); |
| } |
| } |
| |
| void ConcurrentCopying::SweepLargeObjects(bool swap_bitmaps) { |
| TimingLogger::ScopedTiming split("SweepLargeObjects", GetTimings()); |
| if (heap_->GetLargeObjectsSpace() != nullptr) { |
| RecordFreeLOS(heap_->GetLargeObjectsSpace()->Sweep(swap_bitmaps)); |
| } |
| } |
| |
| void ConcurrentCopying::CaptureRssAtPeak() { |
| using range_t = std::pair<void*, void*>; |
| // This operation is expensive as several calls to mincore() are performed. |
| // Also, this must be called before clearing regions in ReclaimPhase(). |
| // Therefore, we make it conditional on the flag that enables dumping GC |
| // performance info on shutdown. |
| if (Runtime::Current()->GetDumpGCPerformanceOnShutdown()) { |
| std::list<range_t> gc_ranges; |
| auto add_gc_range = [&gc_ranges](void* start, size_t size) { |
| void* end = static_cast<char*>(start) + RoundUp(size, kPageSize); |
| gc_ranges.emplace_back(range_t(start, end)); |
| }; |
| |
| // region space |
| DCHECK(IsAligned<kPageSize>(region_space_->Limit())); |
| gc_ranges.emplace_back(range_t(region_space_->Begin(), region_space_->Limit())); |
| // mark bitmap |
| add_gc_range(region_space_bitmap_->Begin(), region_space_bitmap_->Size()); |
| |
| // non-moving space |
| { |
| DCHECK(IsAligned<kPageSize>(heap_->non_moving_space_->Limit())); |
| gc_ranges.emplace_back(range_t(heap_->non_moving_space_->Begin(), |
| heap_->non_moving_space_->Limit())); |
| // mark bitmap |
| accounting::ContinuousSpaceBitmap *bitmap = heap_->non_moving_space_->GetMarkBitmap(); |
| add_gc_range(bitmap->Begin(), bitmap->Size()); |
| // live bitmap. Deal with bound bitmaps. |
| ReaderMutexLock mu(Thread::Current(), *Locks::heap_bitmap_lock_); |
| if (heap_->non_moving_space_->HasBoundBitmaps()) { |
| DCHECK_EQ(bitmap, heap_->non_moving_space_->GetLiveBitmap()); |
| bitmap = heap_->non_moving_space_->GetTempBitmap(); |
| } else { |
| bitmap = heap_->non_moving_space_->GetLiveBitmap(); |
| } |
| add_gc_range(bitmap->Begin(), bitmap->Size()); |
| } |
| // large-object space |
| if (heap_->GetLargeObjectsSpace()) { |
| heap_->GetLargeObjectsSpace()->ForEachMemMap([&add_gc_range](const MemMap& map) { |
| DCHECK(IsAligned<kPageSize>(map.BaseSize())); |
| add_gc_range(map.BaseBegin(), map.BaseSize()); |
| }); |
| // mark bitmap |
| accounting::LargeObjectBitmap* bitmap = heap_->GetLargeObjectsSpace()->GetMarkBitmap(); |
| add_gc_range(bitmap->Begin(), bitmap->Size()); |
| // live bitmap |
| bitmap = heap_->GetLargeObjectsSpace()->GetLiveBitmap(); |
| add_gc_range(bitmap->Begin(), bitmap->Size()); |
| } |
| // card table |
| add_gc_range(heap_->GetCardTable()->MemMapBegin(), heap_->GetCardTable()->MemMapSize()); |
| // inter-region refs |
| if (use_generational_cc_ && !young_gen_) { |
| // region space |
| add_gc_range(region_space_inter_region_bitmap_.Begin(), |
| region_space_inter_region_bitmap_.Size()); |
| // non-moving space |
| add_gc_range(non_moving_space_inter_region_bitmap_.Begin(), |
| non_moving_space_inter_region_bitmap_.Size()); |
| } |
| // Extract RSS using mincore(). Updates the cummulative RSS counter. |
| ExtractRssFromMincore(&gc_ranges); |
| } |
| } |
| |
| void ConcurrentCopying::ReclaimPhase() { |
| TimingLogger::ScopedTiming split("ReclaimPhase", GetTimings()); |
| if (kVerboseMode) { |
| LOG(INFO) << "GC ReclaimPhase"; |
| } |
| Thread* self = Thread::Current(); |
| |
| // Free data for class loaders that we unloaded. This includes removing |
| // dead methods from JIT's internal maps. This must be done before |
| // reclaiming the memory of the dead methods' declaring classes. |
| Runtime::Current()->GetClassLinker()->CleanupClassLoaders(); |
| |
| { |
| // Double-check that the mark stack is empty. |
| // Note: need to set this after VerifyNoFromSpaceRef(). |
| is_asserting_to_space_invariant_ = false; |
| QuasiAtomic::ThreadFenceForConstructor(); |
| if (kVerboseMode) { |
| LOG(INFO) << "Issue an empty check point. "; |
| } |
| IssueEmptyCheckpoint(); |
| // Disable the check. |
| is_mark_stack_push_disallowed_.store(0, std::memory_order_seq_cst); |
| if (kUseBakerReadBarrier) { |
| updated_all_immune_objects_.store(false, std::memory_order_seq_cst); |
| } |
| CheckEmptyMarkStack(); |
| } |
| |
| // Capture RSS at the time when memory usage is at its peak. All GC related |
| // memory ranges like java heap, card table, bitmap etc. are taken into |
| // account. |
| // TODO: We can fetch resident memory for region space directly by going |
| // through list of allocated regions. This way we can avoid calling mincore on |
| // the biggest memory range, thereby reducing the cost of this function. |
| CaptureRssAtPeak(); |
| |
| // Sweep the malloc spaces before clearing the from space since the memory tool mode might |
| // access the object classes in the from space for dead objects. |
| { |
| WriterMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| Sweep(/* swap_bitmaps= */ false); |
| SwapBitmaps(); |
| heap_->UnBindBitmaps(); |
| |
| // The bitmap was cleared at the start of the GC, there is nothing we need to do here. |
| DCHECK(region_space_bitmap_ != nullptr); |
| region_space_bitmap_ = nullptr; |
| } |
| |
| |
| { |
| // Record freed objects. |
| TimingLogger::ScopedTiming split2("RecordFree", GetTimings()); |
| // Don't include thread-locals that are in the to-space. |
| const uint64_t from_bytes = region_space_->GetBytesAllocatedInFromSpace(); |
| const uint64_t from_objects = region_space_->GetObjectsAllocatedInFromSpace(); |
| const uint64_t unevac_from_bytes = region_space_->GetBytesAllocatedInUnevacFromSpace(); |
| const uint64_t unevac_from_objects = region_space_->GetObjectsAllocatedInUnevacFromSpace(); |
| uint64_t to_bytes = bytes_moved_.load(std::memory_order_relaxed) + bytes_moved_gc_thread_; |
| cumulative_bytes_moved_ += to_bytes; |
| uint64_t to_objects = objects_moved_.load(std::memory_order_relaxed) + objects_moved_gc_thread_; |
| cumulative_objects_moved_ += to_objects; |
| if (kEnableFromSpaceAccountingCheck) { |
| CHECK_EQ(from_space_num_objects_at_first_pause_, from_objects + unevac_from_objects); |
| CHECK_EQ(from_space_num_bytes_at_first_pause_, from_bytes + unevac_from_bytes); |
| } |
| CHECK_LE(to_objects, from_objects); |
| // to_bytes <= from_bytes is only approximately true, because objects expand a little when |
| // copying to non-moving space in near-OOM situations. |
| if (from_bytes > 0) { |
| copied_live_bytes_ratio_sum_ += static_cast<float>(to_bytes) / from_bytes; |
| gc_count_++; |
| } |
| |
| // Cleared bytes and objects, populated by the call to RegionSpace::ClearFromSpace below. |
| uint64_t cleared_bytes; |
| uint64_t cleared_objects; |
| { |
| TimingLogger::ScopedTiming split4("ClearFromSpace", GetTimings()); |
| region_space_->ClearFromSpace(&cleared_bytes, &cleared_objects, /*clear_bitmap*/ !young_gen_); |
| // `cleared_bytes` and `cleared_objects` may be greater than the from space equivalents since |
| // RegionSpace::ClearFromSpace may clear empty unevac regions. |
| CHECK_GE(cleared_bytes, from_bytes); |
| CHECK_GE(cleared_objects, from_objects); |
| } |
| // freed_bytes could conceivably be negative if we fall back to nonmoving space and have to |
| // pad to a larger size. |
| int64_t freed_bytes = (int64_t)cleared_bytes - (int64_t)to_bytes; |
| uint64_t freed_objects = cleared_objects - to_objects; |
| if (kVerboseMode) { |
| LOG(INFO) << "RecordFree:" |
| << " from_bytes=" << from_bytes << " from_objects=" << from_objects |
| << " unevac_from_bytes=" << unevac_from_bytes |
| << " unevac_from_objects=" << unevac_from_objects |
| << " to_bytes=" << to_bytes << " to_objects=" << to_objects |
| << " freed_bytes=" << freed_bytes << " freed_objects=" << freed_objects |
| << " from_space size=" << region_space_->FromSpaceSize() |
| << " unevac_from_space size=" << region_space_->UnevacFromSpaceSize() |
| << " to_space size=" << region_space_->ToSpaceSize(); |
| LOG(INFO) << "(before) num_bytes_allocated=" |
| << heap_->num_bytes_allocated_.load(); |
| } |
| RecordFree(ObjectBytePair(freed_objects, freed_bytes)); |
| GetCurrentIteration()->SetScannedBytes(bytes_scanned_); |
| if (kVerboseMode) { |
| LOG(INFO) << "(after) num_bytes_allocated=" |
| << heap_->num_bytes_allocated_.load(); |
| } |
| |
| float reclaimed_bytes_ratio = static_cast<float>(freed_bytes) / num_bytes_allocated_before_gc_; |
| reclaimed_bytes_ratio_sum_ += reclaimed_bytes_ratio; |
| } |
| |
| CheckEmptyMarkStack(); |
| |
| if (heap_->dump_region_info_after_gc_) { |
| LOG(INFO) << "time=" << region_space_->Time(); |
| region_space_->DumpNonFreeRegions(LOG_STREAM(INFO)); |
| } |
| |
| if (kVerboseMode) { |
| LOG(INFO) << "GC end of ReclaimPhase"; |
| } |
| } |
| |
| std::string ConcurrentCopying::DumpReferenceInfo(mirror::Object* ref, |
| const char* ref_name, |
| const char* indent) { |
| std::ostringstream oss; |
| oss << indent << heap_->GetVerification()->DumpObjectInfo(ref, ref_name) << '\n'; |
| if (ref != nullptr) { |
| if (kUseBakerReadBarrier) { |
| oss << indent << ref_name << "->GetMarkBit()=" << ref->GetMarkBit() << '\n'; |
| oss << indent << ref_name << "->GetReadBarrierState()=" << ref->GetReadBarrierState() << '\n'; |
| } |
| } |
| if (region_space_->HasAddress(ref)) { |
| oss << indent << "Region containing " << ref_name << ":" << '\n'; |
| region_space_->DumpRegionForObject(oss, ref); |
| if (region_space_bitmap_ != nullptr) { |
| oss << indent << "region_space_bitmap_->Test(" << ref_name << ")=" |
| << std::boolalpha << region_space_bitmap_->Test(ref) << std::noboolalpha; |
| } |
| } |
| return oss.str(); |
| } |
| |
| std::string ConcurrentCopying::DumpHeapReference(mirror::Object* obj, |
| MemberOffset offset, |
| mirror::Object* ref) { |
| std::ostringstream oss; |
| constexpr const char* kIndent = " "; |
| oss << kIndent << "Invalid reference: ref=" << ref |
| << " referenced from: object=" << obj << " offset= " << offset << '\n'; |
| // Information about `obj`. |
| oss << DumpReferenceInfo(obj, "obj", kIndent) << '\n'; |
| // Information about `ref`. |
| oss << DumpReferenceInfo(ref, "ref", kIndent); |
| return oss.str(); |
| } |
| |
| void ConcurrentCopying::AssertToSpaceInvariant(mirror::Object* obj, |
| MemberOffset offset, |
| mirror::Object* ref) { |
| CHECK_EQ(heap_->collector_type_, kCollectorTypeCC) << static_cast<size_t>(heap_->collector_type_); |
| if (is_asserting_to_space_invariant_) { |
| if (ref == nullptr) { |
| // OK. |
| return; |
| } else if (region_space_->HasAddress(ref)) { |
| // Check to-space invariant in region space (moving space). |
| using RegionType = space::RegionSpace::RegionType; |
| space::RegionSpace::RegionType type = region_space_->GetRegionTypeUnsafe(ref); |
| if (type == RegionType::kRegionTypeToSpace) { |
| // OK. |
| return; |
| } else if (type == RegionType::kRegionTypeUnevacFromSpace) { |
| if (!IsMarkedInUnevacFromSpace(ref)) { |
| LOG(FATAL_WITHOUT_ABORT) << "Found unmarked reference in unevac from-space:"; |
| // Remove memory protection from the region space and log debugging information. |
| region_space_->Unprotect(); |
| LOG(FATAL_WITHOUT_ABORT) << DumpHeapReference(obj, offset, ref); |
| Thread::Current()->DumpJavaStack(LOG_STREAM(FATAL_WITHOUT_ABORT)); |
| } |
| CHECK(IsMarkedInUnevacFromSpace(ref)) << ref; |
| } else { |
| // Not OK: either a from-space ref or a reference in an unused region. |
| if (type == RegionType::kRegionTypeFromSpace) { |
| LOG(FATAL_WITHOUT_ABORT) << "Found from-space reference:"; |
| } else { |
| LOG(FATAL_WITHOUT_ABORT) << "Found reference in region with type " << type << ":"; |
| } |
| // Remove memory protection from the region space and log debugging information. |
| region_space_->Unprotect(); |
| LOG(FATAL_WITHOUT_ABORT) << DumpHeapReference(obj, offset, ref); |
| if (obj != nullptr) { |
| LogFromSpaceRefHolder(obj, offset); |
| LOG(FATAL_WITHOUT_ABORT) << "UNEVAC " << region_space_->IsInUnevacFromSpace(obj) << " " |
| << obj << " " << obj->GetMarkBit(); |
| if (region_space_->HasAddress(obj)) { |
| region_space_->DumpRegionForObject(LOG_STREAM(FATAL_WITHOUT_ABORT), obj); |
| } |
| LOG(FATAL_WITHOUT_ABORT) << "CARD " << static_cast<size_t>( |
| *Runtime::Current()->GetHeap()->GetCardTable()->CardFromAddr( |
| reinterpret_cast<uint8_t*>(obj))); |
| if (region_space_->HasAddress(obj)) { |
| LOG(FATAL_WITHOUT_ABORT) << "BITMAP " << region_space_bitmap_->Test(obj); |
| } else { |
| accounting::ContinuousSpaceBitmap* mark_bitmap = |
| heap_mark_bitmap_->GetContinuousSpaceBitmap(obj); |
| if (mark_bitmap != nullptr) { |
| LOG(FATAL_WITHOUT_ABORT) << "BITMAP " << mark_bitmap->Test(obj); |
| } else { |
| accounting::LargeObjectBitmap* los_bitmap = |
| heap_mark_bitmap_->GetLargeObjectBitmap(obj); |
| LOG(FATAL_WITHOUT_ABORT) << "BITMAP " << los_bitmap->Test(obj); |
| } |
| } |
| } |
| ref->GetLockWord(false).Dump(LOG_STREAM(FATAL_WITHOUT_ABORT)); |
| LOG(FATAL_WITHOUT_ABORT) << "Non-free regions:"; |
| region_space_->DumpNonFreeRegions(LOG_STREAM(FATAL_WITHOUT_ABORT)); |
| PrintFileToLog("/proc/self/maps", LogSeverity::FATAL_WITHOUT_ABORT); |
| MemMap::DumpMaps(LOG_STREAM(FATAL_WITHOUT_ABORT), /* terse= */ true); |
| LOG(FATAL) << "Invalid reference " << ref |
| << " referenced from object " << obj << " at offset " << offset; |
| } |
| } else { |
| // Check to-space invariant in non-moving space. |
| AssertToSpaceInvariantInNonMovingSpace(obj, ref); |
| } |
| } |
| } |
| |
| class RootPrinter { |
| public: |
| RootPrinter() { } |
| |
| template <class MirrorType> |
| ALWAYS_INLINE void VisitRootIfNonNull(mirror::CompressedReference<MirrorType>* root) |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (!root->IsNull()) { |
| VisitRoot(root); |
| } |
| } |
| |
| template <class MirrorType> |
| void VisitRoot(mirror::Object** root) |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| LOG(FATAL_WITHOUT_ABORT) << "root=" << root << " ref=" << *root; |
| } |
| |
| template <class MirrorType> |
| void VisitRoot(mirror::CompressedReference<MirrorType>* root) |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| LOG(FATAL_WITHOUT_ABORT) << "root=" << root << " ref=" << root->AsMirrorPtr(); |
| } |
| }; |
| |
| std::string ConcurrentCopying::DumpGcRoot(mirror::Object* ref) { |
| std::ostringstream oss; |
| constexpr const char* kIndent = " "; |
| oss << kIndent << "Invalid GC root: ref=" << ref << '\n'; |
| // Information about `ref`. |
| oss << DumpReferenceInfo(ref, "ref", kIndent); |
| return oss.str(); |
| } |
| |
| void ConcurrentCopying::AssertToSpaceInvariant(GcRootSource* gc_root_source, |
| mirror::Object* ref) { |
| CHECK_EQ(heap_->collector_type_, kCollectorTypeCC) << static_cast<size_t>(heap_->collector_type_); |
| if (is_asserting_to_space_invariant_) { |
| if (ref == nullptr) { |
| // OK. |
| return; |
| } else if (region_space_->HasAddress(ref)) { |
| // Check to-space invariant in region space (moving space). |
| using RegionType = space::RegionSpace::RegionType; |
| space::RegionSpace::RegionType type = region_space_->GetRegionTypeUnsafe(ref); |
| if (type == RegionType::kRegionTypeToSpace) { |
| // OK. |
| return; |
| } else if (type == RegionType::kRegionTypeUnevacFromSpace) { |
| if (!IsMarkedInUnevacFromSpace(ref)) { |
| LOG(FATAL_WITHOUT_ABORT) << "Found unmarked reference in unevac from-space:"; |
| // Remove memory protection from the region space and log debugging information. |
| region_space_->Unprotect(); |
| LOG(FATAL_WITHOUT_ABORT) << DumpGcRoot(ref); |
| } |
| CHECK(IsMarkedInUnevacFromSpace(ref)) << ref; |
| } else { |
| // Not OK: either a from-space ref or a reference in an unused region. |
| if (type == RegionType::kRegionTypeFromSpace) { |
| LOG(FATAL_WITHOUT_ABORT) << "Found from-space reference:"; |
| } else { |
| LOG(FATAL_WITHOUT_ABORT) << "Found reference in region with type " << type << ":"; |
| } |
| // Remove memory protection from the region space and log debugging information. |
| region_space_->Unprotect(); |
| LOG(FATAL_WITHOUT_ABORT) << DumpGcRoot(ref); |
| if (gc_root_source == nullptr) { |
| // No info. |
| } else if (gc_root_source->HasArtField()) { |
| ArtField* field = gc_root_source->GetArtField(); |
| LOG(FATAL_WITHOUT_ABORT) << "gc root in field " << field << " " |
| << ArtField::PrettyField(field); |
| RootPrinter root_printer; |
| field->VisitRoots(root_printer); |
| } else if (gc_root_source->HasArtMethod()) { |
| ArtMethod* method = gc_root_source->GetArtMethod(); |
| LOG(FATAL_WITHOUT_ABORT) << "gc root in method " << method << " " |
| << ArtMethod::PrettyMethod(method); |
| RootPrinter root_printer; |
| method->VisitRoots(root_printer, kRuntimePointerSize); |
| } |
| ref->GetLockWord(false).Dump(LOG_STREAM(FATAL_WITHOUT_ABORT)); |
| LOG(FATAL_WITHOUT_ABORT) << "Non-free regions:"; |
| region_space_->DumpNonFreeRegions(LOG_STREAM(FATAL_WITHOUT_ABORT)); |
| PrintFileToLog("/proc/self/maps", LogSeverity::FATAL_WITHOUT_ABORT); |
| MemMap::DumpMaps(LOG_STREAM(FATAL_WITHOUT_ABORT), /* terse= */ true); |
| LOG(FATAL) << "Invalid reference " << ref; |
| } |
| } else { |
| // Check to-space invariant in non-moving space. |
| AssertToSpaceInvariantInNonMovingSpace(/* obj= */ nullptr, ref); |
| } |
| } |
| } |
| |
| void ConcurrentCopying::LogFromSpaceRefHolder(mirror::Object* obj, MemberOffset offset) { |
| if (kUseBakerReadBarrier) { |
| LOG(INFO) << "holder=" << obj << " " << obj->PrettyTypeOf() |
| << " holder rb_state=" << obj->GetReadBarrierState(); |
| } else { |
| LOG(INFO) << "holder=" << obj << " " << obj->PrettyTypeOf(); |
| } |
| if (region_space_->IsInFromSpace(obj)) { |
| LOG(INFO) << "holder is in the from-space."; |
| } else if (region_space_->IsInToSpace(obj)) { |
| LOG(INFO) << "holder is in the to-space."; |
| } else if (region_space_->IsInUnevacFromSpace(obj)) { |
| LOG(INFO) << "holder is in the unevac from-space."; |
| if (IsMarkedInUnevacFromSpace(obj)) { |
| LOG(INFO) << "holder is marked in the region space bitmap."; |
| } else { |
| LOG(INFO) << "holder is not marked in the region space bitmap."; |
| } |
| } else { |
| // In a non-moving space. |
| if (immune_spaces_.ContainsObject(obj)) { |
| LOG(INFO) << "holder is in an immune image or the zygote space."; |
| } else { |
| LOG(INFO) << "holder is in a non-immune, non-moving (or main) space."; |
| accounting::ContinuousSpaceBitmap* mark_bitmap = heap_->GetNonMovingSpace()->GetMarkBitmap(); |
| accounting::LargeObjectBitmap* los_bitmap = nullptr; |
| const bool is_los = !mark_bitmap->HasAddress(obj); |
| if (is_los) { |
| DCHECK(heap_->GetLargeObjectsSpace() && heap_->GetLargeObjectsSpace()->Contains(obj)) |
| << "obj=" << obj |
| << " LOS bit map covers the entire lower 4GB address range"; |
| los_bitmap = heap_->GetLargeObjectsSpace()->GetMarkBitmap(); |
| } |
| if (!is_los && mark_bitmap->Test(obj)) { |
| LOG(INFO) << "holder is marked in the non-moving space mark bit map."; |
| } else if (is_los && los_bitmap->Test(obj)) { |
| LOG(INFO) << "holder is marked in the los bit map."; |
| } else { |
| // If ref is on the allocation stack, then it is considered |
| // mark/alive (but not necessarily on the live stack.) |
| if (IsOnAllocStack(obj)) { |
| LOG(INFO) << "holder is on the alloc stack."; |
| } else { |
| LOG(INFO) << "holder is not marked or on the alloc stack."; |
| } |
| } |
| } |
| } |
| LOG(INFO) << "offset=" << offset.SizeValue(); |
| } |
| |
| bool ConcurrentCopying::IsMarkedInNonMovingSpace(mirror::Object* from_ref) { |
| DCHECK(!region_space_->HasAddress(from_ref)) << "ref=" << from_ref; |
| DCHECK(!immune_spaces_.ContainsObject(from_ref)) << "ref=" << from_ref; |
| if (kUseBakerReadBarrier && from_ref->GetReadBarrierStateAcquire() == ReadBarrier::GrayState()) { |
| return true; |
| } else if (!use_generational_cc_ || done_scanning_.load(std::memory_order_acquire)) { |
| // Read the comment in IsMarkedInUnevacFromSpace() |
| accounting::ContinuousSpaceBitmap* mark_bitmap = heap_->GetNonMovingSpace()->GetMarkBitmap(); |
| accounting::LargeObjectBitmap* los_bitmap = nullptr; |
| const bool is_los = !mark_bitmap->HasAddress(from_ref); |
| if (is_los) { |
| DCHECK(heap_->GetLargeObjectsSpace() && heap_->GetLargeObjectsSpace()->Contains(from_ref)) |
| << "ref=" << from_ref |
| << " doesn't belong to non-moving space and large object space doesn't exist"; |
| los_bitmap = heap_->GetLargeObjectsSpace()->GetMarkBitmap(); |
| } |
| if (is_los ? los_bitmap->Test(from_ref) : mark_bitmap->Test(from_ref)) { |
| return true; |
| } |
| } |
| return IsOnAllocStack(from_ref); |
| } |
| |
| void ConcurrentCopying::AssertToSpaceInvariantInNonMovingSpace(mirror::Object* obj, |
| mirror::Object* ref) { |
| CHECK(ref != nullptr); |
| CHECK(!region_space_->HasAddress(ref)) << "obj=" << obj << " ref=" << ref; |
| // In a non-moving space. Check that the ref is marked. |
| if (immune_spaces_.ContainsObject(ref)) { |
| // Immune space case. |
| if (kUseBakerReadBarrier) { |
| // Immune object may not be gray if called from the GC. |
| if (Thread::Current() == thread_running_gc_ && !gc_grays_immune_objects_) { |
| return; |
| } |
| bool updated_all_immune_objects = updated_all_immune_objects_.load(std::memory_order_seq_cst); |
| CHECK(updated_all_immune_objects || ref->GetReadBarrierState() == ReadBarrier::GrayState()) |
| << "Unmarked immune space ref. obj=" << obj << " rb_state=" |
| << (obj != nullptr ? obj->GetReadBarrierState() : 0U) |
| << " ref=" << ref << " ref rb_state=" << ref->GetReadBarrierState() |
| << " updated_all_immune_objects=" << updated_all_immune_objects; |
| } |
| } else { |
| // Non-moving space and large-object space (LOS) cases. |
| // If `ref` is on the allocation stack, then it may not be |
| // marked live, but considered marked/alive (but not |
| // necessarily on the live stack). |
| CHECK(IsMarkedInNonMovingSpace(ref)) |
| << "Unmarked ref that's not on the allocation stack." |
| << " obj=" << obj |
| << " ref=" << ref |
| << " rb_state=" << ref->GetReadBarrierState() |
| << " is_marking=" << std::boolalpha << is_marking_ << std::noboolalpha |
| << " young_gen=" << std::boolalpha << young_gen_ << std::noboolalpha |
| << " done_scanning=" |
| << std::boolalpha << done_scanning_.load(std::memory_order_acquire) << std::noboolalpha |
| << " self=" << Thread::Current(); |
| } |
| } |
| |
| // Used to scan ref fields of an object. |
| template <bool kNoUnEvac> |
| class ConcurrentCopying::RefFieldsVisitor { |
| public: |
| explicit RefFieldsVisitor(ConcurrentCopying* collector, Thread* const thread) |
| : collector_(collector), thread_(thread) { |
| // Cannot have `kNoUnEvac` when Generational CC collection is disabled. |
| DCHECK_IMPLIES(kNoUnEvac, collector_->use_generational_cc_); |
| } |
| |
| void operator()(mirror::Object* obj, MemberOffset offset, bool /* is_static */) |
| const ALWAYS_INLINE REQUIRES_SHARED(Locks::mutator_lock_) |
| REQUIRES_SHARED(Locks::heap_bitmap_lock_) { |
| collector_->Process<kNoUnEvac>(obj, offset); |
| } |
| |
| void operator()(ObjPtr<mirror::Class> klass, ObjPtr<mirror::Reference> ref) const |
| REQUIRES_SHARED(Locks::mutator_lock_) ALWAYS_INLINE { |
| CHECK(klass->IsTypeOfReferenceClass()); |
| collector_->DelayReferenceReferent(klass, ref); |
| } |
| |
| void VisitRootIfNonNull(mirror::CompressedReference<mirror::Object>* root) const |
| ALWAYS_INLINE |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| if (!root->IsNull()) { |
| VisitRoot(root); |
| } |
| } |
| |
| void VisitRoot(mirror::CompressedReference<mirror::Object>* root) const |
| ALWAYS_INLINE |
| REQUIRES_SHARED(Locks::mutator_lock_) { |
| collector_->MarkRoot</*kGrayImmuneObject=*/false>(thread_, root); |
| } |
| |
| private: |
| ConcurrentCopying* const collector_; |
| Thread* const thread_; |
| }; |
| |
| template <bool kNoUnEvac> |
| inline void ConcurrentCopying::Scan(mirror::Object* to_ref, size_t obj_size) { |
| // Cannot have `kNoUnEvac` when Generational CC collection is disabled. |
| DCHECK_IMPLIES(kNoUnEvac, use_generational_cc_); |
| if (kDisallowReadBarrierDuringScan && !Runtime::Current()->IsActiveTransaction()) { |
| // Avoid all read barriers during visit references to help performance. |
| // Don't do this in transaction mode because we may read the old value of an field which may |
| // trigger read barriers. |
| Thread::Current()->ModifyDebugDisallowReadBarrier(1); |
| } |
| if (obj_size == 0) { |
| obj_size = to_ref->SizeOf<kDefaultVerifyFlags>(); |
| } |
| bytes_scanned_ += obj_size; |
| |
| DCHECK(!region_space_->IsInFromSpace(to_ref)); |
| DCHECK_EQ(Thread::Current(), thread_running_gc_); |
| RefFieldsVisitor<kNoUnEvac> visitor(this, thread_running_gc_); |
| // Disable the read barrier for a performance reason. |
| to_ref->VisitReferences</*kVisitNativeRoots=*/true, kDefaultVerifyFlags, kWithoutReadBarrier>( |
| visitor, visitor); |
| if (kDisallowReadBarrierDuringScan && !Runtime::Current()->IsActiveTransaction()) { |
| thread_running_gc_->ModifyDebugDisallowReadBarrier(-1); |
| } |
| } |
| |
| template <bool kNoUnEvac> |
| inline void ConcurrentCopying::Process(mirror::Object* obj, MemberOffset offset) { |
| // Cannot have `kNoUnEvac` when Generational CC collection is disabled. |
| DCHECK_IMPLIES(kNoUnEvac, use_generational_cc_); |
| DCHECK_EQ(Thread::Current(), thread_running_gc_); |
| mirror::Object* ref = obj->GetFieldObject< |
| mirror::Object, kVerifyNone, kWithoutReadBarrier, false>(offset); |
| mirror::Object* to_ref = Mark</*kGrayImmuneObject=*/false, kNoUnEvac, /*kFromGCThread=*/true>( |
| thread_running_gc_, |
| ref, |
| /*holder=*/ obj, |
| offset); |
| if (to_ref == ref) { |
| return; |
| } |
| // This may fail if the mutator writes to the field at the same time. But it's ok. |
| mirror::Object* expected_ref = ref; |
| mirror::Object* new_ref = to_ref; |
| do { |
| if (expected_ref != |
| obj->GetFieldObject<mirror::Object, kVerifyNone, kWithoutReadBarrier, false>(offset)) { |
| // It was updated by the mutator. |
| break; |
| } |
| // Use release CAS to make sure threads reading the reference see contents of copied objects. |
| } while (!obj->CasFieldObjectWithoutWriteBarrier<false, false, kVerifyNone>( |
| offset, |
| expected_ref, |
| new_ref, |
| CASMode::kWeak, |
| std::memory_order_release)); |
| } |
| |
| // Process some roots. |
| inline void ConcurrentCopying::VisitRoots( |
| mirror::Object*** roots, size_t count, const RootInfo& info ATTRIBUTE_UNUSED) { |
| Thread* const self = Thread::Current(); |
| for (size_t i = 0; i < count; ++i) { |
| mirror::Object** root = roots[i]; |
| mirror::Object* ref = *root; |
| mirror::Object* to_ref = Mark(self, ref); |
| if (to_ref == ref) { |
| continue; |
| } |
| Atomic<mirror::Object*>* addr = reinterpret_cast<Atomic<mirror::Object*>*>(root); |
| mirror::Object* expected_ref = ref; |
| mirror::Object* new_ref = to_ref; |
| do { |
| if (expected_ref != addr->load(std::memory_order_relaxed)) { |
| // It was updated by the mutator. |
| break; |
| } |
| } while (!addr->CompareAndSetWeakRelaxed(expected_ref, new_ref)); |
| } |
| } |
| |
| template<bool kGrayImmuneObject> |
| inline void ConcurrentCopying::MarkRoot(Thread* const self, |
| mirror::CompressedReference<mirror::Object>* root) { |
| DCHECK(!root->IsNull()); |
| mirror::Object* const ref = root->AsMirrorPtr(); |
| mirror::Object* to_ref = Mark<kGrayImmuneObject>(self, ref); |
| if (to_ref != ref) { |
| auto* addr = reinterpret_cast<Atomic<mirror::CompressedReference<mirror::Object>>*>(root); |
| auto expected_ref = mirror::CompressedReference<mirror::Object>::FromMirrorPtr(ref); |
| auto new_ref = mirror::CompressedReference<mirror::Object>::FromMirrorPtr(to_ref); |
| // If the cas fails, then it was updated by the mutator. |
| do { |
| if (ref != addr->load(std::memory_order_relaxed).AsMirrorPtr()) { |
| // It was updated by the mutator. |
| break; |
| } |
| } while (!addr->CompareAndSetWeakRelaxed(expected_ref, new_ref)); |
| } |
| } |
| |
| inline void ConcurrentCopying::VisitRoots( |
| mirror::CompressedReference<mirror::Object>** roots, size_t count, |
| const RootInfo& info ATTRIBUTE_UNUSED) { |
| Thread* const self = Thread::Current(); |
| for (size_t i = 0; i < count; ++i) { |
| mirror::CompressedReference<mirror::Object>* const root = roots[i]; |
| if (!root->IsNull()) { |
| // kGrayImmuneObject is true because this is used for the thread flip. |
| MarkRoot</*kGrayImmuneObject=*/true>(self, root); |
| } |
| } |
| } |
| |
| // Temporary set gc_grays_immune_objects_ to true in a scope if the current thread is GC. |
| class ConcurrentCopying::ScopedGcGraysImmuneObjects { |
| public: |
| explicit ScopedGcGraysImmuneObjects(ConcurrentCopying* collector) |
| : collector_(collector), enabled_(false) { |
| if (kUseBakerReadBarrier && |
| collector_->thread_running_gc_ == Thread::Current() && |
| !collector_->gc_grays_immune_objects_) { |
| collector_->gc_grays_immune_objects_ = true; |
| enabled_ = true; |
| } |
| } |
| |
| ~ScopedGcGraysImmuneObjects() { |
| if (kUseBakerReadBarrier && |
| collector_->thread_running_gc_ == Thread::Current() && |
| enabled_) { |
| DCHECK(collector_->gc_grays_immune_objects_); |
| collector_->gc_grays_immune_objects_ = false; |
| } |
| } |
| |
| private: |
| ConcurrentCopying* const collector_; |
| bool enabled_; |
| }; |
| |
| // Fill the given memory block with a fake object. Used to fill in a |
| // copy of objects that was lost in race. |
| void ConcurrentCopying::FillWithFakeObject(Thread* const self, |
| mirror::Object* fake_obj, |
| size_t byte_size) { |
| // GC doesn't gray immune objects while scanning immune objects. But we need to trigger the read |
| // barriers here because we need the updated reference to the int array class, etc. Temporary set |
| // gc_grays_immune_objects_ to true so that we won't cause a DCHECK failure in MarkImmuneSpace(). |
| ScopedGcGraysImmuneObjects scoped_gc_gray_immune_objects(this); |
| CHECK_ALIGNED(byte_size, kObjectAlignment); |
| memset(fake_obj, 0, byte_size); |
| // Avoid going through read barrier for since kDisallowReadBarrierDuringScan may be enabled. |
| // Explicitly mark to make sure to get an object in the to-space. |
| mirror::Class* int_array_class = down_cast<mirror::Class*>( |
| Mark(self, GetClassRoot<mirror::IntArray, kWithoutReadBarrier>().Ptr())); |
| CHECK(int_array_class != nullptr); |
| if (ReadBarrier::kEnableToSpaceInvariantChecks) { |
| AssertToSpaceInvariant(nullptr, MemberOffset(0), int_array_class); |
| } |
| size_t component_size = int_array_class->GetComponentSize(); |
| CHECK_EQ(component_size, sizeof(int32_t)); |
| size_t data_offset = mirror::Array::DataOffset(component_size).SizeValue(); |
| if (data_offset > byte_size) { |
| // An int array is too big. Use java.lang.Object. |
| CHECK(java_lang_Object_ != nullptr); |
| if (ReadBarrier::kEnableToSpaceInvariantChecks) { |
| AssertToSpaceInvariant(nullptr, MemberOffset(0), java_lang_Object_); |
| } |
| CHECK_EQ(byte_size, java_lang_Object_->GetObjectSize<kVerifyNone>()); |
| fake_obj->SetClass(java_lang_Object_); |
| CHECK_EQ(byte_size, (fake_obj->SizeOf<kVerifyNone>())); |
| } else { |
| // Use an int array. |
| fake_obj->SetClass(int_array_class); |
| CHECK(fake_obj->IsArrayInstance<kVerifyNone>()); |
| int32_t length = (byte_size - data_offset) / component_size; |
| ObjPtr<mirror::Array> fake_arr = fake_obj->AsArray<kVerifyNone>(); |
| fake_arr->SetLength(length); |
| CHECK_EQ(fake_arr->GetLength(), length) |
| << "byte_size=" << byte_size << " length=" << length |
| << " component_size=" << component_size << " data_offset=" << data_offset; |
| CHECK_EQ(byte_size, (fake_obj->SizeOf<kVerifyNone>())) |
| << "byte_size=" << byte_size << " length=" << length |
| << " component_size=" << component_size << " data_offset=" << data_offset; |
| } |
| } |
| |
| // Reuse the memory blocks that were copy of objects that were lost in race. |
| mirror::Object* ConcurrentCopying::AllocateInSkippedBlock(Thread* const self, size_t alloc_size) { |
| // Try to reuse the blocks that were unused due to CAS failures. |
| CHECK_ALIGNED(alloc_size, space::RegionSpace::kAlignment); |
| size_t min_object_size = RoundUp(sizeof(mirror::Object), space::RegionSpace::kAlignment); |
| size_t byte_size; |
| uint8_t* addr; |
| { |
| MutexLock mu(self, skipped_blocks_lock_); |
| auto it = skipped_blocks_map_.lower_bound(alloc_size); |
| if (it == skipped_blocks_map_.end()) { |
| // Not found. |
| return nullptr; |
| } |
| byte_size = it->first; |
| CHECK_GE(byte_size, alloc_size); |
| if (byte_size > alloc_size && byte_size - alloc_size < min_object_size) { |
| // If remainder would be too small for a fake object, retry with a larger request size. |
| it = skipped_blocks_map_.lower_bound(alloc_size + min_object_size); |
| if (it == skipped_blocks_map_.end()) { |
| // Not found. |
| return nullptr; |
| } |
| CHECK_ALIGNED(it->first - alloc_size, space::RegionSpace::kAlignment); |
| CHECK_GE(it->first - alloc_size, min_object_size) |
| << "byte_size=" << byte_size << " it->first=" << it->first << " alloc_size=" << alloc_size; |
| } |
| // Found a block. |
| CHECK(it != skipped_blocks_map_.end()); |
| byte_size = it->first; |
| addr = it->second; |
| CHECK_GE(byte_size, alloc_size); |
| CHECK(region_space_->IsInToSpace(reinterpret_cast<mirror::Object*>(addr))); |
| CHECK_ALIGNED(byte_size, space::RegionSpace::kAlignment); |
| if (kVerboseMode) { |
| LOG(INFO) << "Reusing skipped bytes : " << reinterpret_cast<void*>(addr) << ", " << byte_size; |
| } |
| skipped_blocks_map_.erase(it); |
| } |
| memset(addr, 0, byte_size); |
| if (byte_size > alloc_size) { |
| // Return the remainder to the map. |
| CHECK_ALIGNED(byte_size - alloc_size, space::RegionSpace::kAlignment); |
| CHECK_GE(byte_size - alloc_size, min_object_size); |
| // FillWithFakeObject may mark an object, avoid holding skipped_blocks_lock_ to prevent lock |
| // violation and possible deadlock. The deadlock case is a recursive case: |
| // FillWithFakeObject -> Mark(IntArray.class) -> Copy -> AllocateInSkippedBlock. |
| FillWithFakeObject(self, |
| reinterpret_cast<mirror::Object*>(addr + alloc_size), |
| byte_size - alloc_size); |
| CHECK(region_space_->IsInToSpace(reinterpret_cast<mirror::Object*>(addr + alloc_size))); |
| { |
| MutexLock mu(self, skipped_blocks_lock_); |
| skipped_blocks_map_.insert(std::make_pair(byte_size - alloc_size, addr + alloc_size)); |
| } |
| } |
| return reinterpret_cast<mirror::Object*>(addr); |
| } |
| |
| mirror::Object* ConcurrentCopying::Copy(Thread* const self, |
| mirror::Object* from_ref, |
| mirror::Object* holder, |
| MemberOffset offset) { |
| DCHECK(region_space_->IsInFromSpace(from_ref)); |
| // If the class pointer is null, the object is invalid. This could occur for a dangling pointer |
| // from a previous GC that is either inside or outside the allocated region. |
| mirror::Class* klass = from_ref->GetClass<kVerifyNone, kWithoutReadBarrier>(); |
| if (UNLIKELY(klass == nullptr)) { |
| // Remove memory protection from the region space and log debugging information. |
| region_space_->Unprotect(); |
| heap_->GetVerification()->LogHeapCorruption(holder, offset, from_ref, /* fatal= */ true); |
| } |
| // There must not be a read barrier to avoid nested RB that might violate the to-space invariant. |
| // Note that from_ref is a from space ref so the SizeOf() call will access the from-space meta |
| // objects, but it's ok and necessary. |
| size_t obj_size = from_ref->SizeOf<kDefaultVerifyFlags>(); |
| size_t region_space_alloc_size = RoundUp(obj_size, space::RegionSpace::kAlignment); |
| // Large objects are never evacuated. |
| CHECK_LE(region_space_alloc_size, space::RegionSpace::kRegionSize); |
| size_t region_space_bytes_allocated = 0U; |
| size_t non_moving_space_bytes_allocated = 0U; |
| size_t bytes_allocated = 0U; |
| size_t unused_size; |
| bool fall_back_to_non_moving = false; |
| mirror::Object* to_ref = region_space_->AllocNonvirtual</*kForEvac=*/ true>( |
| region_space_alloc_size, ®ion_space_bytes_allocated, nullptr, &unused_size); |
| bytes_allocated = region_space_bytes_allocated; |
| if (LIKELY(to_ref != nullptr)) { |
| DCHECK_EQ(region_space_alloc_size, region_space_bytes_allocated); |
| } else { |
| // Failed to allocate in the region space. Try the skipped blocks. |
| to_ref = AllocateInSkippedBlock(self, region_space_alloc_size); |
| if (to_ref != nullptr) { |
| // Succeeded to allocate in a skipped block. |
| if (heap_->use_tlab_) { |
| // This is necessary for the tlab case as it's not accounted in the space. |
| region_space_->RecordAlloc(to_ref); |
| } |
| bytes_allocated = region_space_alloc_size; |
| heap_->num_bytes_allocated_.fetch_sub(bytes_allocated, std::memory_order_relaxed); |
| to_space_bytes_skipped_.fetch_sub(bytes_allocated, std::memory_order_relaxed); |
| to_space_objects_skipped_.fetch_sub(1, std::memory_order_relaxed); |
| } else { |
| // Fall back to the non-moving space. |
| fall_back_to_non_moving = true; |
| if (kVerboseMode) { |
| LOG(INFO) << "Out of memory in the to-space. Fall back to non-moving. skipped_bytes=" |
| << to_space_bytes_skipped_.load(std::memory_order_relaxed) |
| << " skipped_objects=" |
| << to_space_objects_skipped_.load(std::memory_order_relaxed); |
| } |
| to_ref = heap_->non_moving_space_->Alloc( |
| self, obj_size, &non_moving_space_bytes_allocated, nullptr, &unused_size); |
| if (UNLIKELY(to_ref == nullptr)) { |
| LOG(FATAL_WITHOUT_ABORT) << "Fall-back non-moving space allocation failed for a " |
| << obj_size << " byte object in region type " |
| << region_space_->GetRegionType(from_ref); |
| LOG(FATAL) << "Object address=" << from_ref << " type=" << from_ref->PrettyTypeOf(); |
| } |
| bytes_allocated = non_moving_space_bytes_allocated; |
| } |
| } |
| DCHECK(to_ref != nullptr); |
| |
| // Copy the object excluding the lock word since that is handled in the loop. |
| to_ref->SetClass(klass); |
| const size_t kObjectHeaderSize = sizeof(mirror::Object); |
| DCHECK_GE(obj_size, kObjectHeaderSize); |
| static_assert(kObjectHeaderSize == sizeof(mirror::HeapReference<mirror::Class>) + |
| sizeof(LockWord), |
| "Object header size does not match"); |
| // Memcpy can tear for words since it may do byte copy. It is only safe to do this since the |
| // object in the from space is immutable other than the lock word. b/31423258 |
| memcpy(reinterpret_cast<uint8_t*>(to_ref) + kObjectHeaderSize, |
| reinterpret_cast<const uint8_t*>(from_ref) + kObjectHeaderSize, |
| obj_size - kObjectHeaderSize); |
| |
| // Attempt to install the forward pointer. This is in a loop as the |
| // lock word atomic write can fail. |
| while (true) { |
| LockWord old_lock_word = from_ref->GetLockWord(false); |
| |
| if (old_lock_word.GetState() == LockWord::kForwardingAddress) { |
| // Lost the race. Another thread (either GC or mutator) stored |
| // the forwarding pointer first. Make the lost copy (to_ref) |
| // look like a valid but dead (fake) object and keep it for |
| // future reuse. |
| FillWithFakeObject(self, to_ref, bytes_allocated); |
| if (!fall_back_to_non_moving) { |
| DCHECK(region_space_->IsInToSpace(to_ref)); |
| // Record the lost copy for later reuse. |
| heap_->num_bytes_allocated_.fetch_add(bytes_allocated, std::memory_order_relaxed); |
| to_space_bytes_skipped_.fetch_add(bytes_allocated, std::memory_order_relaxed); |
| to_space_objects_skipped_.fetch_add(1, std::memory_order_relaxed); |
| MutexLock mu(self, skipped_blocks_lock_); |
| skipped_blocks_map_.insert(std::make_pair(bytes_allocated, |
| reinterpret_cast<uint8_t*>(to_ref))); |
| } else { |
| DCHECK(heap_->non_moving_space_->HasAddress(to_ref)); |
| DCHECK_EQ(bytes_allocated, non_moving_space_bytes_allocated); |
| // Free the non-moving-space chunk. |
| heap_->non_moving_space_->Free(self, to_ref); |
| } |
| |
| // Get the winner's forward ptr. |
| mirror::Object* lost_fwd_ptr = to_ref; |
| to_ref = reinterpret_cast<mirror::Object*>(old_lock_word.ForwardingAddress()); |
| CHECK(to_ref != nullptr); |
| CHECK_NE(to_ref, lost_fwd_ptr); |
| CHECK(region_space_->IsInToSpace(to_ref) || heap_->non_moving_space_->HasAddress(to_ref)) |
| << "to_ref=" << to_ref << " " << heap_->DumpSpaces(); |
| CHECK_NE(to_ref->GetLockWord(false).GetState(), LockWord::kForwardingAddress); |
| return to_ref; |
| } |
| |
| // Copy the old lock word over since we did not copy it yet. |
| to_ref->SetLockWord(old_lock_word, false); |
| // Set the gray ptr. |
| if (kUseBakerReadBarrier) { |
| to_ref->SetReadBarrierState(ReadBarrier::GrayState()); |
| } |
| |
| LockWord new_lock_word = LockWord::FromForwardingAddress(reinterpret_cast<size_t>(to_ref)); |
| |
| // Try to atomically write the fwd ptr. Make sure that the copied object is visible to any |
| // readers of the fwd pointer. |
| bool success = from_ref->CasLockWord(old_lock_word, |
| new_lock_word, |
| CASMode::kWeak, |
| std::memory_order_release); |
| if (LIKELY(success)) { |
| // The CAS succeeded. |
| DCHECK(thread_running_gc_ != nullptr); |
| if (LIKELY(self == thread_running_gc_)) { |
| objects_moved_gc_thread_ += 1; |
| bytes_moved_gc_thread_ += bytes_allocated; |
| } else { |
| objects_moved_.fetch_add(1, std::memory_order_relaxed); |
| bytes_moved_.fetch_add(bytes_allocated, std::memory_order_relaxed); |
| } |
| |
| if (LIKELY(!fall_back_to_non_moving)) { |
| DCHECK(region_space_->IsInToSpace(to_ref)); |
| } else { |
| DCHECK(heap_->non_moving_space_->HasAddress(to_ref)); |
| DCHECK_EQ(bytes_allocated, non_moving_space_bytes_allocated); |
| if (!use_generational_cc_ || !young_gen_) { |
| // Mark it in the live bitmap. |
| CHECK(!heap_->non_moving_space_->GetLiveBitmap()->AtomicTestAndSet(to_ref)); |
| } |
| if (!kUseBakerReadBarrier) { |
| // Mark it in the mark bitmap. |
| CHECK(!heap_->non_moving_space_->GetMarkBitmap()->AtomicTestAndSet(to_ref)); |
| } |
| } |
| if (kUseBakerReadBarrier) { |
| DCHECK(to_ref->GetReadBarrierState() == ReadBarrier::GrayState()); |
| } |
| DCHECK(GetFwdPtr(from_ref) == to_ref); |
| CHECK_NE(to_ref->GetLockWord(false).GetState(), LockWord::kForwardingAddress); |
| // Make sure that anyone who sees to_ref also sees both the object contents and the |
| // fwd pointer. |
| QuasiAtomic::ThreadFenceForConstructor(); |
| PushOntoMarkStack(self, to_ref); |
| return to_ref; |
| } else { |
| // The CAS failed. It may have lost the race or may have failed |
| // due to monitor/hashcode ops. Either way, retry. |
| } |
| } |
| } |
| |
| mirror::Object* ConcurrentCopying::IsMarked(mirror::Object* from_ref) { |
| DCHECK(from_ref != nullptr); |
| space::RegionSpace::RegionType rtype = region_space_->GetRegionType(from_ref); |
| if (rtype == space::RegionSpace::RegionType::kRegionTypeToSpace) { |
| // It's already marked. |
| return from_ref; |
| } |
| mirror::Object* to_ref; |
| if (rtype == space::RegionSpace::RegionType::kRegionTypeFromSpace) { |
| to_ref = GetFwdPtr(from_ref); |
| DCHECK(to_ref == nullptr || region_space_->IsInToSpace(to_ref) || |
| heap_->non_moving_space_->HasAddress(to_ref)) |
| << "from_ref=" << from_ref << " to_ref=" << to_ref; |
| } else if (rtype == space::RegionSpace::RegionType::kRegionTypeUnevacFromSpace) { |
| if (IsMarkedInUnevacFromSpace(from_ref)) { |
| to_ref = from_ref; |
| } else { |
| to_ref = nullptr; |
| } |
| } else { |
| // At this point, `from_ref` should not be in the region space |
| // (i.e. within an "unused" region). |
| DCHECK(!region_space_->HasAddress(from_ref)) << from_ref; |
| // from_ref is in a non-moving space. |
| if (immune_spaces_.ContainsObject(from_ref)) { |
| // An immune object is alive. |
| to_ref = from_ref; |
| } else { |
| // Non-immune non-moving space. Use the mark bitmap. |
| if (IsMarkedInNonMovingSpace(from_ref)) { |
| // Already marked. |
| to_ref = from_ref; |
| } else { |
| to_ref = nullptr; |
| } |
| } |
| } |
| return to_ref; |
| } |
| |
| bool ConcurrentCopying::IsOnAllocStack(mirror::Object* ref) { |
| // TODO: Explain why this is here. What release operation does it pair with? |
| std::atomic_thread_fence(std::memory_order_acquire); |
| accounting::ObjectStack* alloc_stack = GetAllocationStack(); |
| return alloc_stack->Contains(ref); |
| } |
| |
| mirror::Object* ConcurrentCopying::MarkNonMoving(Thread* const self, |
| mirror::Object* ref, |
| mirror::Object* holder, |
| MemberOffset offset) { |
| // ref is in a non-moving space (from_ref == to_ref). |
| DCHECK(!region_space_->HasAddress(ref)) << ref; |
| DCHECK(!immune_spaces_.ContainsObject(ref)); |
| // Use the mark bitmap. |
| accounting::ContinuousSpaceBitmap* mark_bitmap = heap_->GetNonMovingSpace()->GetMarkBitmap(); |
| accounting::LargeObjectBitmap* los_bitmap = nullptr; |
| const bool is_los = !mark_bitmap->HasAddress(ref); |
| if (is_los) { |
| if (!IsAligned<kPageSize>(ref)) { |
| // Ref is a large object that is not aligned, it must be heap |
| // corruption. Remove memory protection and dump data before |
| // AtomicSetReadBarrierState since it will fault if the address is not |
| // valid. |
| region_space_->Unprotect(); |
| heap_->GetVerification()->LogHeapCorruption(holder, offset, ref, /* fatal= */ true); |
| } |
| DCHECK(heap_->GetLargeObjectsSpace()) |
| << "ref=" << ref |
| << " doesn't belong to non-moving space and large object space doesn't exist"; |
| los_bitmap = heap_->GetLargeObjectsSpace()->GetMarkBitmap(); |
| DCHECK(los_bitmap->HasAddress(ref)); |
| } |
| if (use_generational_cc_) { |
| // The sticky-bit CC collector is only compatible with Baker-style read barriers. |
| DCHECK(kUseBakerReadBarrier); |
| // Not done scanning, use AtomicSetReadBarrierPointer. |
| if (!done_scanning_.load(std::memory_order_acquire)) { |
| // Since the mark bitmap is still filled in from last GC, we can not use that or else the |
| // mutator may see references to the from space. Instead, use the Baker pointer itself as |
| // the mark bit. |
| // |
| // We need to avoid marking objects that are on allocation stack as that will lead to a |
| // situation (after this GC cycle is finished) where some object(s) are on both allocation |
| // stack and live bitmap. This leads to visiting the same object(s) twice during a heapdump |
| // (b/117426281). |
| if (!IsOnAllocStack(ref) && |
| ref->AtomicSetReadBarrierState(ReadBarrier::NonGrayState(), ReadBarrier::GrayState())) { |
| // TODO: We don't actually need to scan this object later, we just need to clear the gray |
| // bit. |
| // We don't need to mark newly allocated objects (those in allocation stack) as they can |
| // only point to to-space objects. Also, they are considered live till the next GC cycle. |
| PushOntoMarkStack(self, ref); |
| } |
| return ref; |
| } |
| } |
| if (!is_los && mark_bitmap->Test(ref)) { |
| // Already marked. |
| } else if (is_los && los_bitmap->Test(ref)) { |
| // Already marked in LOS. |
| } else if (IsOnAllocStack(ref)) { |
| // If it's on the allocation stack, it's considered marked. Keep it white (non-gray). |
| // Objects on the allocation stack need not be marked. |
| if (!is_los) { |
| DCHECK(!mark_bitmap->Test(ref)); |
| } else { |
| DCHECK(!los_bitmap->Test(ref)); |
| } |
| if (kUseBakerReadBarrier) { |
| DCHECK_EQ(ref->GetReadBarrierState(), ReadBarrier::NonGrayState()); |
| } |
| } else { |
| // Not marked nor on the allocation stack. Try to mark it. |
| // This may or may not succeed, which is ok. |
| bool success = false; |
| if (kUseBakerReadBarrier) { |
| success = ref->AtomicSetReadBarrierState(ReadBarrier::NonGrayState(), |
| ReadBarrier::GrayState()); |
| } else { |
| success = is_los ? |
| !los_bitmap->AtomicTestAndSet(ref) : |
| !mark_bitmap->AtomicTestAndSet(ref); |
| } |
| if (success) { |
| if (kUseBakerReadBarrier) { |
| DCHECK_EQ(ref->GetReadBarrierState(), ReadBarrier::GrayState()); |
| } |
| PushOntoMarkStack(self, ref); |
| } |
| } |
| return ref; |
| } |
| |
| void ConcurrentCopying::FinishPhase() { |
| Thread* const self = Thread::Current(); |
| { |
| MutexLock mu(self, mark_stack_lock_); |
| CHECK(revoked_mark_stacks_.empty()); |
| CHECK_EQ(pooled_mark_stacks_.size(), kMarkStackPoolSize); |
| } |
| // kVerifyNoMissingCardMarks relies on the region space cards not being cleared to avoid false |
| // positives. |
| if (!kVerifyNoMissingCardMarks && !use_generational_cc_) { |
| TimingLogger::ScopedTiming split("ClearRegionSpaceCards", GetTimings()); |
| // We do not currently use the region space cards at all, madvise them away to save ram. |
| heap_->GetCardTable()->ClearCardRange(region_space_->Begin(), region_space_->Limit()); |
| } else if (use_generational_cc_ && !young_gen_) { |
| region_space_inter_region_bitmap_.Clear(); |
| non_moving_space_inter_region_bitmap_.Clear(); |
| } |
| { |
| MutexLock mu(self, skipped_blocks_lock_); |
| skipped_blocks_map_.clear(); |
| } |
| { |
| ReaderMutexLock mu(self, *Locks::mutator_lock_); |
| { |
| WriterMutexLock mu2(self, *Locks::heap_bitmap_lock_); |
| heap_->ClearMarkedObjects(); |
| } |
| if (kUseBakerReadBarrier && kFilterModUnionCards) { |
| TimingLogger::ScopedTiming split("FilterModUnionCards", GetTimings()); |
| ReaderMutexLock mu2(self, *Locks::heap_bitmap_lock_); |
| for (space::ContinuousSpace* space : immune_spaces_.GetSpaces()) { |
| DCHECK(space->IsImageSpace() || space->IsZygoteSpace()); |
| accounting::ModUnionTable* table = heap_->FindModUnionTableFromSpace(space); |
| // Filter out cards that don't need to be set. |
| if (table != nullptr) { |
| table->FilterCards(); |
| } |
| } |
| } |
| if (kUseBakerReadBarrier) { |
| TimingLogger::ScopedTiming split("EmptyRBMarkBitStack", GetTimings()); |
| DCHECK(rb_mark_bit_stack_ != nullptr); |
| const auto* limit = rb_mark_bit_stack_->End(); |
| for (StackReference<mirror::Object>* it = rb_mark_bit_stack_->Begin(); it != limit; ++it) { |
| CHECK(it->AsMirrorPtr()->AtomicSetMarkBit(1, 0)) |
| << "rb_mark_bit_stack_->Begin()" << rb_mark_bit_stack_->Begin() << '\n' |
| << "rb_mark_bit_stack_->End()" << rb_mark_bit_stack_->End() << '\n' |
| << "rb_mark_bit_stack_->IsFull()" |
| << std::boolalpha << rb_mark_bit_stack_->IsFull() << std::noboolalpha << '\n' |
| << DumpReferenceInfo(it->AsMirrorPtr(), "*it"); |
| } |
| rb_mark_bit_stack_->Reset(); |
| } |
| } |
| if (measure_read_barrier_slow_path_) { |
| MutexLock mu(self, rb_slow_path_histogram_lock_); |
| rb_slow_path_time_histogram_.AdjustAndAddValue( |
| rb_slow_path_ns_.load(std::memory_order_relaxed)); |
| rb_slow_path_count_total_ += rb_slow_path_count_.load(std::memory_order_relaxed); |
| rb_slow_path_count_gc_total_ += rb_slow_path_count_gc_.load(std::memory_order_relaxed); |
| } |
| } |
| |
| bool ConcurrentCopying::IsNullOrMarkedHeapReference(mirror::HeapReference<mirror::Object>* field, |
| bool do_atomic_update) { |
| mirror::Object* from_ref = field->AsMirrorPtr(); |
| if (from_ref == nullptr) { |
| return true; |
| } |
| mirror::Object* to_ref = IsMarked(from_ref); |
| if (to_ref == nullptr) { |
| return false; |
| } |
| if (from_ref != to_ref) { |
| if (do_atomic_update) { |
| do { |
| if (field->AsMirrorPtr() != from_ref) { |
| // Concurrently overwritten by a mutator. |
| break; |
| } |
| } while (!field->CasWeakRelaxed(from_ref, to_ref)); |
| } else { |
| field->Assign(to_ref); |
| } |
| } |
| return true; |
| } |
| |
| mirror::Object* ConcurrentCopying::MarkObject(mirror::Object* from_ref) { |
| return Mark(Thread::Current(), from_ref); |
| } |
| |
| void ConcurrentCopying::DelayReferenceReferent(ObjPtr<mirror::Class> klass, |
| ObjPtr<mirror::Reference> reference) { |
| heap_->GetReferenceProcessor()->DelayReferenceReferent(klass, reference, this); |
| } |
| |
| void ConcurrentCopying::ProcessReferences(Thread* self) { |
| // We don't really need to lock the heap bitmap lock as we use CAS to mark in bitmaps. |
| WriterMutexLock mu(self, *Locks::heap_bitmap_lock_); |
| GetHeap()->GetReferenceProcessor()->ProcessReferences(self, GetTimings()); |
| } |
| |
| void ConcurrentCopying::RevokeAllThreadLocalBuffers() { |
| TimingLogger::ScopedTiming t(__FUNCTION__, GetTimings()); |
| region_space_->RevokeAllThreadLocalBuffers(); |
| } |
| |
| mirror::Object* ConcurrentCopying::MarkFromReadBarrierWithMeasurements(Thread* const self, |
| mirror::Object* from_ref) { |
| if (self != thread_running_gc_) { |
| rb_slow_path_count_.fetch_add(1u, std::memory_order_relaxed); |
| } else { |
| rb_slow_path_count_gc_.fetch_add(1u, std::memory_order_relaxed); |
| } |
| ScopedTrace tr(__FUNCTION__); |
| const uint64_t start_time = measure_read_barrier_slow_path_ ? NanoTime() : 0u; |
| mirror::Object* ret = |
| Mark</*kGrayImmuneObject=*/true, /*kNoUnEvac=*/false, /*kFromGCThread=*/false>(self, |
| from_ref); |
| if (measure_read_barrier_slow_path_) { |
| rb_slow_path_ns_.fetch_add(NanoTime() - start_time, std::memory_order_relaxed); |
| } |
| return ret; |
| } |
| |
| void ConcurrentCopying::DumpPerformanceInfo(std::ostream& os) { |
| GarbageCollector::DumpPerformanceInfo(os); |
| size_t num_gc_cycles = GetCumulativeTimings().GetIterations(); |
| MutexLock mu(Thread::Current(), rb_slow_path_histogram_lock_); |
| if (rb_slow_path_time_histogram_.SampleSize() > 0) { |
| Histogram<uint64_t>::CumulativeData cumulative_data; |
| rb_slow_path_time_histogram_.CreateHistogram(&cumulative_data); |
| rb_slow_path_time_histogram_.PrintConfidenceIntervals(os, 0.99, cumulative_data); |
| } |
| if (rb_slow_path_count_total_ > 0) { |
| os << "Slow path count " << rb_slow_path_count_total_ << "\n"; |
| } |
| if (rb_slow_path_count_gc_total_ > 0) { |
| os << "GC slow path count " << rb_slow_path_count_gc_total_ << "\n"; |
| } |
| |
| os << "Average " << (young_gen_ ? "minor" : "major") << " GC reclaim bytes ratio " |
| << (reclaimed_bytes_ratio_sum_ / num_gc_cycles) << " over " << num_gc_cycles |
| << " GC cycles\n"; |
| |
| os << "Average " << (young_gen_ ? "minor" : "major") << " GC copied live bytes ratio " |
| << (copied_live_bytes_ratio_sum_ / gc_count_) << " over " << gc_count_ |
| << " " << (young_gen_ ? "minor" : "major") << " GCs\n"; |
| |
| os << "Cumulative bytes moved " << cumulative_bytes_moved_ << "\n"; |
| os << "Cumulative objects moved " << cumulative_objects_moved_ << "\n"; |
| |
| os << "Peak regions allocated " |
| << region_space_->GetMaxPeakNumNonFreeRegions() << " (" |
| << PrettySize(region_space_->GetMaxPeakNumNonFreeRegions() * space::RegionSpace::kRegionSize) |
| << ") / " << region_space_->GetNumRegions() / 2 << " (" |
| << PrettySize(region_space_->GetNumRegions() * space::RegionSpace::kRegionSize / 2) |
| << ")\n"; |
| if (!young_gen_) { |
| os << "Total madvise time " << PrettyDuration(region_space_->GetMadviseTime()) << "\n"; |
| } |
| } |
| |
| } // namespace collector |
| } // namespace gc |
| } // namespace art |