// Copyright 2009 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

// Garbage collector: sweeping

// The sweeper consists of two different algorithms:
//
// * The object reclaimer finds and frees unmarked slots in spans. It
//   can free a whole span if none of the objects are marked, but that
//   isn't its goal. This can be driven either synchronously by
//   mcentral.cacheSpan for mcentral spans, or asynchronously by
//   sweepone, which looks at all the mcentral lists.
//
// * The span reclaimer looks for spans that contain no marked objects
//   and frees whole spans. This is a separate algorithm because
//   freeing whole spans is the hardest task for the object reclaimer,
//   but is critical when allocating new spans. The entry point for
//   this is mheap_.reclaim and it's driven by a sequential scan of
//   the page marks bitmap in the heap arenas.
//
// Both algorithms ultimately call mspan.sweep, which sweeps a single
// heap span.

package runtime

import (
	"internal/abi"
	"internal/goexperiment"
	"runtime/internal/atomic"
	"unsafe"
)

// sweep is the global state of the background sweeper.
var sweep sweepdata

// State of background sweep.
type sweepdata struct {
	// lock is initialized by bgsweep and held by it while it updates
	// parked and parks itself.
	lock mutex
	// g is the background sweeper goroutine; bgsweep stores its own g here.
	g *g
	// parked is set to true by bgsweep, under lock, right before it parks.
	parked bool

	// active tracks outstanding sweepers and the sweep
	// termination condition.
	active activeSweep

	// centralIndex is the current unswept span class.
	// It represents an index into the mcentral span
	// sets. Accessed and updated via its load and
	// update methods. Not protected by a lock.
	//
	// Reset at mark termination.
	// Used by mheap.nextSpanForSweep.
	centralIndex sweepClass
}

// sweepClass is a spanClass and one bit to represent whether we're currently
// sweeping partial or full spans.
type sweepClass uint32 const ( numSweepClasses = numSpanClasses * 2 sweepClassDone sweepClass = sweepClass(^uint32(0)) ) func (s *sweepClass) load() sweepClass { return sweepClass(atomic.Load((*uint32)(s))) } func (s *sweepClass) update(sNew sweepClass) { // Only update *s if its current value is less than sNew, // since *s increases monotonically. sOld := s.load() for sOld < sNew && !atomic.Cas((*uint32)(s), uint32(sOld), uint32(sNew)) { sOld = s.load() } // TODO(mknyszek): This isn't the only place we have // an atomic monotonically increasing counter. It would // be nice to have an "atomic max" which is just implemented // as the above on most architectures. Some architectures // like RISC-V however have native support for an atomic max. } func (s *sweepClass) clear() { atomic.Store((*uint32)(s), 0) } // split returns the underlying span class as well as // whether we're interested in the full or partial // unswept lists for that class, indicated as a boolean // (true means "full"). func (s sweepClass) split() (spc spanClass, full bool) { return spanClass(s >> 1), s&1 == 0 } // nextSpanForSweep finds and pops the next span for sweeping from the // central sweep buffers. It returns ownership of the span to the caller. // Returns nil if no such span exists. func (h *mheap) nextSpanForSweep() *mspan { sg := h.sweepgen for sc := sweep.centralIndex.load(); sc < numSweepClasses; sc++ { spc, full := sc.split() c := &h.central[spc].mcentral var s *mspan if full { s = c.fullUnswept(sg).pop() } else { s = c.partialUnswept(sg).pop() } if s != nil { // Write down that we found something so future sweepers // can start from here. sweep.centralIndex.update(sc) return s } } // Write down that we found nothing. sweep.centralIndex.update(sweepClassDone) return nil } const sweepDrainedMask = 1 << 31 // activeSweep is a type that captures whether sweeping // is done, and whether there are any outstanding sweepers. 
// // Every potential sweeper must call begin() before they look // for work, and end() after they've finished sweeping. type activeSweep struct { // state is divided into two parts. // // The top bit (masked by sweepDrainedMask) is a boolean // value indicating whether all the sweep work has been // drained from the queue. // // The rest of the bits are a counter, indicating the // number of outstanding concurrent sweepers. state atomic.Uint32 } // begin registers a new sweeper. Returns a sweepLocker // for acquiring spans for sweeping. Any outstanding sweeper blocks // sweep termination. // // If the sweepLocker is invalid, the caller can be sure that all // outstanding sweep work has been drained, so there is nothing left // to sweep. Note that there may be sweepers currently running, so // this does not indicate that all sweeping has completed. // // Even if the sweepLocker is invalid, its sweepGen is always valid. func (a *activeSweep) begin() sweepLocker { for { state := a.state.Load() if state&sweepDrainedMask != 0 { return sweepLocker{mheap_.sweepgen, false} } if a.state.CompareAndSwap(state, state+1) { return sweepLocker{mheap_.sweepgen, true} } } } // end deregisters a sweeper. Must be called once for each time // begin is called if the sweepLocker is valid. 
func (a *activeSweep) end(sl sweepLocker) { if sl.sweepGen != mheap_.sweepgen { throw("sweeper left outstanding across sweep generations") } for { state := a.state.Load() if (state&^sweepDrainedMask)-1 >= sweepDrainedMask { throw("mismatched begin/end of activeSweep") } if a.state.CompareAndSwap(state, state-1) { if state != sweepDrainedMask { return } if debug.gcpacertrace > 0 { live := gcController.heapLive.Load() print("pacer: sweep done at heap size ", live>>20, "MB; allocated ", (live-mheap_.sweepHeapLiveBasis)>>20, "MB during sweep; swept ", mheap_.pagesSwept.Load(), " pages at ", mheap_.sweepPagesPerByte, " pages/byte\n") } return } } } // markDrained marks the active sweep cycle as having drained // all remaining work. This is safe to be called concurrently // with all other methods of activeSweep, though may race. // // Returns true if this call was the one that actually performed // the mark. func (a *activeSweep) markDrained() bool { for { state := a.state.Load() if state&sweepDrainedMask != 0 { return false } if a.state.CompareAndSwap(state, state|sweepDrainedMask) { return true } } } // sweepers returns the current number of active sweepers. func (a *activeSweep) sweepers() uint32 { return a.state.Load() &^ sweepDrainedMask } // isDone returns true if all sweep work has been drained and no more // outstanding sweepers exist. That is, when the sweep phase is // completely done. func (a *activeSweep) isDone() bool { return a.state.Load() == sweepDrainedMask } // reset sets up the activeSweep for the next sweep cycle. // // The world must be stopped. func (a *activeSweep) reset() { assertWorldStopped() a.state.Store(0) } // finishsweep_m ensures that all spans are swept. // // The world must be stopped. This ensures there are no sweeps in // progress. // //go:nowritebarrier func finishsweep_m() { assertWorldStopped() // Sweeping must be complete before marking commences, so // sweep any unswept spans. 
If this is a concurrent GC, there // shouldn't be any spans left to sweep, so this should finish // instantly. If GC was forced before the concurrent sweep // finished, there may be spans to sweep. for sweepone() != ^uintptr(0) { } // Make sure there aren't any outstanding sweepers left. // At this point, with the world stopped, it means one of two // things. Either we were able to preempt a sweeper, or that // a sweeper didn't call sweep.active.end when it should have. // Both cases indicate a bug, so throw. if sweep.active.sweepers() != 0 { throw("active sweepers found at start of mark phase") } // Reset all the unswept buffers, which should be empty. // Do this in sweep termination as opposed to mark termination // so that we can catch unswept spans and reclaim blocks as // soon as possible. sg := mheap_.sweepgen for i := range mheap_.central { c := &mheap_.central[i].mcentral c.partialUnswept(sg).reset() c.fullUnswept(sg).reset() } // Sweeping is done, so there won't be any new memory to // scavenge for a bit. // // If the scavenger isn't already awake, wake it up. There's // definitely work for it to do at this point. scavenger.wake() nextMarkBitArenaEpoch() } func bgsweep(c chan int) { sweep.g = getg() lockInit(&sweep.lock, lockRankSweep) lock(&sweep.lock) sweep.parked = true c <- 1 goparkunlock(&sweep.lock, waitReasonGCSweepWait, traceBlockGCSweep, 1) for { // bgsweep attempts to be a "low priority" goroutine by intentionally // yielding time. It's OK if it doesn't run, because goroutines allocating // memory will sweep and ensure that all spans are swept before the next // GC cycle. We really only want to run when we're idle. // // However, calling Gosched after each span swept produces a tremendous // amount of tracing events, sometimes up to 50% of events in a trace. It's // also inefficient to call into the scheduler so much because sweeping a // single span is in general a very fast operation, taking as little as 30 ns // on modern hardware. 
(See #54767.) // // As a result, bgsweep sweeps in batches, and only calls into the scheduler // at the end of every batch. Furthermore, it only yields its time if there // isn't spare idle time available on other cores. If there's available idle // time, helping to sweep can reduce allocation latencies by getting ahead of // the proportional sweeper and having spans ready to go for allocation. const sweepBatchSize = 10 nSwept := 0 for sweepone() != ^uintptr(0) { nSwept++ if nSwept%sweepBatchSize == 0 { goschedIfBusy() } } for freeSomeWbufs(true) { // N.B. freeSomeWbufs is already batched internally. goschedIfBusy() } lock(&sweep.lock) if !isSweepDone() { // This can happen if a GC runs between // gosweepone returning ^0 above // and the lock being acquired. unlock(&sweep.lock) continue } sweep.parked = true goparkunlock(&sweep.lock, waitReasonGCSweepWait, traceBlockGCSweep, 1) } } // sweepLocker acquires sweep ownership of spans. type sweepLocker struct { // sweepGen is the sweep generation of the heap. sweepGen uint32 valid bool } // sweepLocked represents sweep ownership of a span. type sweepLocked struct { *mspan } // tryAcquire attempts to acquire sweep ownership of span s. If it // successfully acquires ownership, it blocks sweep completion. func (l *sweepLocker) tryAcquire(s *mspan) (sweepLocked, bool) { if !l.valid { throw("use of invalid sweepLocker") } // Check before attempting to CAS. if atomic.Load(&s.sweepgen) != l.sweepGen-2 { return sweepLocked{}, false } // Attempt to acquire sweep ownership of s. if !atomic.Cas(&s.sweepgen, l.sweepGen-2, l.sweepGen-1) { return sweepLocked{}, false } return sweepLocked{s}, true } // sweepone sweeps some unswept heap span and returns the number of pages returned // to the heap, or ^uintptr(0) if there was nothing to sweep. 
func sweepone() uintptr {
	gp := getg()

	// Increment locks to ensure that the goroutine is not preempted
	// in the middle of sweep thus leaving the span in an inconsistent state for next GC
	gp.m.locks++

	// TODO(austin): sweepone is almost always called in a loop;
	// lift the sweepLocker into its callers.
	sl := sweep.active.begin()
	if !sl.valid {
		// All sweep work has already been drained.
		gp.m.locks--
		return ^uintptr(0)
	}

	// Find a span to sweep.
	npages := ^uintptr(0)
	var noMoreWork bool
	for {
		s := mheap_.nextSpanForSweep()
		if s == nil {
			// noMoreWork is true only if this call is the one that
			// set the drained flag.
			noMoreWork = sweep.active.markDrained()
			break
		}
		if state := s.state.get(); state != mSpanInUse {
			// This can happen if direct sweeping already
			// swept this span, but in that case the sweep
			// generation should always be up-to-date.
			if !(s.sweepgen == sl.sweepGen || s.sweepgen == sl.sweepGen+3) {
				print("runtime: bad span s.state=", state, " s.sweepgen=", s.sweepgen, " sweepgen=", sl.sweepGen, "\n")
				throw("non in-use span in unswept list")
			}
			continue
		}
		if s, ok := sl.tryAcquire(s); ok {
			// Sweep the span we found.
			npages = s.npages
			if s.sweep(false) {
				// Whole span was freed. Count it toward the
				// page reclaimer credit since these pages can
				// now be used for span allocation.
				mheap_.reclaimCredit.Add(npages)
			} else {
				// Span is still in-use, so this returned no
				// pages to the heap and the span needs to
				// move to the swept in-use list.
				npages = 0
			}
			break
		}
	}
	sweep.active.end(sl)

	if noMoreWork {
		// The sweep list is empty. There may still be
		// concurrent sweeps running, but we're at least very
		// close to done sweeping.

		// Move the scavenge gen forward (signaling
		// that there's new work to do) and wake the scavenger.
		//
		// The scavenger is signaled by the last sweeper because once
		// sweeping is done, we will definitely have useful work for
		// the scavenger to do, since the scavenger only runs over the
		// heap once per GC cycle. This update is not done during sweep
		// termination because in some cases there may be a long delay
		// between sweep done and sweep termination (e.g. not enough
		// allocations to trigger a GC) which would be nice to fill in
		// with scavenging work.
		if debug.scavtrace > 0 {
			systemstack(func() {
				lock(&mheap_.lock)

				// Get released stats.
				releasedBg := mheap_.pages.scav.releasedBg.Load()
				releasedEager := mheap_.pages.scav.releasedEager.Load()

				// Print the line.
				printScavTrace(releasedBg, releasedEager, false)

				// Update the stats.
				mheap_.pages.scav.releasedBg.Add(-releasedBg)
				mheap_.pages.scav.releasedEager.Add(-releasedEager)
				unlock(&mheap_.lock)
			})
		}
		scavenger.ready()
	}

	gp.m.locks--
	return npages
}

// isSweepDone reports whether all spans are swept.
//
// Note that this condition may transition from false to true at any
// time as the sweeper runs. It may transition from true to false if a
// GC runs; to prevent that the caller must be non-preemptible or must
// somehow block GC progress.
func isSweepDone() bool {
	return sweep.active.isDone()
}

// Returns only when span s has been swept.
//
//go:nowritebarrier
func (s *mspan) ensureSwept() {
	// Caller must disable preemption.
	// Otherwise when this function returns the span can become unswept again
	// (if GC is triggered on another goroutine).
	gp := getg()
	if gp.m.locks == 0 && gp.m.mallocing == 0 && gp != gp.m.g0 {
		throw("mspan.ensureSwept: m is not locked")
	}

	// If this operation fails, then that means that there are
	// no more spans to be swept. In this case, either s has already
	// been swept, or is about to be acquired for sweeping and swept.
	sl := sweep.active.begin()
	if sl.valid {
		// The caller must be sure that the span is a mSpanInUse span.
		if s, ok := sl.tryAcquire(s); ok {
			s.sweep(false)
			sweep.active.end(sl)
			return
		}
		sweep.active.end(sl)
	}

	// Unfortunately we can't sweep the span ourselves. Somebody else
	// got to it first. We don't have efficient means to wait, but that's
	// OK, it will be swept fairly soon.
	for {
		spangen := atomic.Load(&s.sweepgen)
		if spangen == sl.sweepGen || spangen == sl.sweepGen+3 {
			break
		}
		osyield()
	}
}

// sweep frees or collects finalizers for blocks not marked in the mark phase.
// It clears the mark bits in preparation for the next GC round.
// Returns true if the span was returned to heap.
// If preserve=true, don't return it to heap nor relink in mcentral lists;
// caller takes care of it.
func (sl *sweepLocked) sweep(preserve bool) bool {
	// It's critical that we enter this function with preemption disabled,
	// GC must not start while we are in the middle of this function.
	gp := getg()
	if gp.m.locks == 0 && gp.m.mallocing == 0 && gp != gp.m.g0 {
		throw("mspan.sweep: m is not locked")
	}

	s := sl.mspan
	if !preserve {
		// We'll release ownership of this span. Nil it out to
		// prevent the caller from accidentally using it.
		sl.mspan = nil
	}

	sweepgen := mheap_.sweepgen
	if state := s.state.get(); state != mSpanInUse || s.sweepgen != sweepgen-1 {
		print("mspan.sweep: state=", state, " sweepgen=", s.sweepgen, " mheap.sweepgen=", sweepgen, "\n")
		throw("mspan.sweep: bad span state")
	}

	trace := traceAcquire()
	if trace.ok() {
		trace.GCSweepSpan(s.npages * _PageSize)
		traceRelease(trace)
	}

	mheap_.pagesSwept.Add(int64(s.npages))

	spc := s.spanclass
	size := s.elemsize

	// The allocBits indicate which unmarked objects don't need to be
	// processed since they were free at the end of the last GC cycle
	// and were not allocated since then.
	// If the allocBits index is >= s.freeindex and the bit
	// is not marked then the object remains unallocated
	// since the last GC.
	// This situation is analogous to being on a freelist.

	// Unlink & free special records for any objects we're about to free.
	// Two complications here:
	// 1. An object can have both finalizer and profile special records.
	//    In such case we need to queue finalizer for execution,
	//    mark the object as live and preserve the profile special.
	// 2. A tiny object can have several finalizers setup for different offsets.
	//    If such object is not marked, we need to queue all finalizers at once.
	// Both 1 and 2 are possible at the same time.
	hadSpecials := s.specials != nil
	siter := newSpecialsIter(s)
	for siter.valid() {
		// A finalizer can be set for an inner byte of an object, find object beginning.
		objIndex := uintptr(siter.s.offset) / size
		p := s.base() + objIndex*size
		mbits := s.markBitsForIndex(objIndex)
		if !mbits.isMarked() {
			// This object is not marked and has at least one special record.
			// Pass 1: see if it has at least one finalizer.
			hasFin := false
			endOffset := p - s.base() + size
			for tmp := siter.s; tmp != nil && uintptr(tmp.offset) < endOffset; tmp = tmp.next {
				if tmp.kind == _KindSpecialFinalizer {
					// Stop freeing of object if it has a finalizer.
					mbits.setMarkedNonAtomic()
					hasFin = true
					break
				}
			}
			// Pass 2: queue all finalizers _or_ handle profile record.
			for siter.valid() && uintptr(siter.s.offset) < endOffset {
				// Find the exact byte for which the special was setup
				// (as opposed to object beginning).
				special := siter.s
				p := s.base() + uintptr(special.offset)
				if special.kind == _KindSpecialFinalizer || !hasFin {
					siter.unlinkAndNext()
					freeSpecial(special, unsafe.Pointer(p), size)
				} else {
					// The object has finalizers, so we're keeping it alive.
					// All other specials only apply when an object is freed,
					// so just keep the special record.
					siter.next()
				}
			}
		} else {
			// object is still live
			if siter.s.kind == _KindSpecialReachable {
				special := siter.unlinkAndNext()
				(*specialReachable)(unsafe.Pointer(special)).reachable = true
				freeSpecial(special, unsafe.Pointer(p), size)
			} else {
				// keep special record
				siter.next()
			}
		}
	}
	if hadSpecials && s.specials == nil {
		spanHasNoSpecials(s)
	}

	if debug.allocfreetrace != 0 || debug.clobberfree != 0 || raceenabled || msanenabled || asanenabled {
		// Find all newly freed objects. This doesn't have to be
		// efficient; allocfreetrace has massive overhead.
		mbits := s.markBitsForBase()
		abits := s.allocBitsForIndex(0)
		for i := uintptr(0); i < uintptr(s.nelems); i++ {
			// An object is newly freed if it is unmarked now but was
			// allocated before (below freeindex, or its alloc bit is set).
			if !mbits.isMarked() && (abits.index < uintptr(s.freeindex) || abits.isMarked()) {
				x := s.base() + i*s.elemsize
				if debug.allocfreetrace != 0 {
					tracefree(unsafe.Pointer(x), size)
				}
				if debug.clobberfree != 0 {
					clobberfree(unsafe.Pointer(x), size)
				}
				// User arenas are handled on explicit free.
				if raceenabled && !s.isUserArenaChunk {
					racefree(unsafe.Pointer(x), size)
				}
				if msanenabled && !s.isUserArenaChunk {
					msanfree(unsafe.Pointer(x), size)
				}
				if asanenabled && !s.isUserArenaChunk {
					asanpoison(unsafe.Pointer(x), size)
				}
			}
			mbits.advance()
			abits.advance()
		}
	}

	// Check for zombie objects.
	if s.freeindex < s.nelems {
		// Everything < freeindex is allocated and hence
		// cannot be zombies.
		//
		// Check the first bitmap byte, where we have to be
		// careful with freeindex.
		obj := uintptr(s.freeindex)
		if (*s.gcmarkBits.bytep(obj / 8)&^*s.allocBits.bytep(obj / 8))>>(obj%8) != 0 {
			s.reportZombies()
		}
		// Check remaining bytes.
		for i := obj/8 + 1; i < divRoundUp(uintptr(s.nelems), 8); i++ {
			if *s.gcmarkBits.bytep(i)&^*s.allocBits.bytep(i) != 0 {
				s.reportZombies()
			}
		}
	}

	// Count the number of free objects in this span.
	nalloc := uint16(s.countAlloc())
	nfreed := s.allocCount - nalloc
	if nalloc > s.allocCount {
		// The zombie check above should have caught this in
		// more detail.
		print("runtime: nelems=", s.nelems, " nalloc=", nalloc, " previous allocCount=", s.allocCount, " nfreed=", nfreed, "\n")
		throw("sweep increased allocation count")
	}

	s.allocCount = nalloc
	s.freeindex = 0 // reset allocation index to start of span.
	s.freeIndexForScan = 0
	if traceEnabled() {
		getg().m.p.ptr().trace.reclaimed += uintptr(nfreed) * s.elemsize
	}

	// gcmarkBits becomes the allocBits.
	// get a fresh cleared gcmarkBits in preparation for next GC
	s.allocBits = s.gcmarkBits
	s.gcmarkBits = newMarkBits(uintptr(s.nelems))

	// refresh pinnerBits if they exist
	if s.pinnerBits != nil {
		s.refreshPinnerBits()
	}

	// Initialize alloc bits cache.
	s.refillAllocCache(0)

	// The span must be in our exclusive ownership until we update sweepgen,
	// check for potential races.
	if state := s.state.get(); state != mSpanInUse || s.sweepgen != sweepgen-1 {
		print("mspan.sweep: state=", state, " sweepgen=", s.sweepgen, " mheap.sweepgen=", sweepgen, "\n")
		throw("mspan.sweep: bad span state after sweep")
	}
	if s.sweepgen == sweepgen+1 || s.sweepgen == sweepgen+3 {
		throw("swept cached span")
	}

	// We need to set s.sweepgen = h.sweepgen only when all blocks are swept,
	// because of the potential for a concurrent free/SetFinalizer.
	//
	// But we need to set it before we make the span available for allocation
	// (return it to heap or mcentral), because allocation code assumes that a
	// span is already swept if available for allocation.
	//
	// Serialization point.
	// At this point the mark bits are cleared and allocation ready
	// to go so release the span.
	atomic.Store(&s.sweepgen, sweepgen)

	if s.isUserArenaChunk {
		if preserve {
			// This is a case that should never be handled by a sweeper that
			// preserves the span for reuse.
			throw("sweep: tried to preserve a user arena span")
		}
		if nalloc > 0 {
			// There still exist pointers into the span or the span hasn't been
			// freed yet. It's not ready to be reused. Put it back on the
			// full swept list for the next cycle.
			mheap_.central[spc].mcentral.fullSwept(sweepgen).push(s)
			return false
		}

		// It's only at this point that the sweeper doesn't actually need to look
		// at this arena anymore, so subtract from pagesInUse now.
		mheap_.pagesInUse.Add(-s.npages)
		s.state.set(mSpanDead)

		// The arena is ready to be recycled. Remove it from the quarantine list
		// and place it on the ready list. Don't add it back to any sweep lists.
		systemstack(func() {
			// It's the arena code's responsibility to get the chunk on the quarantine
			// list by the time all references to the chunk are gone.
			if s.list != &mheap_.userArena.quarantineList {
				throw("user arena span is on the wrong list")
			}
			lock(&mheap_.lock)
			mheap_.userArena.quarantineList.remove(s)
			mheap_.userArena.readyList.insert(s)
			unlock(&mheap_.lock)
		})
		return false
	}

	if spc.sizeclass() != 0 {
		// Handle spans for small objects.
		if nfreed > 0 {
			// Only mark the span as needing zeroing if we've freed any
			// objects, because a fresh span that had been allocated into,
			// wasn't totally filled, but then swept, still has all of its
			// free slots zeroed.
			s.needzero = 1
			stats := memstats.heapStats.acquire()
			atomic.Xadd64(&stats.smallFreeCount[spc.sizeclass()], int64(nfreed))
			memstats.heapStats.release()

			// Count the frees in the inconsistent, internal stats.
			gcController.totalFree.Add(int64(nfreed) * int64(s.elemsize))
		}
		if !preserve {
			// The caller may not have removed this span from whatever
			// unswept set it's on but taken ownership of the span for
			// sweeping by updating sweepgen. If this span still is in
			// an unswept set, then the mcentral will pop it off the
			// set, check its sweepgen, and ignore it.
			if nalloc == 0 {
				// Free totally free span directly back to the heap.
				mheap_.freeSpan(s)
				return true
			}
			// Return span back to the right mcentral list.
			if nalloc == s.nelems {
				mheap_.central[spc].mcentral.fullSwept(sweepgen).push(s)
			} else {
				mheap_.central[spc].mcentral.partialSwept(sweepgen).push(s)
			}
		}
	} else if !preserve {
		// Handle spans for large objects.
		if nfreed != 0 {
			// Free large object span to heap.

			// NOTE(rsc,dvyukov): The original implementation of efence
			// in CL 22060046 used sysFree instead of sysFault, so that
			// the operating system would eventually give the memory
			// back to us again, so that an efence program could run
			// longer without running out of memory. Unfortunately,
			// calling sysFree here without any kind of adjustment of the
			// heap data structures means that when the memory does
			// come back to us, we have the wrong metadata for it, either in
			// the mspan structures or in the garbage collection bitmap.
			// Using sysFault here means that the program will run out of
			// memory fairly quickly in efence mode, but at least it won't
			// have mysterious crashes due to confused memory reuse.
			// It should be possible to switch back to sysFree if we also
			// implement and then call some kind of mheap.deleteSpan.
			if debug.efence > 0 {
				s.limit = 0 // prevent mlookup from finding this span
				sysFault(unsafe.Pointer(s.base()), size)
			} else {
				mheap_.freeSpan(s)
			}
			if goexperiment.AllocHeaders && s.largeType != nil && s.largeType.TFlag&abi.TFlagUnrolledBitmap != 0 {
				// In the allocheaders experiment, the unrolled GCProg bitmap is allocated separately.
				// Free the space for the unrolled bitmap.
				systemstack(func() {
					s := spanOf(uintptr(unsafe.Pointer(s.largeType)))
					mheap_.freeManual(s, spanAllocPtrScalarBits)
				})
				// Make sure to zero this pointer without putting the old
				// value in a write buffer, as the old value might be an
				// invalid pointer. See arena.go:(*mheap).allocUserArenaChunk.
				*(*uintptr)(unsafe.Pointer(&s.largeType)) = 0
			}

			// Count the free in the consistent, external stats.
			stats := memstats.heapStats.acquire()
			atomic.Xadd64(&stats.largeFreeCount, 1)
			atomic.Xadd64(&stats.largeFree, int64(size))
			memstats.heapStats.release()

			// Count the free in the inconsistent, internal stats.
			gcController.totalFree.Add(int64(size))

			return true
		}

		// Add a large span directly onto the full+swept list.
		mheap_.central[spc].mcentral.fullSwept(sweepgen).push(s)
	}
	return false
}

// reportZombies reports any marked but free objects in s and throws.
//
// This generally means one of the following:
//
// 1. User code converted a pointer to a uintptr and then back
// unsafely, and a GC ran while the uintptr was the only reference to
// an object.
//
// 2. User code (or a compiler bug) constructed a bad pointer that
// points to a free slot, often a past-the-end pointer.
//
// 3. The GC two cycles ago missed a pointer and freed a live object,
// but it was still live in the last cycle, so this GC cycle found a
// pointer to that object and marked it.
func (s *mspan) reportZombies() {
	printlock()
	print("runtime: marked free object in span ", s, ", elemsize=", s.elemsize, " freeindex=", s.freeindex, " (bad use of unsafe.Pointer? try -d=checkptr)\n")
	mbits := s.markBitsForBase()
	abits := s.allocBitsForIndex(0)
	// Print one line per object slot: address, alloc/free, marked/unmarked,
	// and a hex dump (capped at 1024 bytes) for each zombie.
	for i := uintptr(0); i < uintptr(s.nelems); i++ {
		addr := s.base() + i*s.elemsize
		print(hex(addr))
		alloc := i < uintptr(s.freeindex) || abits.isMarked()
		if alloc {
			print(" alloc")
		} else {
			print(" free ")
		}
		if mbits.isMarked() {
			print(" marked  ")
		} else {
			print(" unmarked")
		}
		zombie := mbits.isMarked() && !alloc
		if zombie {
			print(" zombie")
		}
		print("\n")
		if zombie {
			length := s.elemsize
			if length > 1024 {
				length = 1024
			}
			hexdumpWords(addr, addr+length, nil)
		}
		mbits.advance()
		abits.advance()
	}
	throw("found pointer to free object")
}

// deductSweepCredit deducts sweep credit for allocating a span of
// size spanBytes. This must be performed *before* the span is
// allocated to ensure the system has enough credit.
If necessary, it // performs sweeping to prevent going in to debt. If the caller will // also sweep pages (e.g., for a large allocation), it can pass a // non-zero callerSweepPages to leave that many pages unswept. // // deductSweepCredit makes a worst-case assumption that all spanBytes // bytes of the ultimately allocated span will be available for object // allocation. // // deductSweepCredit is the core of the "proportional sweep" system. // It uses statistics gathered by the garbage collector to perform // enough sweeping so that all pages are swept during the concurrent // sweep phase between GC cycles. // // mheap_ must NOT be locked. func deductSweepCredit(spanBytes uintptr, callerSweepPages uintptr) { if mheap_.sweepPagesPerByte == 0 { // Proportional sweep is done or disabled. return } trace := traceAcquire() if trace.ok() { trace.GCSweepStart() traceRelease(trace) } // Fix debt if necessary. retry: sweptBasis := mheap_.pagesSweptBasis.Load() live := gcController.heapLive.Load() liveBasis := mheap_.sweepHeapLiveBasis newHeapLive := spanBytes if liveBasis < live { // Only do this subtraction when we don't overflow. Otherwise, pagesTarget // might be computed as something really huge, causing us to get stuck // sweeping here until the next mark phase. // // Overflow can happen here if gcPaceSweeper is called concurrently with // sweeping (i.e. not during a STW, like it usually is) because this code // is intentionally racy. A concurrent call to gcPaceSweeper can happen // if a GC tuning parameter is modified and we read an older value of // heapLive than what was used to set the basis. // // This state should be transient, so it's fine to just let newHeapLive // be a relatively small number. We'll probably just skip this attempt to // sweep. // // See issue #57523. 
newHeapLive += uintptr(live - liveBasis) } pagesTarget := int64(mheap_.sweepPagesPerByte*float64(newHeapLive)) - int64(callerSweepPages) for pagesTarget > int64(mheap_.pagesSwept.Load()-sweptBasis) { if sweepone() == ^uintptr(0) { mheap_.sweepPagesPerByte = 0 break } if mheap_.pagesSweptBasis.Load() != sweptBasis { // Sweep pacing changed. Recompute debt. goto retry } } trace = traceAcquire() if trace.ok() { trace.GCSweepDone() traceRelease(trace) } } // clobberfree sets the memory content at x to bad content, for debugging // purposes. func clobberfree(x unsafe.Pointer, size uintptr) { // size (span.elemsize) is always a multiple of 4. for i := uintptr(0); i < size; i += 4 { *(*uint32)(add(x, i)) = 0xdeadbeef } } // gcPaceSweeper updates the sweeper's pacing parameters. // // Must be called whenever the GC's pacing is updated. // // The world must be stopped, or mheap_.lock must be held. func gcPaceSweeper(trigger uint64) { assertWorldStoppedOrLockHeld(&mheap_.lock) // Update sweep pacing. if isSweepDone() { mheap_.sweepPagesPerByte = 0 } else { // Concurrent sweep needs to sweep all of the in-use // pages by the time the allocated heap reaches the GC // trigger. Compute the ratio of in-use pages to sweep // per byte allocated, accounting for the fact that // some might already be swept. heapLiveBasis := gcController.heapLive.Load() heapDistance := int64(trigger) - int64(heapLiveBasis) // Add a little margin so rounding errors and // concurrent sweep are less likely to leave pages // unswept when GC starts. 
heapDistance -= 1024 * 1024 if heapDistance < _PageSize { // Avoid setting the sweep ratio extremely high heapDistance = _PageSize } pagesSwept := mheap_.pagesSwept.Load() pagesInUse := mheap_.pagesInUse.Load() sweepDistancePages := int64(pagesInUse) - int64(pagesSwept) if sweepDistancePages <= 0 { mheap_.sweepPagesPerByte = 0 } else { mheap_.sweepPagesPerByte = float64(sweepDistancePages) / float64(heapDistance) mheap_.sweepHeapLiveBasis = heapLiveBasis // Write pagesSweptBasis last, since this // signals concurrent sweeps to recompute // their debt. mheap_.pagesSweptBasis.Store(pagesSwept) } } }