runtime: implement a simple mark/sweep garbage collector
Этот коммит содержится в:
родитель
dbf581b56d
коммит
8402e84b6d
7 изменённых файлов: 477 добавлений и 3 удалений
2
main.go
2
main.go
|
@ -435,7 +435,7 @@ func handleCompilerError(err error) {
|
|||
func main() {
|
||||
outpath := flag.String("o", "", "output filename")
|
||||
opt := flag.String("opt", "z", "optimization level: 0, 1, 2, s, z")
|
||||
gc := flag.String("gc", "dumb", "garbage collector to use (none, dumb)")
|
||||
gc := flag.String("gc", "", "garbage collector to use (none, dumb, marksweep)")
|
||||
printIR := flag.Bool("printir", false, "print LLVM IR")
|
||||
dumpSSA := flag.Bool("dumpssa", false, "dump internal Go SSA")
|
||||
target := flag.String("target", "", "LLVM target")
|
||||
|
|
10
main_test.go
10
main_test.go
|
@ -58,9 +58,19 @@ func runTest(path, tmpdir string, target string, t *testing.T) {
|
|||
t.Fatal("could not read expected output file:", err)
|
||||
}
|
||||
|
||||
var gc string
|
||||
if target == "qemu" {
|
||||
// make sure testdata/gc.go passes
|
||||
gc = "marksweep"
|
||||
} else {
|
||||
// pick the default heap implementation
|
||||
gc = ""
|
||||
}
|
||||
|
||||
// Build the test binary.
|
||||
config := &BuildConfig{
|
||||
opt: "z",
|
||||
gc: gc,
|
||||
printIR: false,
|
||||
dumpSSA: false,
|
||||
debug: false,
|
||||
|
|
|
@ -4,6 +4,8 @@ package runtime
|
|||
|
||||
import (
|
||||
"unsafe"
|
||||
|
||||
"device/arm"
|
||||
)
|
||||
|
||||
const GOARCH = "arm"
|
||||
|
@ -17,12 +19,28 @@ var heapStartSymbol unsafe.Pointer
|
|||
//go:extern _heap_end
|
||||
var heapEndSymbol unsafe.Pointer
|
||||
|
||||
//go:extern _globals_start
|
||||
var globalsStartSymbol unsafe.Pointer
|
||||
|
||||
//go:extern _globals_end
|
||||
var globalsEndSymbol unsafe.Pointer
|
||||
|
||||
//go:extern _stack_top
|
||||
var stackTopSymbol unsafe.Pointer
|
||||
|
||||
var (
|
||||
heapStart = uintptr(unsafe.Pointer(&heapStartSymbol))
|
||||
heapEnd = uintptr(unsafe.Pointer(&heapEndSymbol))
|
||||
heapStart = uintptr(unsafe.Pointer(&heapStartSymbol))
|
||||
heapEnd = uintptr(unsafe.Pointer(&heapEndSymbol))
|
||||
globalsStart = uintptr(unsafe.Pointer(&globalsStartSymbol))
|
||||
globalsEnd = uintptr(unsafe.Pointer(&globalsEndSymbol))
|
||||
stackTop = uintptr(unsafe.Pointer(&stackTopSymbol))
|
||||
)
|
||||
|
||||
// Align on word boundary.
|
||||
func align(ptr uintptr) uintptr {
|
||||
return (ptr + 3) &^ 3
|
||||
}
|
||||
|
||||
func getCurrentStackPointer() uintptr {
|
||||
return arm.ReadRegister("sp")
|
||||
}
|
||||
|
|
384
src/runtime/gc_marksweep.go
Обычный файл
384
src/runtime/gc_marksweep.go
Обычный файл
|
@ -0,0 +1,384 @@
|
|||
// +build gc.marksweep
|
||||
|
||||
package runtime
|
||||
|
||||
// This memory manager is a textbook mark/sweep implementation, heavily inspired
|
||||
// by the MicroPython garbage collector.
|
||||
//
|
||||
// The memory manager internally uses blocks of 4 pointers big (see
|
||||
// bytesPerBlock). Every allocation first rounds up to this size to align every
|
||||
// block. It will first try to find a chain of blocks that is big enough to
|
||||
// satisfy the allocation. If it finds one, it marks the first one as the "head"
|
||||
// and the following ones (if any) as the "tail" (see below). If it cannot find
|
||||
// any free space, it will perform a garbage collection cycle and try again. If
|
||||
// it still cannot find any free space, it gives up.
|
||||
//
|
||||
// Every block has some metadata, which is stored at the beginning of the heap.
|
||||
// The four states are "free", "head", "tail", and "mark". During normal
|
||||
// operation, there are no marked blocks. Every allocated object starts with a
|
||||
// "head" and is followed by "tail" blocks. The reason for this distinction is
|
||||
// that this way, the start and end of every object can be found easily.
|
||||
//
|
||||
// Metadata is stored in a special area at the beginning of the heap, in the
|
||||
// area heapStart..poolStart. The actual blocks are stored in
|
||||
// poolStart..heapEnd.
|
||||
//
|
||||
// More information:
|
||||
// https://github.com/micropython/micropython/wiki/Memory-Manager
|
||||
// "The Garbage Collection Handbook" by Richard Jones, Antony Hosking, Eliot
|
||||
// Moss.
|
||||
|
||||
import (
|
||||
"unsafe"
|
||||
)
|
||||
|
||||
// Set gcDebug to true to print debug information.
|
||||
const (
|
||||
gcDebug = false // print debug info
|
||||
gcAsserts = gcDebug // perform sanity checks
|
||||
)
|
||||
|
||||
// Some globals + constants for the entire GC.
|
||||
|
||||
const (
|
||||
wordsPerBlock = 4 // number of pointers in an allocated block
|
||||
bytesPerBlock = wordsPerBlock * unsafe.Sizeof(heapStart)
|
||||
stateBits = 2 // how many bits a block state takes (see blockState type)
|
||||
blocksPerStateByte = 8 / stateBits
|
||||
)
|
||||
|
||||
var (
|
||||
poolStart uintptr // the first heap pointer
|
||||
nextAlloc gcBlock // the next block that should be tried by the allocator
|
||||
endBlock gcBlock // the block just past the end of the available space
|
||||
)
|
||||
|
||||
// zeroSizedAlloc is just a sentinel that gets returned when allocating 0 bytes.
|
||||
var zeroSizedAlloc uint8
|
||||
|
||||
// Provide some abstraction over heap blocks.
|
||||
|
||||
// blockState stores the four states in which a block can be. It is two bits in
|
||||
// size.
|
||||
type blockState uint8
|
||||
|
||||
const (
|
||||
blockStateFree blockState = 0 // 00
|
||||
blockStateHead blockState = 1 // 01
|
||||
blockStateTail blockState = 2 // 10
|
||||
blockStateMark blockState = 3 // 11
|
||||
blockStateMask blockState = 3 // 11
|
||||
)
|
||||
|
||||
// String returns a human-readable version of the block state, for debugging.
|
||||
func (s blockState) String() string {
|
||||
switch s {
|
||||
case blockStateFree:
|
||||
return "free"
|
||||
case blockStateHead:
|
||||
return "head"
|
||||
case blockStateTail:
|
||||
return "tail"
|
||||
case blockStateMark:
|
||||
return "mark"
|
||||
default:
|
||||
// must never happen
|
||||
return "!err"
|
||||
}
|
||||
}
|
||||
|
||||
// The block number in the pool.
|
||||
type gcBlock uintptr
|
||||
|
||||
// blockFromAddr returns a block given an address somewhere in the heap (which
|
||||
// might not be heap-aligned).
|
||||
func blockFromAddr(addr uintptr) gcBlock {
|
||||
return gcBlock((addr - poolStart) / bytesPerBlock)
|
||||
}
|
||||
|
||||
// Return a pointer to the start of the allocated object.
|
||||
func (b gcBlock) pointer() unsafe.Pointer {
|
||||
return unsafe.Pointer(b.address())
|
||||
}
|
||||
|
||||
// Return the address of the start of the allocated object.
|
||||
func (b gcBlock) address() uintptr {
|
||||
return poolStart + uintptr(b)*bytesPerBlock
|
||||
}
|
||||
|
||||
// findHead returns the head (first block) of an object, assuming the block
|
||||
// points to an allocated object. It returns the same block if this block
|
||||
// already points to the head.
|
||||
func (b gcBlock) findHead() gcBlock {
|
||||
for b.state() == blockStateTail {
|
||||
b--
|
||||
}
|
||||
return b
|
||||
}
|
||||
|
||||
// findNext returns the first block just past the end of the tail. This may or
|
||||
// may not be the head of an object.
|
||||
func (b gcBlock) findNext() gcBlock {
|
||||
if b.state() == blockStateHead {
|
||||
b++
|
||||
}
|
||||
for b.state() == blockStateTail {
|
||||
b++
|
||||
}
|
||||
return b
|
||||
}
|
||||
|
||||
// State returns the current block state.
|
||||
func (b gcBlock) state() blockState {
|
||||
stateBytePtr := (*uint8)(unsafe.Pointer(heapStart + uintptr(b/blocksPerStateByte)))
|
||||
return blockState(*stateBytePtr>>((b%blocksPerStateByte)*2)) % 4
|
||||
}
|
||||
|
||||
// setState sets the current block to the given state, which must contain more
|
||||
// bits than the current state. Allowed transitions: from free to any state and
|
||||
// from head to mark.
|
||||
func (b gcBlock) setState(newState blockState) {
|
||||
stateBytePtr := (*uint8)(unsafe.Pointer(heapStart + uintptr(b/blocksPerStateByte)))
|
||||
*stateBytePtr |= uint8(newState << ((b % blocksPerStateByte) * 2))
|
||||
if gcAsserts && b.state() != newState {
|
||||
runtimePanic("gc: setState() was not successful")
|
||||
}
|
||||
}
|
||||
|
||||
// markFree sets the block state to free, no matter what state it was in before.
|
||||
func (b gcBlock) markFree() {
|
||||
stateBytePtr := (*uint8)(unsafe.Pointer(heapStart + uintptr(b/blocksPerStateByte)))
|
||||
*stateBytePtr &^= uint8(blockStateMask << ((b % blocksPerStateByte) * 2))
|
||||
if gcAsserts && b.state() != blockStateFree {
|
||||
runtimePanic("gc: markFree() was not successful")
|
||||
}
|
||||
}
|
||||
|
||||
// unmark changes the state of the block from mark to head. It must be marked
|
||||
// before calling this function.
|
||||
func (b gcBlock) unmark() {
|
||||
if gcAsserts && b.state() != blockStateMark {
|
||||
runtimePanic("gc: unmark() on a block that is not marked")
|
||||
}
|
||||
clearMask := blockStateMask ^ blockStateHead // the bits to clear from the state
|
||||
stateBytePtr := (*uint8)(unsafe.Pointer(heapStart + uintptr(b/blocksPerStateByte)))
|
||||
*stateBytePtr &^= uint8(clearMask << ((b % blocksPerStateByte) * 2))
|
||||
if gcAsserts && b.state() != blockStateHead {
|
||||
runtimePanic("gc: unmark() was not successful")
|
||||
}
|
||||
}
|
||||
|
||||
// Initialize the memory allocator.
|
||||
// No memory may be allocated before this is called. That means the runtime and
|
||||
// any packages the runtime depends upon may not allocate memory during package
|
||||
// initialization.
|
||||
func init() {
|
||||
totalSize := heapEnd - heapStart
|
||||
|
||||
// Allocate some memory to keep 2 bits of information about every block.
|
||||
metadataSize := totalSize / (blocksPerStateByte * bytesPerBlock)
|
||||
|
||||
// Align the pool.
|
||||
poolStart = (heapStart + metadataSize + (bytesPerBlock - 1)) &^ (bytesPerBlock - 1)
|
||||
poolEnd := heapEnd &^ (bytesPerBlock - 1)
|
||||
numBlocks := (poolEnd - poolStart) / bytesPerBlock
|
||||
endBlock = gcBlock(numBlocks)
|
||||
if gcDebug {
|
||||
println("heapStart: ", heapStart)
|
||||
println("heapEnd: ", heapEnd)
|
||||
println("total size: ", totalSize)
|
||||
println("metadata size: ", metadataSize)
|
||||
println("poolStart: ", poolStart)
|
||||
println("# of blocks: ", numBlocks)
|
||||
println("# of block states:", metadataSize*blocksPerStateByte)
|
||||
}
|
||||
if gcAsserts && metadataSize*blocksPerStateByte < numBlocks {
|
||||
// sanity check
|
||||
runtimePanic("gc: metadata array is too small")
|
||||
}
|
||||
|
||||
// Set all block states to 'free'.
|
||||
memzero(unsafe.Pointer(heapStart), metadataSize)
|
||||
}
|
||||
|
||||
// alloc tries to find some free space on the heap, possibly doing a garbage
|
||||
// collection cycle if needed. If no space is free, it panics.
|
||||
func alloc(size uintptr) unsafe.Pointer {
|
||||
if size == 0 {
|
||||
return unsafe.Pointer(&zeroSizedAlloc)
|
||||
}
|
||||
|
||||
neededBlocks := (size + (bytesPerBlock - 1)) / bytesPerBlock
|
||||
|
||||
// Continue looping until a run of free blocks has been found that fits the
|
||||
// requested size.
|
||||
index := nextAlloc
|
||||
numFreeBlocks := uintptr(0)
|
||||
heapScanCount := uint8(0)
|
||||
for {
|
||||
if index == nextAlloc {
|
||||
if heapScanCount == 0 {
|
||||
heapScanCount = 1
|
||||
} else if heapScanCount == 1 {
|
||||
// The entire heap has been searched for free memory, but none
|
||||
// could be found. Run a garbage collection cycle to reclaim
|
||||
// free memory and try again.
|
||||
heapScanCount = 2
|
||||
GC()
|
||||
} else {
|
||||
// Even after garbage collection, no free memory could be found.
|
||||
runtimePanic("out of memory")
|
||||
}
|
||||
}
|
||||
|
||||
// Wrap around the end of the heap.
|
||||
if index == endBlock {
|
||||
index = 0
|
||||
// Reset numFreeBlocks as allocations cannot wrap.
|
||||
numFreeBlocks = 0
|
||||
}
|
||||
|
||||
// Is the block we're looking at free?
|
||||
if index.state() != blockStateFree {
|
||||
// This block is in use. Try again from this point.
|
||||
numFreeBlocks = 0
|
||||
index++
|
||||
continue
|
||||
}
|
||||
numFreeBlocks++
|
||||
index++
|
||||
|
||||
// Are we finished?
|
||||
if numFreeBlocks == neededBlocks {
|
||||
// Found a big enough range of free blocks!
|
||||
nextAlloc = index
|
||||
thisAlloc := index - gcBlock(neededBlocks)
|
||||
if gcDebug {
|
||||
println("found memory:", thisAlloc.pointer(), int(size))
|
||||
}
|
||||
|
||||
// Set the following blocks as being allocated.
|
||||
thisAlloc.setState(blockStateHead)
|
||||
for i := thisAlloc + 1; i != nextAlloc; i++ {
|
||||
i.setState(blockStateTail)
|
||||
}
|
||||
|
||||
// Return a pointer to this allocation.
|
||||
pointer := thisAlloc.pointer()
|
||||
memzero(pointer, size)
|
||||
return pointer
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
func free(ptr unsafe.Pointer) {
|
||||
// TODO: free blocks on request, when the compiler knows they're unused.
|
||||
}
|
||||
|
||||
// GC performs a garbage collection cycle.
|
||||
func GC() {
|
||||
if gcDebug {
|
||||
println("running collection cycle...")
|
||||
}
|
||||
|
||||
// Mark phase: mark all reachable objects, recursively.
|
||||
markRoots(globalsStart, globalsEnd)
|
||||
markRoots(getCurrentStackPointer(), stackTop) // assume a descending stack
|
||||
|
||||
// Sweep phase: free all non-marked objects and unmark marked objects for
|
||||
// the next collection cycle.
|
||||
sweep()
|
||||
|
||||
// Show how much has been sweeped, for debugging.
|
||||
if gcDebug {
|
||||
dumpHeap()
|
||||
}
|
||||
}
|
||||
|
||||
// markRoots reads all pointers from start to end (exclusive) and if they look
|
||||
// like a heap pointer and are unmarked, marks them and scans that object as
|
||||
// well (recursively). The start and end parameters must be valid pointers and
|
||||
// must be aligned.
|
||||
func markRoots(start, end uintptr) {
|
||||
if gcDebug {
|
||||
println("mark from", start, "to", end, int(end-start))
|
||||
}
|
||||
|
||||
for addr := start; addr != end; addr += unsafe.Sizeof(addr) {
|
||||
root := *(*uintptr)(unsafe.Pointer(addr))
|
||||
if looksLikePointer(root) {
|
||||
block := blockFromAddr(root)
|
||||
head := block.findHead()
|
||||
if head.state() != blockStateMark {
|
||||
if gcDebug {
|
||||
println("found unmarked pointer", root, "at address", addr)
|
||||
}
|
||||
head.setState(blockStateMark)
|
||||
next := block.findNext()
|
||||
// TODO: avoid recursion as much as possible
|
||||
markRoots(head.address(), next.address())
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Sweep goes through all memory and frees unmarked memory.
|
||||
func sweep() {
|
||||
freeCurrentObject := false
|
||||
for block := gcBlock(0); block < endBlock; block++ {
|
||||
switch block.state() {
|
||||
case blockStateHead:
|
||||
// Unmarked head. Free it, including all tail blocks following it.
|
||||
block.markFree()
|
||||
freeCurrentObject = true
|
||||
case blockStateTail:
|
||||
if freeCurrentObject {
|
||||
// This is a tail object following an unmarked head.
|
||||
// Free it now.
|
||||
block.markFree()
|
||||
}
|
||||
case blockStateMark:
|
||||
// This is a marked object. The next tail blocks must not be freed,
|
||||
// but the mark bit must be removed so the next GC cycle will
|
||||
// collect this object if it is unreferenced then.
|
||||
block.unmark()
|
||||
freeCurrentObject = false
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// looksLikePointer returns whether this could be a pointer. Currently, it
|
||||
// simply returns whether it lies anywhere in the heap. Go allows interior
|
||||
// pointers so we can't check alignment or anything like that.
|
||||
func looksLikePointer(ptr uintptr) bool {
|
||||
return ptr >= poolStart && ptr < heapEnd
|
||||
}
|
||||
|
||||
// dumpHeap can be used for debugging purposes. It dumps the state of each heap
|
||||
// block to standard output.
|
||||
func dumpHeap() {
|
||||
println("heap:")
|
||||
for block := gcBlock(0); block < endBlock; block++ {
|
||||
switch block.state() {
|
||||
case blockStateHead:
|
||||
print("*")
|
||||
case blockStateTail:
|
||||
print("-")
|
||||
case blockStateMark:
|
||||
print("#")
|
||||
default: // free
|
||||
print("·")
|
||||
}
|
||||
if block%64 == 63 || block+1 == endBlock {
|
||||
println()
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
func KeepAlive(x interface{}) {
|
||||
// Unimplemented. Only required with SetFinalizer().
|
||||
}
|
||||
|
||||
func SetFinalizer(obj interface{}, finalizer interface{}) {
|
||||
// Unimplemented.
|
||||
}
|
|
@ -58,3 +58,5 @@ SECTIONS
|
|||
/* For the memory allocator. */
|
||||
_heap_start = _ebss;
|
||||
_heap_end = ORIGIN(RAM) + LENGTH(RAM);
|
||||
_globals_start = _sdata;
|
||||
_globals_end = _ebss;
|
||||
|
|
59
testdata/gc.go
предоставленный
Обычный файл
59
testdata/gc.go
предоставленный
Обычный файл
|
@ -0,0 +1,59 @@
|
|||
package main
|
||||
|
||||
var xorshift32State uint32 = 1
|
||||
|
||||
func xorshift32(x uint32) uint32 {
|
||||
// Algorithm "xor" from p. 4 of Marsaglia, "Xorshift RNGs"
|
||||
x ^= x << 13
|
||||
x ^= x >> 17
|
||||
x ^= x << 5
|
||||
return x
|
||||
}
|
||||
|
||||
func randuint32() uint32 {
|
||||
xorshift32State = xorshift32(xorshift32State)
|
||||
return xorshift32State
|
||||
}
|
||||
|
||||
func main() {
|
||||
testNonPointerHeap()
|
||||
}
|
||||
|
||||
var scalarSlices [4][]byte
|
||||
var randSeeds [4]uint32
|
||||
|
||||
func testNonPointerHeap() {
|
||||
// Allocate roughly 0.5MB of memory.
|
||||
for i := 0; i < 1000; i++ {
|
||||
// Pick a random index that the optimizer can't predict.
|
||||
index := randuint32() % 4
|
||||
|
||||
// Check whether the contents of the previous allocation was correct.
|
||||
rand := randSeeds[index]
|
||||
for _, b := range scalarSlices[index] {
|
||||
rand = xorshift32(rand)
|
||||
if b != byte(rand) {
|
||||
panic("memory was overwritten!")
|
||||
}
|
||||
}
|
||||
|
||||
// Allocate a randomly-sized slice, randomly sliced to be smaller.
|
||||
sliceLen := randuint32() % 1024
|
||||
slice := make([]byte, sliceLen)
|
||||
cutLen := randuint32() % 1024
|
||||
if cutLen < sliceLen {
|
||||
slice = slice[cutLen:]
|
||||
}
|
||||
scalarSlices[index] = slice
|
||||
|
||||
// Fill the slice with a pattern that looks random but is easily
|
||||
// calculated and verified.
|
||||
rand = randuint32() + 1
|
||||
randSeeds[index] = rand
|
||||
for i := 0; i < len(slice); i++ {
|
||||
rand = xorshift32(rand)
|
||||
slice[i] = byte(rand)
|
||||
}
|
||||
}
|
||||
println("ok")
|
||||
}
|
1
testdata/gc.txt
предоставленный
Обычный файл
1
testdata/gc.txt
предоставленный
Обычный файл
|
@ -0,0 +1 @@
|
|||
ok
|
Загрузка…
Создание таблицы
Сослаться в новой задаче