123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269 |
- #
- #
- # Nim's Runtime Library
- # (c) Copyright 2013 Andreas Rumpf
- #
- # See the file "copying.txt", included in this
- # distribution, for details about the copyright.
- #
- #[
- Efficient set of pointers for the GC (and repr)
- -----------------------------------------------
- The GC depends on an extremely efficient datastructure for storing a
- set of pointers - this is called a `CellSet` in the source code.
- Inserting, deleting and searching are done in constant time. However,
- modifying a `CellSet` during traversal leads to undefined behaviour.
- All operations on a CellSet have to perform efficiently. Because a Cellset can
- become huge a hash table alone is not suitable for this.
- We use a mixture of bitset and hash table for this. The hash table maps *pages*
- to a page descriptor. The page descriptor contains a bit for any possible cell
- address within this page. So including a cell is done as follows:
- - Find the page descriptor for the page the cell belongs to.
- - Set the appropriate bit in the page descriptor indicating that the
- cell points to the start of a memory block.
- Removing a cell is analogous - the bit has to be set to zero.
- Single page descriptors are never deleted from the hash table. This is not
- needed as the data structures needs to be rebuilt periodically anyway.
- Complete traversal is done in this way::
- for each page descriptor d:
- for each bit in d:
- if bit == 1:
- traverse the pointer belonging to this bit
- ]#
- when defined(gcOrc) or defined(gcArc):
- type
- PCell = Cell
- when not declaredInScope(PageShift):
- include bitmasks
- else:
- type
- RefCount = int
- Cell {.pure.} = object
- refcount: RefCount # the refcount and some flags
- typ: PNimType
- when trackAllocationSource:
- filename: cstring
- line: int
- when useCellIds:
- id: int
- PCell = ptr Cell
- type
- PPageDesc = ptr PageDesc
- BitIndex = range[0..UnitsPerPage-1]
- PageDesc {.final, pure.} = object
- next: PPageDesc # all nodes are connected with this pointer
- key: uint # start address at bit 0
- bits: array[BitIndex, int] # a bit vector
- PPageDescArray = ptr UncheckedArray[PPageDesc]
- CellSet {.final, pure.} = object
- counter, max: int
- head: PPageDesc
- data: PPageDescArray
- when defined(gcOrc) or defined(gcArc):
- discard
- else:
- include cellseqs_v1
- # ------------------- cell set handling ---------------------------------------
- const
- InitCellSetSize = 1024 # must be a power of two!
- proc init(s: var CellSet) =
- s.data = cast[PPageDescArray](alloc0(InitCellSetSize * sizeof(PPageDesc)))
- s.max = InitCellSetSize-1
- s.counter = 0
- s.head = nil
- proc deinit(s: var CellSet) =
- var it = s.head
- while it != nil:
- var n = it.next
- dealloc(it)
- it = n
- s.head = nil # play it safe here
- dealloc(s.data)
- s.data = nil
- s.counter = 0
- proc nextTry(h, maxHash: int): int {.inline.} =
- result = ((5*h) + 1) and maxHash
- # For any initial h in range(maxHash), repeating that maxHash times
- # generates each int in range(maxHash) exactly once (see any text on
- # random-number generation for proof).
- proc cellSetGet(t: CellSet, key: uint): PPageDesc =
- var h = cast[int](key) and t.max
- while t.data[h] != nil:
- if t.data[h].key == key: return t.data[h]
- h = nextTry(h, t.max)
- return nil
- proc cellSetRawInsert(t: CellSet, data: PPageDescArray, desc: PPageDesc) =
- var h = cast[int](desc.key) and t.max
- while data[h] != nil:
- sysAssert(data[h] != desc, "CellSetRawInsert 1")
- h = nextTry(h, t.max)
- sysAssert(data[h] == nil, "CellSetRawInsert 2")
- data[h] = desc
- proc cellSetEnlarge(t: var CellSet) =
- var oldMax = t.max
- t.max = ((t.max+1)*2)-1
- var n = cast[PPageDescArray](alloc0((t.max + 1) * sizeof(PPageDesc)))
- for i in 0 .. oldMax:
- if t.data[i] != nil:
- cellSetRawInsert(t, n, t.data[i])
- dealloc(t.data)
- t.data = n
- proc cellSetPut(t: var CellSet, key: uint): PPageDesc =
- var h = cast[int](key) and t.max
- while true:
- var x = t.data[h]
- if x == nil: break
- if x.key == key: return x
- h = nextTry(h, t.max)
- if ((t.max+1)*2 < t.counter*3) or ((t.max+1)-t.counter < 4):
- cellSetEnlarge(t)
- inc(t.counter)
- h = cast[int](key) and t.max
- while t.data[h] != nil: h = nextTry(h, t.max)
- sysAssert(t.data[h] == nil, "CellSetPut")
- # the new page descriptor goes into result
- result = cast[PPageDesc](alloc0(sizeof(PageDesc)))
- result.next = t.head
- result.key = key
- t.head = result
- t.data[h] = result
- # ---------- slightly higher level procs --------------------------------------
- proc contains(s: CellSet, cell: PCell): bool =
- var u = cast[uint](cell)
- var t = cellSetGet(s, u shr PageShift)
- if t != nil:
- u = (u mod PageSize) div MemAlign
- result = (t.bits[u shr IntShift] and (1 shl (u and IntMask))) != 0
- else:
- result = false
- proc incl(s: var CellSet, cell: PCell) =
- var u = cast[uint](cell)
- var t = cellSetPut(s, u shr PageShift)
- u = (u mod PageSize) div MemAlign
- t.bits[u shr IntShift] = t.bits[u shr IntShift] or (1 shl (u and IntMask))
- proc excl(s: var CellSet, cell: PCell) =
- var u = cast[uint](cell)
- var t = cellSetGet(s, u shr PageShift)
- if t != nil:
- u = (u mod PageSize) div MemAlign
- t.bits[u shr IntShift] = (t.bits[u shr IntShift] and
- not (1 shl (u and IntMask)))
- proc containsOrIncl(s: var CellSet, cell: PCell): bool =
- var u = cast[uint](cell)
- var t = cellSetGet(s, u shr PageShift)
- if t != nil:
- u = (u mod PageSize) div MemAlign
- result = (t.bits[u shr IntShift] and (1 shl (u and IntMask))) != 0
- if not result:
- t.bits[u shr IntShift] = t.bits[u shr IntShift] or
- (1 shl (u and IntMask))
- else:
- incl(s, cell)
- result = false
- iterator elements(t: CellSet): PCell {.inline.} =
- # while traversing it is forbidden to add pointers to the tree!
- var r = t.head
- while r != nil:
- var i: uint = 0
- while int(i) <= high(r.bits):
- var w = r.bits[i] # taking a copy of r.bits[i] here is correct, because
- # modifying operations are not allowed during traversation
- var j: uint = 0
- while w != 0: # test all remaining bits for zero
- if (w and 1) != 0: # the bit is set!
- yield cast[PCell]((r.key shl PageShift) or
- (i shl IntShift + j) * MemAlign)
- inc(j)
- w = w shr 1
- inc(i)
- r = r.next
- when false:
- type
- CellSetIter = object
- p: PPageDesc
- i, w, j: int
- proc next(it: var CellSetIter): PCell =
- while true:
- while it.w != 0: # test all remaining bits for zero
- if (it.w and 1) != 0: # the bit is set!
- result = cast[PCell]((it.p.key shl PageShift) or
- (it.i shl IntShift +% it.j) *% MemAlign)
- inc(it.j)
- it.w = it.w shr 1
- return
- else:
- inc(it.j)
- it.w = it.w shr 1
- # load next w:
- if it.i >= high(it.p.bits):
- it.i = 0
- it.j = 0
- it.p = it.p.next
- if it.p == nil: return nil
- else:
- inc it.i
- it.w = it.p.bits[i]
- proc init(it: var CellSetIter; t: CellSet): PCell =
- it.p = t.head
- it.i = -1
- it.w = 0
- result = it.next
- iterator elementsExcept(t, s: CellSet): PCell {.inline.} =
- var r = t.head
- while r != nil:
- let ss = cellSetGet(s, r.key)
- var i:uint = 0
- while int(i) <= high(r.bits):
- var w = r.bits[i]
- if ss != nil:
- w = w and not ss.bits[i]
- var j:uint = 0
- while w != 0:
- if (w and 1) != 0:
- yield cast[PCell]((r.key shl PageShift) or
- (i shl IntShift + j) * MemAlign)
- inc(j)
- w = w shr 1
- inc(i)
- r = r.next
|