| // Copyright 2024 The Go Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file. |
| |
| package maps |
| |
| import ( |
| "internal/abi" |
| "internal/goarch" |
| "internal/runtime/math" |
| "unsafe" |
| ) |
| |
| // Maximum size of a table before it is split at the directory level. |
| // |
| // TODO: Completely made up value. This should be tuned for performance vs grow |
| // latency. |
| // TODO: This should likely be based on byte size, as copying costs will |
| // dominate grow latency for large objects. |
| const maxTableCapacity = 1024 |
| |
| // Ensure the max capacity fits in uint16, used for capacity and growthLeft |
| // below. |
| var _ = uint16(maxTableCapacity) |
| |
| // table is a Swiss table hash table structure. |
| // |
| // Each table is a complete hash table implementation. |
| // |
| // Map uses one or more tables to store entries. Extendible hashing (hash |
| // prefix) is used to select the table to use for a specific key. Using |
| // multiple tables enables incremental growth by growing only one table at a |
| // time. |
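| // |
| // Illustrative example (directory indexing itself lives in Map, not here): |
| // with globalDepth == 2 the directory has 4 entries and a key is routed by |
| // the top 2 bits of its hash, so a hash beginning 0b10... selects directory |
| // entry 2. A table that has not yet split to depth 2 occupies multiple |
| // consecutive entries (see localDepth and index below). |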
| type table struct { |
| // The number of filled slots (i.e. the number of elements in the table). |
| used uint16 |
| |
| // The total number of slots (always 2^N). Equal to |
| // `(groups.lengthMask+1)*abi.MapGroupSlots`. |
| capacity uint16 |
| |
| // The number of slots we can still fill without needing to rehash. |
| // |
| // We rehash when used + tombstones > loadFactor*capacity, including |
| // tombstones so the table doesn't overfill with tombstones. This field |
| // counts down remaining empty slots before the next rehash. |
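| // |
| // Illustrative: deleting a key from a group with no empty slot leaves a |
| // tombstone and does not increment growthLeft, so inserts and such deletes |
| // both consume the budget; the slots are only reclaimed by pruneTombstones |
| // or by rehash. |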
| growthLeft uint16 |
| |
| // The number of bits used by directory lookups above this table. Note |
| // that this may be less than globalDepth, if the directory has grown |
| // but this table has not yet been split. |
| localDepth uint8 |
| |
| // Index of this table in the Map directory. This is the index of the |
| // _first_ location in the directory. The table may occur in multiple |
| // sequential indices. |
| // |
| // index is -1 if the table is stale (no longer installed in the |
| // directory). |
| index int |
| |
| // groups is an array of slot groups. Each group holds abi.MapGroupSlots |
| // key/elem slots and their control bytes. A table has a fixed size |
| // groups array. The table is replaced (in rehash) when more space is |
| // required. |
| // |
| // TODO(prattmic): keys and elements are interleaved to maximize |
| // locality, but it comes at the expense of wasted space for some types |
| // (consider uint8 key, uint64 element). Consider placing all keys |
| // together in these cases to save space. |
| groups groupsReference |
| } |
| |
| func newTable(typ *abi.MapType, capacity uint64, index int, localDepth uint8) *table { |
| if capacity < abi.MapGroupSlots { |
| capacity = abi.MapGroupSlots |
| } |
| |
| t := &table{ |
| index: index, |
| localDepth: localDepth, |
| } |
| |
| if capacity > maxTableCapacity { |
| panic("initial table capacity too large") |
| } |
| |
| // N.B. group count must be a power of two for probeSeq to visit every |
| // group. |
| capacity, overflow := alignUpPow2(capacity) |
| if overflow { |
| panic("rounded-up capacity overflows uint64") |
| } |
| |
| t.reset(typ, uint16(capacity)) |
| |
| return t |
| } |
| |
| // reset resets the table, allocating new empty groups with the specified |
| // total capacity. |
| func (t *table) reset(typ *abi.MapType, capacity uint16) { |
| groupCount := uint64(capacity) / abi.MapGroupSlots |
| t.groups = newGroups(typ, groupCount) |
| t.capacity = capacity |
| t.growthLeft = t.maxGrowthLeft() |
| |
| for i := uint64(0); i <= t.groups.lengthMask; i++ { |
| g := t.groups.group(typ, i) |
| g.ctrls().setEmpty() |
| } |
| } |
| |
| // maxGrowthLeft is the number of inserts we can do before |
| // resizing, starting from an empty table. |
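| // |
| // Illustrative numbers, assuming 8-slot groups and the 7/8 maximum load |
| // factor mentioned in Iter.Next below: capacity 8 allows 8-1 = 7 inserts |
| // (one empty slot must remain to terminate probing); capacity 1024 allows |
| // 1024*7/8 = 896 inserts. |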
| func (t *table) maxGrowthLeft() uint16 { |
| if t.capacity == 0 { |
| // No real reason to support zero capacity table, since an |
| // empty Map simply won't have a table. |
| panic("table must have positive capacity") |
| } else if t.capacity <= abi.MapGroupSlots { |
| // If the map fits in a single group then we're able to fill all of |
| // the slots except 1 (an empty slot is needed to terminate find |
| // operations). |
| // |
| // TODO(go.dev/issue/54766): With a special case in probing for |
| // single-group tables, we could fill all slots. |
| return t.capacity - 1 |
| } else { |
| if t.capacity > math.MaxUint16/maxAvgGroupLoad { |
| panic("overflow") |
| } |
| return (t.capacity * maxAvgGroupLoad) / abi.MapGroupSlots |
| } |
| } |
| |
| func (t *table) Used() uint64 { |
| return uint64(t.used) |
| } |
| |
| // Get performs a lookup of the key that key points to. It returns a pointer to |
| // the element, or false if the key doesn't exist. |
| func (t *table) Get(typ *abi.MapType, m *Map, key unsafe.Pointer) (unsafe.Pointer, bool) { |
| // TODO(prattmic): We could avoid hashing in a variety of special |
| // cases. |
| // |
| // - One-entry maps could just directly compare the single entry |
| // without hashing. |
| // - String keys could do quick checks of a few bytes before hashing. |
| hash := typ.Hasher(key, m.seed) |
| _, elem, ok := t.getWithKey(typ, hash, key) |
| return elem, ok |
| } |
| |
| // getWithKey performs a lookup of key, returning a pointer to the version of |
| // the key in the map in addition to the element. |
| // |
| // This is relevant when multiple different key values compare equal (e.g., |
| // +0.0 and -0.0). When a grow occurs during iteration, iteration performs a |
| // lookup of keys from the old group in the new tables in order to correctly |
| // expose updated elements. For NeedsKeyUpdate keys, iteration also must return |
| // the new key value, not the old key value. |
| // |
| // hash must be the hash of the key. |
| func (t *table) getWithKey(typ *abi.MapType, hash uintptr, key unsafe.Pointer) (unsafe.Pointer, unsafe.Pointer, bool) { |
| // To find the location of a key in the table, we compute hash(key). From |
| // h1(hash(key)) and the capacity, we construct a probeSeq that visits |
| // every group of slots in some interesting order. See [probeSeq]. |
| // |
| // We walk through these indices. At each index, we select the entire |
| // group starting with that index and extract potential candidates: |
| // occupied slots with a control byte equal to h2(hash(key)). The key |
| // at candidate slot i is compared with key; if key == g.slot(i).key |
| // we are done and return pointers to the key and element; if the group |
| // contains an empty slot, the key is not present and we stop, reporting |
| // not found; otherwise we continue to the next probe index. Tombstones |
| // (ctrlDeleted) effectively behave like |
| // full slots that never match the value we're looking for. |
| // |
| // The h2 bits ensure when we compare a key we are likely to have |
| // actually found the object. That is, the chance is low that keys |
| // compare false. Thus, when we search for an object, we are unlikely |
| // to call Equal many times. This likelihood can be analyzed as follows |
| // (assuming that h2 is a random enough hash function). |
| // |
| // Let's assume that there are k "wrong" objects that must be examined |
| // in a probe sequence. For example, when doing a find on an object |
| // that is in the table, k is the number of objects between the start |
| // of the probe sequence and the final found object (not including the |
| // final found object). The expected number of objects with an h2 match |
| // is then k/128. Measurements and analysis indicate that even at high |
| // load factors, k is less than 32, meaning that the number of false |
| // positive comparisons we must perform is less than 1/8 per find. |
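| // |
| // For example, since h2 carries 7 bits (128 values), a lookup that walks |
| // past k = 16 non-matching full slots is expected to trigger only |
| // 16/128 = 0.125 spurious Equal calls. |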
| seq := makeProbeSeq(h1(hash), t.groups.lengthMask) |
| h2Hash := h2(hash) |
| for ; ; seq = seq.next() { |
| g := t.groups.group(typ, seq.offset) |
| |
| match := g.ctrls().matchH2(h2Hash) |
| |
| for match != 0 { |
| i := match.first() |
| |
| slotKey := g.key(typ, i) |
| if typ.IndirectKey() { |
| slotKey = *((*unsafe.Pointer)(slotKey)) |
| } |
| if typ.Key.Equal(key, slotKey) { |
| slotElem := g.elem(typ, i) |
| if typ.IndirectElem() { |
| slotElem = *((*unsafe.Pointer)(slotElem)) |
| } |
| return slotKey, slotElem, true |
| } |
| match = match.removeFirst() |
| } |
| |
| match = g.ctrls().matchEmpty() |
| if match != 0 { |
| // Finding an empty slot means we've reached the end of |
| // the probe sequence. |
| return nil, nil, false |
| } |
| } |
| } |
| |
| func (t *table) getWithoutKey(typ *abi.MapType, hash uintptr, key unsafe.Pointer) (unsafe.Pointer, bool) { |
| seq := makeProbeSeq(h1(hash), t.groups.lengthMask) |
| h2Hash := h2(hash) |
| for ; ; seq = seq.next() { |
| g := t.groups.group(typ, seq.offset) |
| |
| match := g.ctrls().matchH2(h2Hash) |
| |
| for match != 0 { |
| i := match.first() |
| |
| slotKey := g.key(typ, i) |
| if typ.IndirectKey() { |
| slotKey = *((*unsafe.Pointer)(slotKey)) |
| } |
| if typ.Key.Equal(key, slotKey) { |
| slotElem := g.elem(typ, i) |
| if typ.IndirectElem() { |
| slotElem = *((*unsafe.Pointer)(slotElem)) |
| } |
| return slotElem, true |
| } |
| match = match.removeFirst() |
| } |
| |
| match = g.ctrls().matchEmpty() |
| if match != 0 { |
| // Finding an empty slot means we've reached the end of |
| // the probe sequence. |
| return nil, false |
| } |
| } |
| } |
| |
| // PutSlot returns a pointer to the element slot where an inserted element |
| // should be written, and ok if it returned a valid slot. |
| // |
| // PutSlot returns ok false if the table was split and the Map needs to find |
| // the new table. |
| // |
| // hash must be the hash of key. |
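| // |
| // A caller in the Map put path is expected to re-resolve the table and retry |
| // when ok is false. A rough sketch (illustrative only; the real caller and |
| // the directory re-lookup live in map.go, and idx here stands for the |
| // directory index recomputed from the hash prefix): |
| // |
| //	for { |
| //		elem, ok := t.PutSlot(typ, m, hash, key) |
| //		if ok { |
| //			// write the new element through elem |
| //			break |
| //		} |
| //		t = m.directoryAt(idx) // table was split; re-find it and retry |
| //	} |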
| func (t *table) PutSlot(typ *abi.MapType, m *Map, hash uintptr, key unsafe.Pointer) (unsafe.Pointer, bool) { |
| seq := makeProbeSeq(h1(hash), t.groups.lengthMask) |
| |
| // As we look for a match, keep track of the first deleted slot we |
| // find, which we'll use to insert the new entry if necessary. |
| var firstDeletedGroup groupReference |
| var firstDeletedSlot uintptr |
| |
| h2Hash := h2(hash) |
| for ; ; seq = seq.next() { |
| g := t.groups.group(typ, seq.offset) |
| match := g.ctrls().matchH2(h2Hash) |
| |
| // Look for an existing slot containing this key. |
| for match != 0 { |
| i := match.first() |
| |
| slotKey := g.key(typ, i) |
| if typ.IndirectKey() { |
| slotKey = *((*unsafe.Pointer)(slotKey)) |
| } |
| if typ.Key.Equal(key, slotKey) { |
| if typ.NeedKeyUpdate() { |
| typedmemmove(typ.Key, slotKey, key) |
| } |
| |
| slotElem := g.elem(typ, i) |
| if typ.IndirectElem() { |
| slotElem = *((*unsafe.Pointer)(slotElem)) |
| } |
| |
| t.checkInvariants(typ, m) |
| return slotElem, true |
| } |
| match = match.removeFirst() |
| } |
| |
| // No existing slot for this key in this group. Is this the end |
| // of the probe sequence? |
| match = g.ctrls().matchEmptyOrDeleted() |
| if match == 0 { |
| continue // nothing but filled slots. Keep probing. |
| } |
| i := match.first() |
| if g.ctrls().get(i) == ctrlDeleted { |
| // There are some deleted slots. Remember |
| // the first one, and keep probing. |
| if firstDeletedGroup.data == nil { |
| firstDeletedGroup = g |
| firstDeletedSlot = i |
| } |
| continue |
| } |
| // We've found an empty slot, which means we've reached the end of |
| // the probe sequence. |
| |
| // If we found a deleted slot along the way, we can |
| // replace it without consuming growthLeft. |
| if firstDeletedGroup.data != nil { |
| g = firstDeletedGroup |
| i = firstDeletedSlot |
| t.growthLeft++ // will be decremented below to become a no-op. |
| } |
| |
| // If we have no space left, first try to remove some tombstones. |
| if t.growthLeft == 0 { |
| t.pruneTombstones(typ, m) |
| } |
| |
| // If there is room left to grow, just insert the new entry. |
| if t.growthLeft > 0 { |
| slotKey := g.key(typ, i) |
| if typ.IndirectKey() { |
| kmem := newobject(typ.Key) |
| *(*unsafe.Pointer)(slotKey) = kmem |
| slotKey = kmem |
| } |
| typedmemmove(typ.Key, slotKey, key) |
| |
| slotElem := g.elem(typ, i) |
| if typ.IndirectElem() { |
| emem := newobject(typ.Elem) |
| *(*unsafe.Pointer)(slotElem) = emem |
| slotElem = emem |
| } |
| |
| g.ctrls().set(i, ctrl(h2Hash)) |
| t.growthLeft-- |
| t.used++ |
| m.used++ |
| |
| t.checkInvariants(typ, m) |
| return slotElem, true |
| } |
| |
| t.rehash(typ, m) |
| return nil, false |
| } |
| } |
| |
| // uncheckedPutSlot inserts an entry known not to be in the table. |
| // This is used for grow/split where we are making a new table from |
| // entries in an existing table. |
| // |
| // Decrements growthLeft and increments used. |
| // |
| // Requires that the entry does not exist in the table, and that the table has |
| // room for another element without rehashing. |
| // |
| // Requires that there are no deleted entries in the table. |
| // |
| // For indirect keys and/or elements, the key and elem pointers can be |
| // put directly into the map; they do not need to be copied. This |
| // requires the caller to ensure that the referenced memory never |
| // changes (by sourcing those pointers from another indirect key/elem |
| // map). |
| func (t *table) uncheckedPutSlot(typ *abi.MapType, hash uintptr, key, elem unsafe.Pointer) { |
| if t.growthLeft == 0 { |
| panic("invariant failed: growthLeft is unexpectedly 0") |
| } |
| |
| // Given key and its hash hash(key), to insert it, we construct a |
| // probeSeq, and use it to find the first group with an unoccupied (empty |
| // or deleted) slot. We place the key/value into the first such slot in |
| // the group and mark it as full with key's H2. |
| seq := makeProbeSeq(h1(hash), t.groups.lengthMask) |
| for ; ; seq = seq.next() { |
| g := t.groups.group(typ, seq.offset) |
| |
| match := g.ctrls().matchEmptyOrDeleted() |
| if match != 0 { |
| i := match.first() |
| |
| slotKey := g.key(typ, i) |
| if typ.IndirectKey() { |
| *(*unsafe.Pointer)(slotKey) = key |
| } else { |
| typedmemmove(typ.Key, slotKey, key) |
| } |
| |
| slotElem := g.elem(typ, i) |
| if typ.IndirectElem() { |
| *(*unsafe.Pointer)(slotElem) = elem |
| } else { |
| typedmemmove(typ.Elem, slotElem, elem) |
| } |
| |
| t.growthLeft-- |
| t.used++ |
| g.ctrls().set(i, ctrl(h2(hash))) |
| return |
| } |
| } |
| } |
| |
| // Delete returns true if it put a tombstone in t. |
| func (t *table) Delete(typ *abi.MapType, m *Map, hash uintptr, key unsafe.Pointer) bool { |
| seq := makeProbeSeq(h1(hash), t.groups.lengthMask) |
| h2Hash := h2(hash) |
| for ; ; seq = seq.next() { |
| g := t.groups.group(typ, seq.offset) |
| match := g.ctrls().matchH2(h2Hash) |
| |
| for match != 0 { |
| i := match.first() |
| |
| slotKey := g.key(typ, i) |
| origSlotKey := slotKey |
| if typ.IndirectKey() { |
| slotKey = *((*unsafe.Pointer)(slotKey)) |
| } |
| |
| if typ.Key.Equal(key, slotKey) { |
| t.used-- |
| m.used-- |
| |
| if typ.IndirectKey() { |
| // Clearing the pointer is sufficient. |
| *(*unsafe.Pointer)(origSlotKey) = nil |
| } else if typ.Key.Pointers() { |
| // Only bother clearing the key if there |
| // are pointers in it. |
| typedmemclr(typ.Key, slotKey) |
| } |
| |
| slotElem := g.elem(typ, i) |
| if typ.IndirectElem() { |
| // Clearing the pointer is sufficient. |
| *(*unsafe.Pointer)(slotElem) = nil |
| } else { |
| // Unlike keys, always clear the elem (even if |
| // it contains no pointers), as compound |
| // assignment operations depend on cleared |
| // deleted values. See |
| // https://go.dev/issue/25936. |
| typedmemclr(typ.Elem, slotElem) |
| } |
| |
| // Only a full group can appear in the middle |
| // of a probe sequence (a group with at least |
| // one empty slot terminates probing). Once a |
| // group becomes full, it stays full until |
| // rehashing/resizing. So if the group isn't |
| // full now, we can simply remove the element. |
| // Otherwise, we create a tombstone to mark the |
| // slot as deleted. |
| var tombstone bool |
| if g.ctrls().matchEmpty() != 0 { |
| g.ctrls().set(i, ctrlEmpty) |
| t.growthLeft++ |
| } else { |
| g.ctrls().set(i, ctrlDeleted) |
| tombstone = true |
| } |
| |
| t.checkInvariants(typ, m) |
| return tombstone |
| } |
| match = match.removeFirst() |
| } |
| |
| match = g.ctrls().matchEmpty() |
| if match != 0 { |
| // Finding an empty slot means we've reached the end of |
| // the probe sequence. |
| return false |
| } |
| } |
| } |
| |
| // pruneTombstones goes through the table and tries to remove |
| // tombstones that are no longer needed. Best effort. |
| // Note that it only removes tombstones, it does not move elements. |
| // Moving elements would do a better job but is infeasible due to |
| // iterator semantics. |
| // |
| // Pruning should only succeed if it can remove O(n) tombstones. |
| // It would be bad if we did O(n) work to find 1 tombstone to remove. |
| // Then the next insert would spend another O(n) work to find 1 more |
| // tombstone to remove, etc. |
| // |
| // We really need to remove O(n) tombstones so we can pay for the cost |
| // of finding them. If we can't, then we need to grow (which is also O(n), |
| // but guarantees O(n) subsequent inserts can happen in constant time). |
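| // |
| // Illustrative thresholds for a capacity-1024 table: pruning is attempted |
| // only once there are at least 103 tombstones (just over 10% of capacity), |
| // and it only rewrites control words if at least 103 of those tombstones |
| // sit in groups whose tombstones no live key's probe sequence needs. |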
| func (t *table) pruneTombstones(typ *abi.MapType, m *Map) { |
| if t.tombstones()*10 < t.capacity { // 10% of capacity |
| // Not enough tombstones to be worth the effort. |
| return |
| } |
| |
| // Bit set marking all the groups whose tombstones are needed. |
| var needed [(maxTableCapacity/abi.MapGroupSlots + 31) / 32]uint32 |
| |
| // Trace the probe sequence of every full entry. |
| for i := uint64(0); i <= t.groups.lengthMask; i++ { |
| g := t.groups.group(typ, i) |
| match := g.ctrls().matchFull() |
| for match != 0 { |
| j := match.first() |
| match = match.removeFirst() |
| key := g.key(typ, j) |
| if typ.IndirectKey() { |
| key = *((*unsafe.Pointer)(key)) |
| } |
| if !typ.Key.Equal(key, key) { |
| // Key not equal to itself. We never have to find these |
| // keys on lookup (only on iteration), so we can break |
| // their probe sequences at will. |
| continue |
| } |
| // Walk probe sequence for this key. |
| // Each tombstone group we need to walk past is marked required. |
| hash := typ.Hasher(key, m.seed) |
| for seq := makeProbeSeq(h1(hash), t.groups.lengthMask); ; seq = seq.next() { |
| if seq.offset == i { |
| break // reached group of element in probe sequence |
| } |
| g := t.groups.group(typ, seq.offset) |
| m := g.ctrls().matchEmptyOrDeleted() |
| if m != 0 { // must be deleted, not empty, as we haven't found our key yet |
| // Mark this group's tombstone as required. |
| needed[seq.offset/32] |= 1 << (seq.offset % 32) |
| } |
| } |
| } |
| if g.ctrls().matchEmpty() != 0 { |
| // Also mark groups that contain empty slots, so we don't |
| // mistake their empty slots for removable tombstones below. |
| needed[i/32] |= 1 << (i % 32) |
| } |
| } |
| |
| // First, see if we can remove enough tombstones to restore capacity. |
| // This function is O(n), so only remove tombstones if we can remove |
| // enough of them to justify the O(n) cost. |
| cnt := 0 |
| for i := uint64(0); i <= t.groups.lengthMask; i++ { |
| if needed[i/32]>>(i%32)&1 != 0 { |
| continue |
| } |
| g := t.groups.group(typ, i) |
| m := g.ctrls().matchEmptyOrDeleted() // must be deleted |
| cnt += m.count() |
| } |
| if cnt*10 < int(t.capacity) { // Can we restore 10% of capacity? |
| return // don't bother removing tombstones. Caller will grow instead. |
| } |
| |
| // Prune unneeded tombstones. |
| for i := uint64(0); i <= t.groups.lengthMask; i++ { |
| if needed[i/32]>>(i%32)&1 != 0 { |
| continue |
| } |
| g := t.groups.group(typ, i) |
| m := g.ctrls().matchEmptyOrDeleted() // must be deleted |
| for m != 0 { |
| k := m.first() |
| m = m.removeFirst() |
| g.ctrls().set(k, ctrlEmpty) |
| t.growthLeft++ |
| } |
| // TODO: maybe we could convert all slots at once |
| // using some bitvector trickery. |
| } |
| } |
| |
| // tombstones returns the number of deleted (tombstone) entries in the table. A |
| // tombstone is a slot that has been deleted but is still considered occupied |
| // so as not to violate the probing invariant. |
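| // |
| // Illustrative, assuming the 7/8 load factor: a capacity-1024 table has a |
| // fillable budget of 1024*7/8 = 896 slots, so with used == 700 and |
| // growthLeft == 150 there are 896 - 700 - 150 = 46 tombstones. |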
| func (t *table) tombstones() uint16 { |
| return (t.capacity*maxAvgGroupLoad)/abi.MapGroupSlots - t.used - t.growthLeft |
| } |
| |
| // Clear deletes all entries from the table, resulting in an empty table. |
| func (t *table) Clear(typ *abi.MapType) { |
| mgl := t.maxGrowthLeft() |
| if t.used == 0 && t.growthLeft == mgl { // no current entries and no tombstones |
| return |
| } |
| // We only want to do the work of clearing slots |
| // if they are full. But we also don't want to do too |
| // much work to figure out whether a slot is full or not, |
| // especially if clearing a slot is cheap. |
| // 1) We decide group-by-group instead of slot-by-slot. |
| // If any slot in a group is full, we zero the whole group. |
| // 2) If groups are unlikely to be empty, don't bother |
| // testing for it. |
| // 3) If groups are 50%/50% likely to be empty, also don't |
| // bother testing, as it confuses the branch predictor. See #75097. |
| // 4) But if a group is really large, do the test anyway, as |
| // clearing is expensive. |
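| // For example, with 128 groups (lengthMask == 127) the per-group emptiness |
| // test is used while t.used <= 31, i.e. at most ~0.25 entries per group. |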
| fullTest := uint64(t.used)*4 <= t.groups.lengthMask // less than ~0.25 entries per group -> >3/4 empty groups |
| if typ.SlotSize > 32 { |
| // For large slots, it is always worth doing the test first. |
| fullTest = true |
| } |
| if fullTest { |
| for i := uint64(0); i <= t.groups.lengthMask; i++ { |
| g := t.groups.group(typ, i) |
| if g.ctrls().anyFull() { |
| typedmemclr(typ.Group, g.data) |
| } |
| g.ctrls().setEmpty() |
| } |
| } else { |
| for i := uint64(0); i <= t.groups.lengthMask; i++ { |
| g := t.groups.group(typ, i) |
| typedmemclr(typ.Group, g.data) |
| g.ctrls().setEmpty() |
| } |
| } |
| t.used = 0 |
| t.growthLeft = mgl |
| } |
| |
| type Iter struct { |
| key unsafe.Pointer // Must be in first position. Write nil to indicate iteration end (see cmd/compile/internal/walk/range.go). |
| elem unsafe.Pointer // Must be in second position (see cmd/compile/internal/walk/range.go). |
| typ *abi.MapType |
| m *Map |
| |
| // Randomize iteration order by starting iteration at a random slot |
| // offset. The offset into the directory uses a separate offset, as it |
| // must adjust when the directory grows. |
| entryOffset uint64 |
| dirOffset uint64 |
| |
| // Snapshot of Map.clearSeq at iteration initialization time. Used to |
| // detect clear during iteration. |
| clearSeq uint64 |
| |
| // Value of Map.globalDepth during the last call to Next. Used to |
| // detect directory grow during iteration. |
| globalDepth uint8 |
| |
| // dirIdx is the current directory index, prior to adjustment by |
| // dirOffset. |
| dirIdx int |
| |
| // tab is the table at dirIdx during the previous call to Next. |
| tab *table |
| |
| // group is the group at entryIdx during the previous call to Next. |
| group groupReference |
| |
| // entryIdx is the current entry index, prior to adjustment by entryOffset. |
| // The lower 3 bits of the index are the slot index, and the upper bits |
| // are the group index. |
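| // For example, with 8-slot groups entryIdx 13 refers to group 1 (13>>3) |
| // and slot 5 (13&7). |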
| entryIdx uint64 |
| } |
| |
| // Init initializes Iter for iteration. |
| func (it *Iter) Init(typ *abi.MapType, m *Map) { |
| it.typ = typ |
| |
| if m == nil || m.used == 0 { |
| return |
| } |
| |
| dirIdx := 0 |
| var groupSmall groupReference |
| if m.dirLen <= 0 { |
| // Use dirIdx == -1 as sentinel for small maps. |
| dirIdx = -1 |
| groupSmall.data = m.dirPtr |
| } |
| |
| it.m = m |
| it.entryOffset = rand() |
| it.dirOffset = rand() |
| it.globalDepth = m.globalDepth |
| it.dirIdx = dirIdx |
| it.group = groupSmall |
| it.clearSeq = m.clearSeq |
| } |
| |
| func (it *Iter) Initialized() bool { |
| return it.typ != nil |
| } |
| |
| // Map returns the map this iterator is iterating over. |
| func (it *Iter) Map() *Map { |
| return it.m |
| } |
| |
| // Key returns a pointer to the current key. nil indicates end of iteration. |
| // |
| // Must not be called prior to Next. |
| func (it *Iter) Key() unsafe.Pointer { |
| return it.key |
| } |
| |
| // Elem returns a pointer to the current element. nil indicates end of |
| // iteration. |
| // |
| // Must not be called prior to Next. |
| func (it *Iter) Elem() unsafe.Pointer { |
| return it.elem |
| } |
| |
| func (it *Iter) nextDirIdx() { |
| // Skip other entries in the directory that refer to the same |
| // logical table. There are two cases of this: |
| // |
| // Consider this directory: |
| // |
| // - 0: *t1 |
| // - 1: *t1 |
| // - 2: *t2a |
| // - 3: *t2b |
| // |
| // At some point, the directory grew to accommodate a split of |
| // t2. t1 did not split, so entries 0 and 1 both point to t1. |
| // t2 did split, so the two halves were installed in entries 2 |
| // and 3. |
| // |
| // If dirIdx is 0 and it.tab is t1, then we should skip past |
| // entry 1 to avoid repeating t1. |
| // |
| // If dirIdx is 2 and it.tab is t2 (pre-split), then we should |
| // skip past entry 3 because our pre-split t2 already covers |
| // all keys from t2a and t2b (except for new insertions, which |
| // iteration need not return). |
| // |
| // We can achieve both of these by using the difference between |
| // the directory and table depth to compute how many entries |
| // the table covers. |
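| // |
| // For example, with globalDepth == 3 and localDepth == 1 the table occupies |
| // 1<<(3-1) = 4 consecutive directory entries, so dirIdx advances by 4. |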
| entries := 1 << (it.m.globalDepth - it.tab.localDepth) |
| it.dirIdx += entries |
| it.tab = nil |
| it.group = groupReference{} |
| it.entryIdx = 0 |
| } |
| |
| // grownKeyElem returns the appropriate key/elem for key at slotIdx within |
| // it.group, if any. |
| func (it *Iter) grownKeyElem(key unsafe.Pointer, slotIdx uintptr) (unsafe.Pointer, unsafe.Pointer, bool) { |
| newKey, newElem, ok := it.m.getWithKey(it.typ, key) |
| if !ok { |
| // Key has likely been deleted, and |
| // should be skipped. |
| // |
| // One exception is keys that don't |
| // compare equal to themselves (e.g., |
| // NaN). These keys cannot be looked |
| // up, so getWithKey will fail even if |
| // the key exists. |
| // |
| // However, we are in luck because such |
| // keys cannot be updated and they |
| // cannot be deleted except with clear. |
| // Thus if no clear has occurred, the |
| // key/elem must still exist exactly as |
| // in the old groups, so we can return |
| // them from there. |
| // |
| // TODO(prattmic): Consider checking |
| // clearSeq early. If a clear occurred, |
| // Next could always return |
| // immediately, as iteration doesn't |
| // need to return anything added after |
| // clear. |
| if it.clearSeq == it.m.clearSeq && !it.typ.Key.Equal(key, key) { |
| elem := it.group.elem(it.typ, slotIdx) |
| if it.typ.IndirectElem() { |
| elem = *((*unsafe.Pointer)(elem)) |
| } |
| return key, elem, true |
| } |
| |
| // This entry doesn't exist anymore. |
| return nil, nil, false |
| } |
| |
| return newKey, newElem, true |
| } |
| |
| // Next proceeds to the next element in iteration, which can be accessed via |
| // the Key and Elem methods. |
| // |
| // The table can be mutated during iteration, though there is no guarantee that |
| // the mutations will be visible to the iteration. |
| // |
| // Init must be called prior to Next. |
| func (it *Iter) Next() { |
| if it.m == nil { |
| // Map was empty at Iter.Init. |
| it.key = nil |
| it.elem = nil |
| return |
| } |
| |
| if it.m.writing != 0 { |
| fatal("concurrent map iteration and map write") |
| return |
| } |
| |
| if it.dirIdx < 0 { |
| // Map was small at Init. |
| for ; it.entryIdx < abi.MapGroupSlots; it.entryIdx++ { |
| k := uintptr(it.entryIdx+it.entryOffset) % abi.MapGroupSlots |
| |
| if (it.group.ctrls().get(k) & ctrlEmpty) == ctrlEmpty { |
| // Empty or deleted. |
| continue |
| } |
| |
| key := it.group.key(it.typ, k) |
| if it.typ.IndirectKey() { |
| key = *((*unsafe.Pointer)(key)) |
| } |
| |
| // As below, if we have grown to a full map since Init, |
| // we continue to use the old group to decide the keys |
| // to return, but must look them up again in the new |
| // tables. |
| grown := it.m.dirLen > 0 |
| var elem unsafe.Pointer |
| if grown { |
| var ok bool |
| newKey, newElem, ok := it.m.getWithKey(it.typ, key) |
| if !ok { |
| // See comment below. |
| if it.clearSeq == it.m.clearSeq && !it.typ.Key.Equal(key, key) { |
| elem = it.group.elem(it.typ, k) |
| if it.typ.IndirectElem() { |
| elem = *((*unsafe.Pointer)(elem)) |
| } |
| } else { |
| continue |
| } |
| } else { |
| key = newKey |
| elem = newElem |
| } |
| } else { |
| elem = it.group.elem(it.typ, k) |
| if it.typ.IndirectElem() { |
| elem = *((*unsafe.Pointer)(elem)) |
| } |
| } |
| |
| it.entryIdx++ |
| it.key = key |
| it.elem = elem |
| return |
| } |
| it.key = nil |
| it.elem = nil |
| return |
| } |
| |
| if it.globalDepth != it.m.globalDepth { |
| // Directory has grown since the last call to Next. Adjust our |
| // directory index. |
| // |
| // Consider: |
| // |
| // Before: |
| // - 0: *t1 |
| // - 1: *t2 <- dirIdx |
| // |
| // After: |
| // - 0: *t1a (split) |
| // - 1: *t1b (split) |
| // - 2: *t2 <- dirIdx |
| // - 3: *t2 |
| // |
| // That is, we want to double the current index when the |
| // directory size doubles (or quadruple when the directory size |
| // quadruples, etc). |
| // |
| // The actual (randomized) dirIdx is computed below as: |
| // |
| // dirIdx := (it.dirIdx + it.dirOffset) % it.m.dirLen |
| // |
| // Multiplication distributes over the modulo operation in this form: |
| // A * (B % C) = (A * B) % (A * C), |
| // provided that A is positive. |
| // |
| // Thus we can achieve this by adjusting it.dirIdx, |
| // it.dirOffset, and it.m.dirLen individually. |
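| // |
| // Worked example: going from dirLen 2 to 4 (orders == 1) with it.dirIdx == 1 |
| // and it.dirOffset == 5, the old slot was (1+5)%2 == 0; after doubling both, |
| // (2+10)%4 == 0 == 2*0, i.e. the same logical position scaled up with the |
| // directory. |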
| orders := it.m.globalDepth - it.globalDepth |
| it.dirIdx <<= orders |
| it.dirOffset <<= orders |
| // it.m.dirLen was already adjusted when the directory grew. |
| |
| it.globalDepth = it.m.globalDepth |
| } |
| |
| // Continue iteration until we find a full slot. |
| for ; it.dirIdx < it.m.dirLen; it.nextDirIdx() { |
| // Resolve the table. |
| if it.tab == nil { |
| dirIdx := int((uint64(it.dirIdx) + it.dirOffset) & uint64(it.m.dirLen-1)) |
| newTab := it.m.directoryAt(uintptr(dirIdx)) |
| if newTab.index != dirIdx { |
| // Normally we skip past all duplicates of the |
| // same entry in the table (see updates to |
| // it.dirIdx at the end of the loop below), so |
| // this case wouldn't occur. |
| // |
| // But on the very first call, we have a |
| // completely randomized dirIdx that may refer |
| // to the middle of a run of directory entries |
| // that share a table. Do a one-time adjustment |
| // of the offset to ensure we start at the first |
| // index for newTab. |
| diff := dirIdx - newTab.index |
| it.dirOffset -= uint64(diff) |
| dirIdx = newTab.index |
| } |
| it.tab = newTab |
| } |
| |
| // N.B. Use it.tab, not newTab. It is important to use the old |
| // table for key selection if the table has grown. See comment |
| // on grown below. |
| |
| entryMask := uint64(it.tab.capacity) - 1 |
| if it.entryIdx > entryMask { |
| // Continue to next table. |
| continue |
| } |
| |
| // Fast path: skip matching and directly check if entryIdx is a |
| // full slot. |
| // |
| // In the slow path below, we perform an 8-slot match check to |
| // look for full slots within the group. |
| // |
| // However, with a max load factor of 7/8, each slot in a |
| // mostly full map has a high probability of being full. Thus |
| // it is cheaper to check a single slot than do a full control |
| // match. |
| |
| entryIdx := (it.entryIdx + it.entryOffset) & entryMask |
| slotIdx := uintptr(entryIdx & (abi.MapGroupSlots - 1)) |
| if slotIdx == 0 || it.group.data == nil { |
| // Only compute the group (a) when we switch |
| // groups (slotIdx rolls over) and (b) on the |
| // first iteration in this table (slotIdx may |
| // not be zero due to entryOffset). |
| groupIdx := entryIdx >> abi.MapGroupSlotsBits |
| it.group = it.tab.groups.group(it.typ, groupIdx) |
| } |
| |
| if (it.group.ctrls().get(slotIdx) & ctrlEmpty) == 0 { |
| // Slot full. |
| |
| key := it.group.key(it.typ, slotIdx) |
| if it.typ.IndirectKey() { |
| key = *((*unsafe.Pointer)(key)) |
| } |
| |
| grown := it.tab.index == -1 |
| var elem unsafe.Pointer |
| if grown { |
| newKey, newElem, ok := it.grownKeyElem(key, slotIdx) |
| if !ok { |
| // This entry doesn't exist |
| // anymore. Continue to the |
| // next one. |
| goto next |
| } else { |
| key = newKey |
| elem = newElem |
| } |
| } else { |
| elem = it.group.elem(it.typ, slotIdx) |
| if it.typ.IndirectElem() { |
| elem = *((*unsafe.Pointer)(elem)) |
| } |
| } |
| |
| it.entryIdx++ |
| it.key = key |
| it.elem = elem |
| return |
| } |
| |
| next: |
| it.entryIdx++ |
| |
| // Slow path: use a match on the control word to jump ahead to |
| // the next full slot. |
| // |
| // This is highly effective for maps with particularly low load |
| // (e.g., map allocated with large hint but few insertions). |
| // |
| // For maps with medium load (e.g., 3-4 empty slots per group) |
| // it also tends to work pretty well. Since slots within a |
| // group are filled in order, then if there have been no |
| // deletions, a match will allow skipping past all empty slots |
| // at once. |
| // |
| // Note: it is tempting to cache the group match result in the |
| // iterator to use across Next calls. However because entries |
| // may be deleted between calls, later calls would still need to |
| // double-check the control value. |
| |
| var groupMatch bitset |
| for it.entryIdx <= entryMask { |
| entryIdx := (it.entryIdx + it.entryOffset) & entryMask |
| slotIdx := uintptr(entryIdx & (abi.MapGroupSlots - 1)) |
| |
| if slotIdx == 0 || it.group.data == nil { |
| // Only compute the group (a) when we switch |
| // groups (slotIdx rolls over) and (b) on the |
| // first iteration in this table (slotIdx may |
| // not be zero due to entryOffset). |
| groupIdx := entryIdx >> abi.MapGroupSlotsBits |
| it.group = it.tab.groups.group(it.typ, groupIdx) |
| } |
| |
| if groupMatch == 0 { |
| groupMatch = it.group.ctrls().matchFull() |
| |
| if slotIdx != 0 { |
| // Starting in the middle of the group. |
| // Ignore earlier slots. |
| groupMatch = groupMatch.removeBelow(slotIdx) |
| } |
| |
| // Skip over groups that are composed of only empty or |
| // deleted slots. |
| if groupMatch == 0 { |
| // Jump past remaining slots in this |
| // group. |
| it.entryIdx += abi.MapGroupSlots - uint64(slotIdx) |
| continue |
| } |
| |
| i := groupMatch.first() |
| it.entryIdx += uint64(i - slotIdx) |
| if it.entryIdx > entryMask { |
| // Past the end of this table's iteration. |
| continue |
| } |
| entryIdx += uint64(i - slotIdx) |
| slotIdx = i |
| } |
| |
| key := it.group.key(it.typ, slotIdx) |
| if it.typ.IndirectKey() { |
| key = *((*unsafe.Pointer)(key)) |
| } |
| |
| // If the table has changed since the last |
| // call, then it has grown or split. In this |
| // case, further mutations (changes to |
| // key->elem or deletions) will not be visible |
| // in our snapshot table. Instead we must |
| // consult the new table by doing a full |
| // lookup. |
| // |
| // We still use our old table to decide which |
| // keys to lookup in order to avoid returning |
| // the same key twice. |
| grown := it.tab.index == -1 |
| var elem unsafe.Pointer |
| if grown { |
| newKey, newElem, ok := it.grownKeyElem(key, slotIdx) |
| if !ok { |
| // This entry doesn't exist anymore. |
| // Continue to the next one. |
| groupMatch = groupMatch.removeFirst() |
| if groupMatch == 0 { |
| // No more entries in this |
| // group. Continue to next |
| // group. |
| it.entryIdx += abi.MapGroupSlots - uint64(slotIdx) |
| continue |
| } |
| |
| // Next full slot. |
| i := groupMatch.first() |
| it.entryIdx += uint64(i - slotIdx) |
| continue |
| } else { |
| key = newKey |
| elem = newElem |
| } |
| } else { |
| elem = it.group.elem(it.typ, slotIdx) |
| if it.typ.IndirectElem() { |
| elem = *((*unsafe.Pointer)(elem)) |
| } |
| } |
| |
| // Jump ahead to the next full slot or next group. |
| groupMatch = groupMatch.removeFirst() |
| if groupMatch == 0 { |
| // No more entries in this group. |
| // Continue to the next group. |
| it.entryIdx += abi.MapGroupSlots - uint64(slotIdx) |
| } else { |
| // Next full slot. |
| i := groupMatch.first() |
| it.entryIdx += uint64(i - slotIdx) |
| } |
| |
| it.key = key |
| it.elem = elem |
| return |
| } |
| |
| // Continue to next table. |
| } |
| |
| it.key = nil |
| it.elem = nil |
| return |
| } |
| |
| // rehash replaces the table with one larger table or two split tables to fit |
| // more entries. Since the table is replaced, t is now stale and should not be |
| // modified. |
| func (t *table) rehash(typ *abi.MapType, m *Map) { |
| // TODO(prattmic): SwissTables typically perform a "rehash in place" |
| // operation which recovers capacity consumed by tombstones without growing |
| // the table by reordering slots as necessary to maintain the probe |
| // invariant while eliminating all tombstones. |
| // |
| // However, it is unclear how to make rehash in place work with |
| // iteration. Since iteration simply walks through all slots in order |
| // (with random start offset), reordering the slots would break |
| // iteration. |
| // |
| // As an alternative, we could do a "resize" to new groups allocation |
| // of the same size. This would eliminate the tombstones, but using a |
| // new allocation, so the existing grow support in iteration would |
| // continue to work. |
| |
| newCapacity := 2 * t.capacity |
| if newCapacity <= maxTableCapacity { |
| t.grow(typ, m, newCapacity) |
| return |
| } |
| |
| t.split(typ, m) |
| } |
| |
| // localDepthMask returns a bitmask for the last selection bit at this depth. |
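| // |
| // For example, on a 64-bit platform localDepth 1 yields 1<<63 (the topmost |
| // hash bit) and localDepth 2 yields 1<<62: the lowest bit of the hash prefix |
| // consulted by the directory at that depth. |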
| func localDepthMask(localDepth uint8) uintptr { |
| if goarch.PtrSize == 4 { |
| return uintptr(1) << (32 - localDepth) |
| } |
| return uintptr(1) << (64 - localDepth) |
| } |
| |
| // split the table into two, installing the new tables in the map directory. |
| func (t *table) split(typ *abi.MapType, m *Map) { |
| localDepth := t.localDepth |
| localDepth++ |
| |
| // TODO: is this the best capacity? |
| left := newTable(typ, maxTableCapacity, -1, localDepth) |
| right := newTable(typ, maxTableCapacity, -1, localDepth) |
| |
| // Split in half at the localDepth bit from the top. |
| mask := localDepthMask(localDepth) |
| |
| for i := uint64(0); i <= t.groups.lengthMask; i++ { |
| g := t.groups.group(typ, i) |
| for j := uintptr(0); j < abi.MapGroupSlots; j++ { |
| if (g.ctrls().get(j) & ctrlEmpty) == ctrlEmpty { |
| // Empty or deleted |
| continue |
| } |
| |
| key := g.key(typ, j) |
| if typ.IndirectKey() { |
| key = *((*unsafe.Pointer)(key)) |
| } |
| |
| elem := g.elem(typ, j) |
| if typ.IndirectElem() { |
| elem = *((*unsafe.Pointer)(elem)) |
| } |
| |
| hash := typ.Hasher(key, m.seed) |
| var newTable *table |
| if hash&mask == 0 { |
| newTable = left |
| } else { |
| newTable = right |
| } |
| newTable.uncheckedPutSlot(typ, hash, key, elem) |
| } |
| } |
| |
| m.installTableSplit(t, left, right) |
| t.index = -1 |
| } |
| |
| // grow the capacity of the table by allocating a new table with a bigger array |
| // and uncheckedPutting each element of the table into the new table (we know |
| // that no insertion here will Put an already-present value), and discard the |
| // old table. |
| func (t *table) grow(typ *abi.MapType, m *Map, newCapacity uint16) { |
| newTable := newTable(typ, uint64(newCapacity), t.index, t.localDepth) |
| |
| if t.capacity > 0 { |
| for i := uint64(0); i <= t.groups.lengthMask; i++ { |
| g := t.groups.group(typ, i) |
| for j := uintptr(0); j < abi.MapGroupSlots; j++ { |
| if (g.ctrls().get(j) & ctrlEmpty) == ctrlEmpty { |
| // Empty or deleted |
| continue |
| } |
| |
| key := g.key(typ, j) |
| if typ.IndirectKey() { |
| key = *((*unsafe.Pointer)(key)) |
| } |
| |
| elem := g.elem(typ, j) |
| if typ.IndirectElem() { |
| elem = *((*unsafe.Pointer)(elem)) |
| } |
| |
| hash := typ.Hasher(key, m.seed) |
| |
| newTable.uncheckedPutSlot(typ, hash, key, elem) |
| } |
| } |
| } |
| |
| newTable.checkInvariants(typ, m) |
| m.replaceTable(newTable) |
| t.index = -1 |
| } |
| |
| // probeSeq maintains the state for a probe sequence that iterates through the |
| // groups in a table. The sequence is a triangular progression of the form |
| // |
| // p(i) := (i^2 + i)/2 + hash (mod mask+1) |
| // |
| // The sequence effectively outputs the indexes of *groups*. The group |
| // machinery allows us to check an entire group with minimal branching. |
| // |
| // It turns out that this probe sequence visits every group exactly once if |
| // the number of groups is a power of two, since (i^2+i)/2 is a bijection in |
| // Z/(2^m). See https://en.wikipedia.org/wiki/Quadratic_probing |
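| // |
| // For example, with 8 groups (mask == 7) and starting offset h, the visited |
| // group offsets are |
| // |
| //	h, h+1, h+3, h+6, h+2, h+7, h+5, h+4 (mod 8) |
| // |
| // touching each of the 8 groups exactly once. |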
| type probeSeq struct { |
| mask uint64 |
| offset uint64 |
| index uint64 |
| } |
| |
| func makeProbeSeq(hash uintptr, mask uint64) probeSeq { |
| return probeSeq{ |
| mask: mask, |
| offset: uint64(hash) & mask, |
| index: 0, |
| } |
| } |
| |
| func (s probeSeq) next() probeSeq { |
| s.index++ |
| s.offset = (s.offset + s.index) & s.mask |
| return s |
| } |
| |
| func (t *table) clone(typ *abi.MapType) *table { |
| // Shallow copy the table structure. |
| t2 := new(table) |
| *t2 = *t |
| t = t2 |
| |
| // Deep copy only the groups data; everything else was copied above. |
| oldGroups := t.groups |
| newGroups := newGroups(typ, oldGroups.lengthMask+1) |
| for i := uint64(0); i <= oldGroups.lengthMask; i++ { |
| oldGroup := oldGroups.group(typ, i) |
| newGroup := newGroups.group(typ, i) |
| cloneGroup(typ, newGroup, oldGroup) |
| } |
| t.groups = newGroups |
| |
| return t |
| } |