src/cmd/compile/internal/ssa/poset.go - go - Git at Google

 // Copyright 2018 The Go Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.

 package ssa

 import (
 	"fmt"
 	"os"
 )

 // If true, check poset integrity after every mutation
 var debugPoset = false

 const uintSize = 32 << (^uint(0) >> 32 & 1) // 32 or 64

 // bitset is a bit array for dense indexes.
 type bitset []uint

 func newBitset(n int) bitset {
 	return make(bitset, (n+uintSize-1)/uintSize)
 }

 func (bs bitset) Reset() {
 	for i := range bs {
 		bs[i] = 0
 	}
 }

 func (bs bitset) Set(idx uint32) {
 	bs[idx/uintSize] |= 1 << (idx % uintSize)
 }

 func (bs bitset) Clear(idx uint32) {
 	bs[idx/uintSize] &^= 1 << (idx % uintSize)
 }

 func (bs bitset) Test(idx uint32) bool {
 	return bs[idx/uintSize]&(1<<(idx%uintSize)) != 0
 }

 type undoType uint8

 const (
 	undoInvalid     undoType = iota
 	undoCheckpoint           // a checkpoint to group undo passes
 	undoSetChl               // change back left child of undo.idx to undo.edge
 	undoSetChr               // change back right child of undo.idx to undo.edge
 	undoNonEqual             // forget that SSA value undo.ID is non-equal to undo.idx (another ID)
 	undoNewNode              // remove new node created for SSA value undo.ID
 	undoNewConstant          // remove the constant node idx from the constants map
 	undoAliasNode            // unalias SSA value undo.ID so that it points back to node index undo.idx
 	undoNewRoot              // remove node undo.idx from root list
 	undoChangeRoot           // remove node undo.idx from root list, and put back undo.edge.Target instead
 	undoMergeRoot            // remove node undo.idx from root list, and put back its children instead
 )

 // posetUndo represents an undo pass to be performed.
 // It's an union of fields that can be used to store information,
 // and typ is the discriminant, that specifies which kind
 // of operation must be performed. Not all fields are always used.
 type posetUndo struct {
 	typ  undoType
 	idx  uint32
 	ID   ID
 	edge posetEdge
 }

 const (
 	// Make poset handle constants as unsigned numbers.
 	posetFlagUnsigned = 1 << iota
 )

 // A poset edge. The zero value is the null/empty edge.
 // Packs target node index (31 bits) and strict flag (1 bit).
 type posetEdge uint32

 func newedge(t uint32, strict bool) posetEdge {
 	s := uint32(0)
 	if strict {
 		s = 1
 	}
 	return posetEdge(t<<1 | s)
 }
 func (e posetEdge) Target() uint32 { return uint32(e) >> 1 }
 func (e posetEdge) Strict() bool   { return uint32(e)&1 != 0 }
 func (e posetEdge) String() string {
 	s := fmt.Sprint(e.Target())
 	if e.Strict() {
 		s += "*"
 	}
 	return s
 }

 // posetNode is a node of a DAG within the poset.
 type posetNode struct {
 	l, r posetEdge
 }

 // poset is a union-find data structure that can represent a partially ordered set
 // of SSA values. Given a binary relation that creates a partial order (eg: '<'),
 // clients can record relations between SSA values using SetOrder, and later
 // check relations (in the transitive closure) with Ordered. For instance,
 // if SetOrder is called to record that A<B and B<C, Ordered will later confirm
 // that A<C.
 //
 // It is possible to record equality relations between SSA values with SetEqual and check
 // equality with Equal. Equality propagates into the transitive closure for the partial
 // order so that if we know that A<B<C and later learn that A==D, Ordered will return
 // true for D<C.
 //
 // It is also possible to record inequality relations between nodes with SetNonEqual;
 // non-equality relations are not transitive, but they can still be useful: for instance
 // if we know that A<=B and later we learn that A!=B, we can deduce that A<B.
 // NonEqual can be used to check whether it is known that the nodes are different, either
 // because SetNonEqual was called before, or because we know that they are strictly ordered.
 //
 // poset will refuse to record new relations that contradict existing relations:
 // for instance if A<B<C, calling SetOrder for C<A will fail returning false; also
 // calling SetEqual for C==A will fail.
 //
 // poset is implemented as a forest of DAGs; in each DAG, if there is a path (directed)
 // from node A to B, it means that A<B (or A<=B). Equality is represented by mapping
 // two SSA values to the same DAG node; when a new equality relation is recorded
 // between two existing nodes,the nodes are merged, adjusting incoming and outgoing edges.
 //
 // Constants are specially treated. When a constant is added to the poset, it is
 // immediately linked to other constants already present; so for instance if the
 // poset knows that x<=3, and then x is tested against 5, 5 is first added and linked
 // 3 (using 3<5), so that the poset knows that x<=3<5; at that point, it is able
 // to answer x<5 correctly. This means that all constants are always within the same
 // DAG; as an implementation detail, we enfoce that the DAG containtining the constants
 // is always the first in the forest.
 //
 // poset is designed to be memory efficient and do little allocations during normal usage.
 // Most internal data structures are pre-allocated and flat, so for instance adding a
 // new relation does not cause any allocation. For performance reasons,
 // each node has only up to two outgoing edges (like a binary tree), so intermediate
 // "dummy" nodes are required to represent more than two relations. For instance,
 // to record that A<I, A<J, A<K (with no known relation between I,J,K), we create the
 // following DAG:
 //
 //         A
 //        / \
 //       I  dummy
 //           /  \
 //          J    K
 //
 type poset struct {
 	lastidx   uint32            // last generated dense index
 	flags     uint8             // internal flags
 	values    map[ID]uint32     // map SSA values to dense indexes
 	constants map[int64]uint32  // record SSA constants together with their value
 	nodes     []posetNode       // nodes (in all DAGs)
 	roots     []uint32          // list of root nodes (forest)
 	noneq     map[uint32]bitset // non-equal relations
 	undo      []posetUndo       // undo chain
 }

 func newPoset() *poset {
 	return &poset{
 		values:    make(map[ID]uint32),
 		constants: make(map[int64]uint32, 8),
 		nodes:     make([]posetNode, 1, 16),
 		roots:     make([]uint32, 0, 4),
 		noneq:     make(map[uint32]bitset),
 		undo:      make([]posetUndo, 0, 4),
 	}
 }

 func (po *poset) SetUnsigned(uns bool) {
 	if uns {
 		po.flags |= posetFlagUnsigned
 	} else {
 		po.flags &^= posetFlagUnsigned
 	}
 }

 // Handle children
 func (po *poset) setchl(i uint32, l posetEdge) { po.nodes[i].l = l }
 func (po *poset) setchr(i uint32, r posetEdge) { po.nodes[i].r = r }
 func (po *poset) chl(i uint32) uint32          { return po.nodes[i].l.Target() }
 func (po *poset) chr(i uint32) uint32          { return po.nodes[i].r.Target() }
 func (po *poset) children(i uint32) (posetEdge, posetEdge) {
 	return po.nodes[i].l, po.nodes[i].r
 }

 // upush records a new undo step. It can be used for simple
 // undo passes that record up to one index and one edge.
 func (po *poset) upush(typ undoType, p uint32, e posetEdge) {
 	po.undo = append(po.undo, posetUndo{typ: typ, idx: p, edge: e})
 }

 // upushnew pushes an undo pass for a new node
 func (po *poset) upushnew(id ID, idx uint32) {
 	po.undo = append(po.undo, posetUndo{typ: undoNewNode, ID: id, idx: idx})
 }

 // upushneq pushes a new undo pass for a nonequal relation
 func (po *poset) upushneq(idx1 uint32, idx2 uint32) {
 	po.undo = append(po.undo, posetUndo{typ: undoNonEqual, ID: ID(idx1), idx: idx2})
 }

 // upushalias pushes a new undo pass for aliasing two nodes
 func (po *poset) upushalias(id ID, i2 uint32) {
 	po.undo = append(po.undo, posetUndo{typ: undoAliasNode, ID: id, idx: i2})
 }

 // upushconst pushes a new undo pass for a new constant
 func (po *poset) upushconst(idx uint32, old uint32) {
 	po.undo = append(po.undo, posetUndo{typ: undoNewConstant, idx: idx, ID: ID(old)})
 }

 // addchild adds i2 as direct child of i1.
 func (po *poset) addchild(i1, i2 uint32, strict bool) {
 	i1l, i1r := po.children(i1)
 	e2 := newedge(i2, strict)

 	if i1l == 0 {
 		po.setchl(i1, e2)
 		po.upush(undoSetChl, i1, 0)
 	} else if i1r == 0 {
 		po.setchr(i1, e2)
 		po.upush(undoSetChr, i1, 0)
 	} else {
 		// If n1 already has two children, add an intermediate dummy
 		// node to record the relation correctly (without relating
 		// n2 to other existing nodes). Use a non-deterministic value
 		// to decide whether to append on the left or the right, to avoid
 		// creating degenerated chains.
 		//
 		//      n1
 		//     /  \
 		//   i1l  dummy
 		//        /   \
 		//      i1r   n2
 		//
 		dummy := po.newnode(nil)
 		if (i1^i2)&1 != 0 { // non-deterministic
 			po.setchl(dummy, i1r)
 			po.setchr(dummy, e2)
 			po.setchr(i1, newedge(dummy, false))
 			po.upush(undoSetChr, i1, i1r)
 		} else {
 			po.setchl(dummy, i1l)
 			po.setchr(dummy, e2)
 			po.setchl(i1, newedge(dummy, false))
 			po.upush(undoSetChl, i1, i1l)
 		}
 	}
 }

 // newnode allocates a new node bound to SSA value n.
 // If n is nil, this is a dummy node (= only used internally).
 func (po *poset) newnode(n *Value) uint32 {
 	i := po.lastidx + 1
 	po.lastidx++
 	po.nodes = append(po.nodes, posetNode{})
 	if n != nil {
 		if po.values[n.ID] != 0 {
 			panic("newnode for Value already inserted")
 		}
 		po.values[n.ID] = i
 		po.upushnew(n.ID, i)
 	} else {
 		po.upushnew(0, i)
 	}
 	return i
 }

 // lookup searches for a SSA value into the forest of DAGS, and return its node.
 // Constants are materialized on the fly during lookup.
 func (po *poset) lookup(n *Value) (uint32, bool) {
 	i, f := po.values[n.ID]
 	if !f && n.isGenericIntConst() {
 		po.newconst(n)
 		i, f = po.values[n.ID]
 	}
 	return i, f
 }

 // newconst creates a node for a constant. It links it to other constants, so
 // that n<=5 is detected true when n<=3 is known to be true.
 // TODO: this is O(N), fix it.
 func (po *poset) newconst(n *Value) {
 	if !n.isGenericIntConst() {
 		panic("newconst on non-constant")
 	}

 	// If the same constant is already present in the poset through a different
 	// Value, just alias to it without allocating a new node.
 	val := n.AuxInt
 	if po.flags&posetFlagUnsigned != 0 {
 		val = int64(n.AuxUnsigned())
 	}
 	if c, found := po.constants[val]; found {
 		po.values[n.ID] = c
 		po.upushalias(n.ID, 0)
 		return
 	}

 	// Create the new node for this constant
 	i := po.newnode(n)

 	// If this is the first constant, put it as a new root, as
 	// we can't record an existing connection so we don't have
 	// a specific DAG to add it to. Notice that we want all
 	// constants to be in root #0, so make sure the new root
 	// goes there.
 	if len(po.constants) == 0 {
 		idx := len(po.roots)
 		po.roots = append(po.roots, i)
 		po.roots[0], po.roots[idx] = po.roots[idx], po.roots[0]
 		po.upush(undoNewRoot, i, 0)
 		po.constants[val] = i
 		po.upushconst(i, 0)
 		return
 	}

 	// Find the lower and upper bound among existing constants. That is,
 	// find the higher constant that is lower than the one that we're adding,
 	// and the lower constant that is higher.
 	// The loop is duplicated to handle signed and unsigned comparison,
 	// depending on how the poset was configured.
 	var lowerptr, higherptr uint32

 	if po.flags&posetFlagUnsigned != 0 {
 		var lower, higher uint64
 		val1 := n.AuxUnsigned()
 		for val2, ptr := range po.constants {
 			val2 := uint64(val2)
 			if val1 == val2 {
 				panic("unreachable")
 			}
 			if val2 < val1 && (lowerptr == 0 || val2 > lower) {
 				lower = val2
 				lowerptr = ptr
 			} else if val2 > val1 && (higherptr == 0 || val2 < higher) {
 				higher = val2
 				higherptr = ptr
 			}
 		}
 	} else {
 		var lower, higher int64
 		val1 := n.AuxInt
 		for val2, ptr := range po.constants {
 			if val1 == val2 {
 				panic("unreachable")
 			}
 			if val2 < val1 && (lowerptr == 0 || val2 > lower) {
 				lower = val2
 				lowerptr = ptr
 			} else if val2 > val1 && (higherptr == 0 || val2 < higher) {
 				higher = val2
 				higherptr = ptr
 			}
 		}
 	}

 	if lowerptr == 0 && higherptr == 0 {
 		// This should not happen, as at least one
 		// other constant must exist if we get here.
 		panic("no constant found")
 	}

 	// Create the new node and connect it to the bounds, so that
 	// lower < n < higher. We could have found both bounds or only one
 	// of them, depending on what other constants are present in the poset.
 	// Notice that we always link constants together, so they
 	// are always part of the same DAG.
 	switch {
 	case lowerptr != 0 && higherptr != 0:
 		// Both bounds are present, record lower < n < higher.
 		po.addchild(lowerptr, i, true)
 		po.addchild(i, higherptr, true)

 	case lowerptr != 0:
 		// Lower bound only, record lower < n.
 		po.addchild(lowerptr, i, true)

 	case higherptr != 0:
 		// Higher bound only. To record n < higher, we need
 		// a dummy root:
 		//
 		//        dummy
 		//        /   \
 		//      root   \
 		//       /      n
 		//     ....    /
 		//       \    /
 		//       higher
 		//
 		i2 := higherptr
 		r2 := po.findroot(i2)
 		if r2 != po.roots[0] { // all constants should be in root #0
 			panic("constant not in root #0")
 		}
 		dummy := po.newnode(nil)
 		po.changeroot(r2, dummy)
 		po.upush(undoChangeRoot, dummy, newedge(r2, false))
 		po.addchild(dummy, r2, false)
 		po.addchild(dummy, i, false)
 		po.addchild(i, i2, true)
 	}

 	po.constants[val] = i
 	po.upushconst(i, 0)
 }

 // aliasnewnode records that a single node n2 (not in the poset yet) is an alias
 // of the master node n1.
 func (po *poset) aliasnewnode(n1, n2 *Value) {
 	i1, i2 := po.values[n1.ID], po.values[n2.ID]
 	if i1 == 0 || i2 != 0 {
 		panic("aliasnewnode invalid arguments")
 	}

 	po.values[n2.ID] = i1
 	po.upushalias(n2.ID, 0)
 }

 // aliasnodes records that all the nodes i2s are aliases of a single master node n1.
 // aliasnodes takes care of rearranging the DAG, changing references of parent/children
 // of nodes in i2s, so that they point to n1 instead.
 // Complexity is O(n) (with n being the total number of nodes in the poset, not just
 // the number of nodes being aliased).
 func (po *poset) aliasnodes(n1 *Value, i2s bitset) {
 	i1 := po.values[n1.ID]
 	if i1 == 0 {
 		panic("aliasnode for non-existing node")
 	}
 	if i2s.Test(i1) {
 		panic("aliasnode i2s contains n1 node")
 	}

 	// Go through all the nodes to adjust parent/chidlren of nodes in i2s
 	for idx, n := range po.nodes {
 		// Do not touch i1 itself, otherwise we can create useless self-loops
 		if uint32(idx) == i1 {
 			continue
 		}
 		l, r := n.l, n.r

 		// Rename all references to i2s into i1
 		if i2s.Test(l.Target()) {
 			po.setchl(uint32(idx), newedge(i1, l.Strict()))
 			po.upush(undoSetChl, uint32(idx), l)
 		}
 		if i2s.Test(r.Target()) {
 			po.setchr(uint32(idx), newedge(i1, r.Strict()))
 			po.upush(undoSetChr, uint32(idx), r)
 		}

 		// Connect all chidren of i2s to i1 (unless those children
 		// are in i2s as well, in which case it would be useless)
 		if i2s.Test(uint32(idx)) {
 			if l != 0 && !i2s.Test(l.Target()) {
 				po.addchild(i1, l.Target(), l.Strict())
 			}
 			if r != 0 && !i2s.Test(r.Target()) {
 				po.addchild(i1, r.Target(), r.Strict())
 			}
 			po.setchl(uint32(idx), 0)
 			po.setchr(uint32(idx), 0)
 			po.upush(undoSetChl, uint32(idx), l)
 			po.upush(undoSetChr, uint32(idx), r)
 		}
 	}

 	// Reassign all existing IDs that point to i2 to i1.
 	// This includes n2.ID.
 	for k, v := range po.values {
 		if i2s.Test(v) {
 			po.values[k] = i1
 			po.upushalias(k, v)
 		}
 	}

 	// If one of the aliased nodes is a constant, then make sure
 	// po.constants is updated to point to the master node.
 	for val, idx := range po.constants {
 		if i2s.Test(idx) {
 			po.constants[val] = i1
 			po.upushconst(i1, idx)
 		}
 	}
 }

 func (po *poset) isroot(r uint32) bool {
 	for i := range po.roots {
 		if po.roots[i] == r {
 			return true
 		}
 	}
 	return false
 }

 func (po *poset) changeroot(oldr, newr uint32) {
 	for i := range po.roots {
 		if po.roots[i] == oldr {
 			po.roots[i] = newr
 			return
 		}
 	}
 	panic("changeroot on non-root")
 }

 func (po *poset) removeroot(r uint32) {
 	for i := range po.roots {
 		if po.roots[i] == r {
 			po.roots = append(po.roots[:i], po.roots[i+1:]...)
 			return
 		}
 	}
 	panic("removeroot on non-root")
 }

 // dfs performs a depth-first search within the DAG whose root is r.
 // f is the visit function called for each node; if it returns true,
 // the search is aborted and true is returned. The root node is
 // visited too.
 // If strict, ignore edges across a path until at least one
 // strict edge is found. For instance, for a chain A<=B<=C<D<=E<F,
 // a strict walk visits D,E,F.
 // If the visit ends, false is returned.
 func (po *poset) dfs(r uint32, strict bool, f func(i uint32) bool) bool {
 	closed := newBitset(int(po.lastidx + 1))
 	open := make([]uint32, 1, 64)
 	open[0] = r

 	if strict {
 		// Do a first DFS; walk all paths and stop when we find a strict
 		// edge, building a "next" list of nodes reachable through strict
 		// edges. This will be the bootstrap open list for the real DFS.
 		next := make([]uint32, 0, 64)

 		for len(open) > 0 {
 			i := open[len(open)-1]
 			open = open[:len(open)-1]

 			// Don't visit the same node twice. Notice that all nodes
 			// across non-strict paths are still visited at least once, so
 			// a non-strict path can never obscure a strict path to the
 			// same node.
 			if !closed.Test(i) {
 				closed.Set(i)

 				l, r := po.children(i)
 				if l != 0 {
 					if l.Strict() {
 						next = append(next, l.Target())
 					} else {
 						open = append(open, l.Target())
 					}
 				}
 				if r != 0 {
 					if r.Strict() {
 						next = append(next, r.Target())
 					} else {
 						open = append(open, r.Target())
 					}
 				}
 			}
 		}
 		open = next
 		closed.Reset()
 	}

 	for len(open) > 0 {
 		i := open[len(open)-1]
 		open = open[:len(open)-1]

 		if !closed.Test(i) {
 			if f(i) {
 				return true
 			}
 			closed.Set(i)
 			l, r := po.children(i)
 			if l != 0 {
 				open = append(open, l.Target())
 			}
 			if r != 0 {
 				open = append(open, r.Target())
 			}
 		}
 	}
 	return false
 }

 // Returns true if there is a path from i1 to i2.
 // If strict ==  true: if the function returns true, then i1 <  i2.
 // If strict == false: if the function returns true, then i1 <= i2.
 // If the function returns false, no relation is known.
 func (po *poset) reaches(i1, i2 uint32, strict bool) bool {
 	return po.dfs(i1, strict, func(n uint32) bool {
 		return n == i2
 	})
 }

 // findroot finds i's root, that is which DAG contains i.
 // Returns the root; if i is itself a root, it is returned.
 // Panic if i is not in any DAG.
 func (po *poset) findroot(i uint32) uint32 {
 	// TODO(rasky): if needed, a way to speed up this search is
 	// storing a bitset for each root using it as a mini bloom filter
 	// of nodes present under that root.
 	for _, r := range po.roots {
 		if po.reaches(r, i, false) {
 			return r
 		}
 	}
 	panic("findroot didn't find any root")
 }

 // mergeroot merges two DAGs into one DAG by creating a new dummy root
 func (po *poset) mergeroot(r1, r2 uint32) uint32 {
 	// Root #0 is special as it contains all constants. Since mergeroot
 	// discards r2 as root and keeps r1, make sure that r2 is not root #0,
 	// otherwise constants would move to a different root.
 	if r2 == po.roots[0] {
 		r1, r2 = r2, r1
 	}
 	r := po.newnode(nil)
 	po.setchl(r, newedge(r1, false))
 	po.setchr(r, newedge(r2, false))
 	po.changeroot(r1, r)
 	po.removeroot(r2)
 	po.upush(undoMergeRoot, r, 0)
 	return r
 }

 // collapsepath marks n1 and n2 as equal and collapses as equal all
 // nodes across all paths between n1 and n2. If a strict edge is
 // found, the function does not modify the DAG and returns false.
 // Complexity is O(n).
 func (po *poset) collapsepath(n1, n2 *Value) bool {
 	i1, i2 := po.values[n1.ID], po.values[n2.ID]
 	if po.reaches(i1, i2, true) {
 		return false
 	}

 	// Find all the paths from i1 to i2
 	paths := po.findpaths(i1, i2)
 	// Mark all nodes in all the paths as aliases of n1
 	// (excluding n1 itself)
 	paths.Clear(i1)
 	po.aliasnodes(n1, paths)
 	return true
 }

 // findpaths is a recursive function that calculates all paths from cur to dst
 // and return them as a bitset (the index of a node is set in the bitset if
 // that node is on at least one path from cur to dst).
 // We do a DFS from cur (stopping going deep any time we reach dst, if ever),
 // and mark as part of the paths any node that has a children which is already
 // part of the path (or is dst itself).
 func (po *poset) findpaths(cur, dst uint32) bitset {
 	seen := newBitset(int(po.lastidx + 1))
 	path := newBitset(int(po.lastidx + 1))
 	path.Set(dst)
 	po.findpaths1(cur, dst, seen, path)
 	return path
 }

 func (po *poset) findpaths1(cur, dst uint32, seen bitset, path bitset) {
 	if cur == dst {
 		return
 	}
 	seen.Set(cur)
 	l, r := po.chl(cur), po.chr(cur)
 	if !seen.Test(l) {
 		po.findpaths1(l, dst, seen, path)
 	}
 	if !seen.Test(r) {
 		po.findpaths1(r, dst, seen, path)
 	}
 	if path.Test(l) || path.Test(r) {
 		path.Set(cur)
 	}
 }

 // Check whether it is recorded that i1!=i2
 func (po *poset) isnoneq(i1, i2 uint32) bool {
 	if i1 == i2 {
 		return false
 	}
 	if i1 < i2 {
 		i1, i2 = i2, i1
 	}

 	// Check if we recorded a non-equal relation before
 	if bs, ok := po.noneq[i1]; ok && bs.Test(i2) {
 		return true
 	}
 	return false
 }

 // Record that i1!=i2
 func (po *poset) setnoneq(n1, n2 *Value) {
 	i1, f1 := po.lookup(n1)
 	i2, f2 := po.lookup(n2)

 	// If any of the nodes do not exist in the poset, allocate them. Since
 	// we don't know any relation (in the partial order) about them, they must
 	// become independent roots.
 	if !f1 {
 		i1 = po.newnode(n1)
 		po.roots = append(po.roots, i1)
 		po.upush(undoNewRoot, i1, 0)
 	}
 	if !f2 {
 		i2 = po.newnode(n2)
 		po.roots = append(po.roots, i2)
 		po.upush(undoNewRoot, i2, 0)
 	}

 	if i1 == i2 {
 		panic("setnoneq on same node")
 	}
 	if i1 < i2 {
 		i1, i2 = i2, i1
 	}
 	bs := po.noneq[i1]
 	if bs == nil {
 		// Given that we record non-equality relations using the
 		// higher index as a key, the bitsize will never change size.
 		// TODO(rasky): if memory is a problem, consider allocating
 		// a small bitset and lazily grow it when higher indices arrive.
 		bs = newBitset(int(i1))
 		po.noneq[i1] = bs
 	} else if bs.Test(i2) {
 		// Already recorded
 		return
 	}
 	bs.Set(i2)
 	po.upushneq(i1, i2)
 }

 // CheckIntegrity verifies internal integrity of a poset. It is intended
 // for debugging purposes.
 func (po *poset) CheckIntegrity() {
 	// Record which index is a constant
 	constants := newBitset(int(po.lastidx + 1))
 	for _, c := range po.constants {
 		constants.Set(c)
 	}

 	// Verify that each node appears in a single DAG, and that
 	// all constants are within the first DAG
 	seen := newBitset(int(po.lastidx + 1))
 	for ridx, r := range po.roots {
 		if r == 0 {
 			panic("empty root")
 		}

 		po.dfs(r, false, func(i uint32) bool {
 			if seen.Test(i) {
 				panic("duplicate node")
 			}
 			seen.Set(i)
 			if constants.Test(i) {
 				if ridx != 0 {
 					panic("constants not in the first DAG")
 				}
 			}
 			return false
 		})
 	}

 	// Verify that values contain the minimum set
 	for id, idx := range po.values {
 		if !seen.Test(idx) {
 			panic(fmt.Errorf("spurious value [%d]=%d", id, idx))
 		}
 	}

 	// Verify that only existing nodes have non-zero children
 	for i, n := range po.nodes {
 		if n.l|n.r != 0 {
 			if !seen.Test(uint32(i)) {
 				panic(fmt.Errorf("children of unknown node %d->%v", i, n))
 			}
 			if n.l.Target() == uint32(i) || n.r.Target() == uint32(i) {
 				panic(fmt.Errorf("self-loop on node %d", i))
 			}
 		}
 	}
 }

 // CheckEmpty checks that a poset is completely empty.
 // It can be used for debugging purposes, as a poset is supposed to
 // be empty after it's fully rolled back through Undo.
 func (po *poset) CheckEmpty() error {
 	if len(po.nodes) != 1 {
 		return fmt.Errorf("non-empty nodes list: %v", po.nodes)
 	}
 	if len(po.values) != 0 {
 		return fmt.Errorf("non-empty value map: %v", po.values)
 	}
 	if len(po.roots) != 0 {
 		return fmt.Errorf("non-empty root list: %v", po.roots)
 	}
 	if len(po.constants) != 0 {
 		return fmt.Errorf("non-empty constants: %v", po.constants)
 	}
 	if len(po.undo) != 0 {
 		return fmt.Errorf("non-empty undo list: %v", po.undo)
 	}
 	if po.lastidx != 0 {
 		return fmt.Errorf("lastidx index is not zero: %v", po.lastidx)
 	}
 	for _, bs := range po.noneq {
 		for _, x := range bs {
 			if x != 0 {
 				return fmt.Errorf("non-empty noneq map")
 			}
 		}
 	}
 	return nil
 }

 // DotDump dumps the poset in graphviz format to file fn, with the specified title.
 func (po *poset) DotDump(fn string, title string) error {
 	f, err := os.Create(fn)
 	if err != nil {
 		return err
 	}
 	defer f.Close()

 	// Create reverse index mapping (taking aliases into account)
 	names := make(map[uint32]string)
 	for id, i := range po.values {
 		s := names[i]
 		if s == "" {
 			s = fmt.Sprintf("v%d", id)
 		} else {
 			s += fmt.Sprintf(", v%d", id)
 		}
 		names[i] = s
 	}

 	// Create reverse constant mapping
 	consts := make(map[uint32]int64)
 	for val, idx := range po.constants {
 		consts[idx] = val
 	}

 	fmt.Fprintf(f, "digraph poset {\n")
 	fmt.Fprintf(f, "\tedge [ fontsize=10 ]\n")
 	for ridx, r := range po.roots {
 		fmt.Fprintf(f, "\tsubgraph root%d {\n", ridx)
 		po.dfs(r, false, func(i uint32) bool {
 			if val, ok := consts[i]; ok {
 				// Constant
 				var vals string
 				if po.flags&posetFlagUnsigned != 0 {
 					vals = fmt.Sprint(uint64(val))
 				} else {
 					vals = fmt.Sprint(int64(val))
 				}
 				fmt.Fprintf(f, "\t\tnode%d [shape=box style=filled fillcolor=cadetblue1 label=<%s <font point-size=\"6\">%s [%d]</font>>]\n",
 					i, vals, names[i], i)
 			} else {
 				// Normal SSA value
 				fmt.Fprintf(f, "\t\tnode%d [label=<%s <font point-size=\"6\">[%d]</font>>]\n", i, names[i], i)
 			}
 			chl, chr := po.children(i)
 			for _, ch := range []posetEdge{chl, chr} {
 				if ch != 0 {
 					if ch.Strict() {
 						fmt.Fprintf(f, "\t\tnode%d -> node%d [label=\" <\" color=\"red\"]\n", i, ch.Target())
 					} else {
 						fmt.Fprintf(f, "\t\tnode%d -> node%d [label=\" <=\" color=\"green\"]\n", i, ch.Target())
 					}
 				}
 			}
 			return false
 		})
 		fmt.Fprintf(f, "\t}\n")
 	}
 	fmt.Fprintf(f, "\tlabelloc=\"t\"\n")
 	fmt.Fprintf(f, "\tlabeldistance=\"3.0\"\n")
 	fmt.Fprintf(f, "\tlabel=%q\n", title)
 	fmt.Fprintf(f, "}\n")
 	return nil
 }

 // Ordered reports whether n1<n2. It returns false either when it is
 // certain that n1<n2 is false, or if there is not enough information
 // to tell.
 // Complexity is O(n).
 func (po *poset) Ordered(n1, n2 *Value) bool {
 	if debugPoset {
 		defer po.CheckIntegrity()
 	}
 	if n1.ID == n2.ID {
 		panic("should not call Ordered with n1==n2")
 	}

 	i1, f1 := po.lookup(n1)
 	i2, f2 := po.lookup(n2)
 	if !f1 || !f2 {
 		return false
 	}

 	return i1 != i2 && po.reaches(i1, i2, true)
 }

 // Ordered reports whether n1<=n2. It returns false either when it is
 // certain that n1<=n2 is false, or if there is not enough information
 // to tell.
 // Complexity is O(n).
 func (po *poset) OrderedOrEqual(n1, n2 *Value) bool {
 	if debugPoset {
 		defer po.CheckIntegrity()
 	}
 	if n1.ID == n2.ID {
 		panic("should not call Ordered with n1==n2")
 	}

 	i1, f1 := po.lookup(n1)
 	i2, f2 := po.lookup(n2)
 	if !f1 || !f2 {
 		return false
 	}

 	return i1 == i2 || po.reaches(i1, i2, false)
 }

 // Equal reports whether n1==n2. It returns false either when it is
 // certain that n1==n2 is false, or if there is not enough information
 // to tell.
 // Complexity is O(1).
 func (po *poset) Equal(n1, n2 *Value) bool {
 	if debugPoset {
 		defer po.CheckIntegrity()
 	}
 	if n1.ID == n2.ID {
 		panic("should not call Equal with n1==n2")
 	}

 	i1, f1 := po.lookup(n1)
 	i2, f2 := po.lookup(n2)
 	return f1 && f2 && i1 == i2
 }

 // NonEqual reports whether n1!=n2. It returns false either when it is
 // certain that n1!=n2 is false, or if there is not enough information
 // to tell.
 // Complexity is O(n) (because it internally calls Ordered to see if we
 // can infer n1!=n2 from n1<n2 or n2<n1).
 func (po *poset) NonEqual(n1, n2 *Value) bool {
 	if debugPoset {
 		defer po.CheckIntegrity()
 	}
 	if n1.ID == n2.ID {
 		panic("should not call NonEqual with n1==n2")
 	}

 	// If we never saw the nodes before, we don't
 	// have a recorded non-equality.
 	i1, f1 := po.lookup(n1)
 	i2, f2 := po.lookup(n2)
 	if !f1 || !f2 {
 		return false
 	}

 	// Check if we recored inequality
 	if po.isnoneq(i1, i2) {
 		return true
 	}

 	// Check if n1<n2 or n2<n1, in which case we can infer that n1!=n2
 	if po.Ordered(n1, n2) || po.Ordered(n2, n1) {
 		return true
 	}

 	return false
 }

 // setOrder records that n1<n2 or n1<=n2 (depending on strict). Returns false
 // if this is a contradiction.
 // Implements SetOrder() and SetOrderOrEqual()
 func (po *poset) setOrder(n1, n2 *Value, strict bool) bool {
 	i1, f1 := po.lookup(n1)
 	i2, f2 := po.lookup(n2)

 	switch {
 	case !f1 && !f2:
 		// Neither n1 nor n2 are in the poset, so they are not related
 		// in any way to existing nodes.
 		// Create a new DAG to record the relation.
 		i1, i2 = po.newnode(n1), po.newnode(n2)
 		po.roots = append(po.roots, i1)
 		po.upush(undoNewRoot, i1, 0)
 		po.addchild(i1, i2, strict)

 	case f1 && !f2:
 		// n1 is in one of the DAGs, while n2 is not. Add n2 as children
 		// of n1.
 		i2 = po.newnode(n2)
 		po.addchild(i1, i2, strict)

 	case !f1 && f2:
 		// n1 is not in any DAG but n2 is. If n2 is a root, we can put
 		// n1 in its place as a root; otherwise, we need to create a new
 		// dummy root to record the relation.
 		i1 = po.newnode(n1)

 		if po.isroot(i2) {
 			po.changeroot(i2, i1)
 			po.upush(undoChangeRoot, i1, newedge(i2, strict))
 			po.addchild(i1, i2, strict)
 			return true
 		}

 		// Search for i2's root; this requires a O(n) search on all
 		// DAGs
 		r := po.findroot(i2)

 		// Re-parent as follows:
 		//
 		//                  dummy
 		//     r            /   \
 		//      \   ===>   r    i1
 		//      i2          \   /
 		//                    i2
 		//
 		dummy := po.newnode(nil)
 		po.changeroot(r, dummy)
 		po.upush(undoChangeRoot, dummy, newedge(r, false))
 		po.addchild(dummy, r, false)
 		po.addchild(dummy, i1, false)
 		po.addchild(i1, i2, strict)

 	case f1 && f2:
 		// If the nodes are aliased, fail only if we're setting a strict order
 		// (that is, we cannot set n1<n2 if n1==n2).
 		if i1 == i2 {
 			return !strict
 		}

 		// If we are trying to record n1<=n2 but we learned that n1!=n2,
 		// record n1<n2, as it provides more information.
 		if !strict && po.isnoneq(i1, i2) {
 			strict = true
 		}

 		// Both n1 and n2 are in the poset. This is the complex part of the algorithm
 		// as we need to find many different cases and DAG shapes.

 		// Check if n1 somehow reaches n2
 		if po.reaches(i1, i2, false) {
 			// This is the table of all cases we need to handle:
 			//
 			//      DAG          New      Action
 			//      ---------------------------------------------------
 			// #1:  N1<=X<=N2 |  N1<=N2 | do nothing
 			// #2:  N1<=X<=N2 |  N1<N2  | add strict edge (N1<N2)
 			// #3:  N1<X<N2   |  N1<=N2 | do nothing (we already know more)
 			// #4:  N1<X<N2   |  N1<N2  | do nothing

 			// Check if we're in case #2
 			if strict && !po.reaches(i1, i2, true) {
 				po.addchild(i1, i2, true)
 				return true
 			}

 			// Case #1, #3 o #4: nothing to do
 			return true
 		}

 		// Check if n2 somehow reaches n1
 		if po.reaches(i2, i1, false) {
 			// This is the table of all cases we need to handle:
 			//
 			//      DAG           New      Action
 			//      ---------------------------------------------------
 			// #5:  N2<=X<=N1  |  N1<=N2 | collapse path (learn that N1=X=N2)
 			// #6:  N2<=X<=N1  |  N1<N2  | contradiction
 			// #7:  N2<X<N1    |  N1<=N2 | contradiction in the path
 			// #8:  N2<X<N1    |  N1<N2  | contradiction

 			if strict {
 				// Cases #6 and #8: contradiction
 				return false
 			}

 			// We're in case #5 or #7. Try to collapse path, and that will
 			// fail if it realizes that we are in case #7.
 			return po.collapsepath(n2, n1)
 		}

 		// We don't know of any existing relation between n1 and n2. They could
 		// be part of the same DAG or not.
 		// Find their roots to check whether they are in the same DAG.
 		r1, r2 := po.findroot(i1), po.findroot(i2)
 		if r1 != r2 {
 			// We need to merge the two DAGs to record a relation between the nodes
 			po.mergeroot(r1, r2)
 		}

 		// Connect n1 and n2
 		po.addchild(i1, i2, strict)
 	}

 	return true
 }

 // SetOrder records that n1<n2. Returns false if this is a contradiction
 // Complexity is O(1) if n2 was never seen before, or O(n) otherwise.
 func (po *poset) SetOrder(n1, n2 *Value) bool {
 	if debugPoset {
 		defer po.CheckIntegrity()
 	}
 	if n1.ID == n2.ID {
 		panic("should not call SetOrder with n1==n2")
 	}
 	return po.setOrder(n1, n2, true)
 }

 // SetOrderOrEqual records that n1<=n2. Returns false if this is a contradiction
 // Complexity is O(1) if n2 was never seen before, or O(n) otherwise.
 func (po *poset) SetOrderOrEqual(n1, n2 *Value) bool {
 	if debugPoset {
 		defer po.CheckIntegrity()
 	}
 	if n1.ID == n2.ID {
 		panic("should not call SetOrder with n1==n2")
 	}
 	return po.setOrder(n1, n2, false)
 }

 // SetEqual records that n1==n2. Returns false if this is a contradiction
 // (that is, if it is already recorded that n1<n2 or n2<n1).
 // Complexity is O(1) if n2 was never seen before, or O(n) otherwise.
 func (po *poset) SetEqual(n1, n2 *Value) bool {
 	if debugPoset {
 		defer po.CheckIntegrity()
 	}
 	if n1.ID == n2.ID {
 		panic("should not call Add with n1==n2")
 	}

 	i1, f1 := po.lookup(n1)
 	i2, f2 := po.lookup(n2)

 	switch {
 	case !f1 && !f2:
 		i1 = po.newnode(n1)
 		po.roots = append(po.roots, i1)
 		po.upush(undoNewRoot, i1, 0)
 		po.aliasnewnode(n1, n2)
 	case f1 && !f2:
 		po.aliasnewnode(n1, n2)
 	case !f1 && f2:
 		po.aliasnewnode(n2, n1)
 	case f1 && f2:
 		if i1 == i2 {
 			// Already aliased, ignore
 			return true
 		}

 		// If we recorded that n1!=n2, this is a contradiction.
 		if po.isnoneq(i1, i2) {
 			return false
 		}

 		// If we already knew that n1<=n2, we can collapse the path to
 		// record n1==n2 (and viceversa).
 		if po.reaches(i1, i2, false) {
 			return po.collapsepath(n1, n2)
 		}
 		if po.reaches(i2, i1, false) {
 			return po.collapsepath(n2, n1)
 		}

 		r1 := po.findroot(i1)
 		r2 := po.findroot(i2)
 		if r1 != r2 {
 			// Merge the two DAGs so we can record relations between the nodes
 			po.mergeroot(r1, r2)
 		}

 		// Set n2 as alias of n1. This will also update all the references
 		// to n2 to become references to n1
 		i2s := newBitset(int(po.lastidx) + 1)
 		i2s.Set(i2)
 		po.aliasnodes(n1, i2s)
 	}
 	return true
 }

 // SetNonEqual records that n1!=n2. Returns false if this is a contradiction
 // (that is, if it is already recorded that n1==n2).
 // Complexity is O(n).
 func (po *poset) SetNonEqual(n1, n2 *Value) bool {
 	if debugPoset {
 		defer po.CheckIntegrity()
 	}
 	if n1.ID == n2.ID {
 		panic("should not call SetNonEqual with n1==n2")
 	}

 	// Check whether the nodes are already in the poset
 	i1, f1 := po.lookup(n1)
 	i2, f2 := po.lookup(n2)

 	// If either node wasn't present, we just record the new relation
 	// and exit.
 	if !f1 || !f2 {
 		po.setnoneq(n1, n2)
 		return true
 	}

 	// See if we already know this, in which case there's nothing to do.
 	if po.isnoneq(i1, i2) {
 		return true
 	}

 	// Check if we're contradicting an existing equality relation
 	if po.Equal(n1, n2) {
 		return false
 	}

 	// Record non-equality
 	po.setnoneq(n1, n2)

 	// If we know that i1<=i2 but not i1<i2, learn that as we
 	// now know that they are not equal. Do the same for i2<=i1.
 	// Do this check only if both nodes were already in the DAG,
 	// otherwise there cannot be an existing relation.
 	if po.reaches(i1, i2, false) && !po.reaches(i1, i2, true) {
 		po.addchild(i1, i2, true)
 	}
 	if po.reaches(i2, i1, false) && !po.reaches(i2, i1, true) {
 		po.addchild(i2, i1, true)
 	}

 	return true
 }

 // Checkpoint saves the current state of the DAG so that it's possible
 // to later undo this state.
 // Complexity is O(1).
 func (po *poset) Checkpoint() {
 	po.undo = append(po.undo, posetUndo{typ: undoCheckpoint})
 }

 // Undo restores the state of the poset to the previous checkpoint.
 // Complexity depends on the type of operations that were performed
 // since the last checkpoint; each Set* operation creates an undo
 // pass which Undo has to revert with a worst-case complexity of O(n).
 func (po *poset) Undo() {
 	if len(po.undo) == 0 {
 		panic("empty undo stack")
 	}
 	if debugPoset {
 		defer po.CheckIntegrity()
 	}

 	for len(po.undo) > 0 {
 		pass := po.undo[len(po.undo)-1]
 		po.undo = po.undo[:len(po.undo)-1]

 		switch pass.typ {
 		case undoCheckpoint:
 			return

 		case undoSetChl:
 			po.setchl(pass.idx, pass.edge)

 		case undoSetChr:
 			po.setchr(pass.idx, pass.edge)

 		case undoNonEqual:
 			po.noneq[uint32(pass.ID)].Clear(pass.idx)

 		case undoNewNode:
 			if pass.idx != po.lastidx {
 				panic("invalid newnode index")
 			}
 			if pass.ID != 0 {
 				if po.values[pass.ID] != pass.idx {
 					panic("invalid newnode undo pass")
 				}
 				delete(po.values, pass.ID)
 			}
 			po.setchl(pass.idx, 0)
 			po.setchr(pass.idx, 0)
 			po.nodes = po.nodes[:pass.idx]
 			po.lastidx--

 		case undoNewConstant:
 			// FIXME: remove this O(n) loop
 			var val int64
 			var i uint32
 			for val, i = range po.constants {
 				if i == pass.idx {
 					break
 				}
 			}
 			if i != pass.idx {
 				panic("constant not found in undo pass")
 			}
 			if pass.ID == 0 {
 				delete(po.constants, val)
 			} else {
 				// Restore previous index as constant node
 				// (also restoring the invariant on correct bounds)
 				oldidx := uint32(pass.ID)
 				po.constants[val] = oldidx
 			}

 		case undoAliasNode:
 			ID, prev := pass.ID, pass.idx
 			cur := po.values[ID]
 			if prev == 0 {
 				// Born as an alias, die as an alias
 				delete(po.values, ID)
 			} else {
 				if cur == prev {
 					panic("invalid aliasnode undo pass")
 				}
 				// Give it back previous value
 				po.values[ID] = prev
 			}

 		case undoNewRoot:
 			i := pass.idx
 			l, r := po.children(i)
 			if l|r != 0 {
 				panic("non-empty root in undo newroot")
 			}
 			po.removeroot(i)

 		case undoChangeRoot:
 			i := pass.idx
 			l, r := po.children(i)
 			if l|r != 0 {
 				panic("non-empty root in undo changeroot")
 			}
 			po.changeroot(i, pass.edge.Target())

 		case undoMergeRoot:
 			i := pass.idx
 			l, r := po.children(i)
 			po.changeroot(i, l.Target())
 			po.roots = append(po.roots, r.Target())

 		default:
 			panic(pass.typ)
 		}
 	}

 	if debugPoset && po.CheckEmpty() != nil {
 		panic("poset not empty at the end of undo")
 	}
 }