// Copyright 2013 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. package pointer // This file implements Hash-Value Numbering (HVN), a pre-solver // constraint optimization described in Hardekopf & Lin, SAS'07 (see // doc.go) that analyses the graph topology to determine which sets of // variables are "pointer equivalent" (PE), i.e. must have identical // points-to sets in the solution. // // A separate ("offline") graph is constructed. Its nodes are those of // the main-graph, plus an additional node *X for each pointer node X. // With this graph we can reason about the unknown points-to set of // dereferenced pointers. (We do not generalize this to represent // unknown fields x->f, perhaps because such fields would be numerous, // though it might be worth an experiment.) // // Nodes whose points-to relations are not entirely captured by the // graph are marked as "indirect": the *X nodes, the parameters of // address-taken functions (which includes all functions in method // sets), or nodes updated by the solver rules for reflection, etc. // // All addr (y=&x) nodes are initially assigned a pointer-equivalence // (PE) label equal to x's nodeid in the main graph. (These are the // only PE labels that are less than len(a.nodes).) // // All offsetAddr (y=&x.f) constraints are initially assigned a PE // label; such labels are memoized, keyed by (x, f), so that equivalent // nodes y as assigned the same label. // // Then we process each strongly connected component (SCC) of the graph // in topological order, assigning it a PE label based on the set P of // PE labels that flow to it from its immediate dependencies. // // If any node in P is "indirect", the entire SCC is assigned a fresh PE // label. Otherwise: // // |P|=0 if P is empty, all nodes in the SCC are non-pointers (e.g. // uninitialized variables, or formal params of dead functions) // and the SCC is assigned the PE label of zero. // // |P|=1 if P is a singleton, the SCC is assigned the same label as the // sole element of P. // // |P|>1 if P contains multiple labels, a unique label representing P is // invented and recorded in an hash table, so that other // equivalent SCCs may also be assigned this label, akin to // conventional hash-value numbering in a compiler. // // Finally, a renumbering is computed such that each node is replaced by // the lowest-numbered node with the same PE label. All constraints are // renumbered, and any resulting duplicates are eliminated. // // The only nodes that are not renumbered are the objects x in addr // (y=&x) constraints, since the ids of these nodes (and fields derived // from them via offsetAddr rules) are the elements of all points-to // sets, so they must remain as they are if we want the same solution. // // The solverStates (node.solve) for nodes in the same equivalence class // are linked together so that all nodes in the class have the same // solution. This avoids the need to renumber nodeids buried in // Queries, cgnodes, etc (like (*analysis).renumber() does) since only // the solution is needed. // // The result of HVN is that the number of distinct nodes and // constraints is reduced, but the solution is identical (almost---see // CROSS-CHECK below). In particular, both linear and cyclic chains of // copies are each replaced by a single node. // // Nodes and constraints created "online" (e.g. while solving reflection // constraints) are not subject to this optimization. // // PERFORMANCE // // In two benchmarks (guru and godoc), HVN eliminates about two thirds // of nodes, the majority accounted for by non-pointers: nodes of // non-pointer type, pointers that remain nil, formal parameters of dead // functions, nodes of untracked types, etc. It also reduces the number // of constraints, also by about two thirds, and the solving time by // 30--42%, although we must pay about 15% for the running time of HVN // itself. The benefit is greater for larger applications. // // There are many possible optimizations to improve the performance: // * Use fewer than 1:1 onodes to main graph nodes: many of the onodes // we create are not needed. // * HU (HVN with Union---see paper): coalesce "union" peLabels when // their expanded-out sets are equal. // * HR (HVN with deReference---see paper): this will require that we // apply HVN until fixed point, which may need more bookkeeping of the // correspondence of main nodes to onodes. // * Location Equivalence (see paper): have points-to sets contain not // locations but location-equivalence class labels, each representing // a set of locations. // * HVN with field-sensitive ref: model each of the fields of a // pointer-to-struct. // // CROSS-CHECK // // To verify the soundness of the optimization, when the // debugHVNCrossCheck option is enabled, we run the solver twice, once // before and once after running HVN, dumping the solution to disk, and // then we compare the results. If they are not identical, the analysis // panics. // // The solution dumped to disk includes only the N*N submatrix of the // complete solution where N is the number of nodes after generation. // In other words, we ignore pointer variables and objects created by // the solver itself, since their numbering depends on the solver order, // which is affected by the optimization. In any case, that's the only // part the client cares about. // // The cross-check is too strict and may fail spuriously. Although the // H&L paper describing HVN states that the solutions obtained should be // identical, this is not the case in practice because HVN can collapse // cycles involving *p even when pts(p)={}. Consider this example // distilled from testdata/hello.go: // // var x T // func f(p **T) { // t0 = *p // ... // t1 = φ(t0, &x) // *p = t1 // } // // If f is dead code, we get: // unoptimized: pts(p)={} pts(t0)={} pts(t1)={&x} // optimized: pts(p)={} pts(t0)=pts(t1)=pts(*p)={&x} // // It's hard to argue that this is a bug: the result is sound and the // loss of precision is inconsequential---f is dead code, after all. // But unfortunately it limits the usefulness of the cross-check since // failures must be carefully analyzed. Ben Hardekopf suggests (in // personal correspondence) some approaches to mitigating it: // // If there is a node with an HVN points-to set that is a superset // of the NORM points-to set, then either it's a bug or it's a // result of this issue. If it's a result of this issue, then in // the offline constraint graph there should be a REF node inside // some cycle that reaches this node, and in the NORM solution the // pointer being dereferenced by that REF node should be the empty // set. If that isn't true then this is a bug. If it is true, then // you can further check that in the NORM solution the "extra" // points-to info in the HVN solution does in fact come from that // purported cycle (if it doesn't, then this is still a bug). If // you're doing the further check then you'll need to do it for // each "extra" points-to element in the HVN points-to set. // // There are probably ways to optimize these checks by taking // advantage of graph properties. For example, extraneous points-to // info will flow through the graph and end up in many // nodes. Rather than checking every node with extra info, you // could probably work out the "origin point" of the extra info and // just check there. Note that the check in the first bullet is // looking for soundness bugs, while the check in the second bullet // is looking for precision bugs; depending on your needs, you may // care more about one than the other. // // which we should evaluate. The cross-check is nonetheless invaluable // for all but one of the programs in the pointer_test suite. import ( "fmt" "go/types" "io" "reflect" "golang.org/x/tools/container/intsets" ) // A peLabel is a pointer-equivalence label: two nodes with the same // peLabel have identical points-to solutions. // // The numbers are allocated consecutively like so: // 0 not a pointer // 1..N-1 addrConstraints (equals the constraint's .src field, hence sparse) // ... offsetAddr constraints // ... SCCs (with indirect nodes or multiple inputs) // // Each PE label denotes a set of pointers containing a single addr, a // single offsetAddr, or some set of other PE labels. // type peLabel int type hvn struct { a *analysis N int // len(a.nodes) immediately after constraint generation log io.Writer // (optional) log of HVN lemmas onodes []*onode // nodes of the offline graph label peLabel // the next available PE label hvnLabel map[string]peLabel // hash-value numbering (PE label) for each set of onodeids stack []onodeid // DFS stack index int32 // next onode.index, from Tarjan's SCC algorithm // For each distinct offsetAddrConstraint (src, offset) pair, // offsetAddrLabels records a unique PE label >= N. offsetAddrLabels map[offsetAddr]peLabel } // The index of an node in the offline graph. // (Currently the first N align with the main nodes, // but this may change with HRU.) type onodeid uint32 // An onode is a node in the offline constraint graph. // (Where ambiguous, members of analysis.nodes are referred to as // "main graph" nodes.) // // Edges in the offline constraint graph (edges and implicit) point to // the source, i.e. against the flow of values: they are dependencies. // Implicit edges are used for SCC computation, but not for gathering // incoming labels. // type onode struct { rep onodeid // index of representative of SCC in offline constraint graph edges intsets.Sparse // constraint edges X-->Y (this onode is X) implicit intsets.Sparse // implicit edges *X-->*Y (this onode is X) peLabels intsets.Sparse // set of peLabels are pointer-equivalent to this one indirect bool // node has points-to relations not represented in graph // Tarjan's SCC algorithm index, lowlink int32 // Tarjan numbering scc int32 // -ve => on stack; 0 => unvisited; +ve => node is root of a found SCC } type offsetAddr struct { ptr nodeid offset uint32 } // nextLabel issues the next unused pointer-equivalence label. func (h *hvn) nextLabel() peLabel { h.label++ return h.label } // ref(X) returns the index of the onode for *X. func (h *hvn) ref(id onodeid) onodeid { return id + onodeid(len(h.a.nodes)) } // hvn computes pointer-equivalence labels (peLabels) using the Hash-based // Value Numbering (HVN) algorithm described in Hardekopf & Lin, SAS'07. // func (a *analysis) hvn() { start("HVN") if a.log != nil { fmt.Fprintf(a.log, "\n\n==== Pointer equivalence optimization\n\n") } h := hvn{ a: a, N: len(a.nodes), log: a.log, hvnLabel: make(map[string]peLabel), offsetAddrLabels: make(map[offsetAddr]peLabel), } if h.log != nil { fmt.Fprintf(h.log, "\nCreating offline graph nodes...\n") } // Create offline nodes. The first N nodes correspond to main // graph nodes; the next N are their corresponding ref() nodes. h.onodes = make([]*onode, 2*h.N) for id := range a.nodes { id := onodeid(id) h.onodes[id] = &onode{} h.onodes[h.ref(id)] = &onode{indirect: true} } // Each node initially represents just itself. for id, o := range h.onodes { o.rep = onodeid(id) } h.markIndirectNodes() // Reserve the first N PE labels for addrConstraints. h.label = peLabel(h.N) // Add offline constraint edges. if h.log != nil { fmt.Fprintf(h.log, "\nAdding offline graph edges...\n") } for _, c := range a.constraints { if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "; %s\n", c) } c.presolve(&h) } // Find and collapse SCCs. if h.log != nil { fmt.Fprintf(h.log, "\nFinding SCCs...\n") } h.index = 1 for id, o := range h.onodes { if id > 0 && o.index == 0 { // Start depth-first search at each unvisited node. h.visit(onodeid(id)) } } // Dump the solution // (NB: somewhat redundant with logging from simplify().) if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\nPointer equivalences:\n") for id, o := range h.onodes { if id == 0 { continue } if id == int(h.N) { fmt.Fprintf(h.log, "---\n") } fmt.Fprintf(h.log, "o%d\t", id) if o.rep != onodeid(id) { fmt.Fprintf(h.log, "rep=o%d", o.rep) } else { fmt.Fprintf(h.log, "p%d", o.peLabels.Min()) if o.indirect { fmt.Fprint(h.log, " indirect") } } fmt.Fprintln(h.log) } } // Simplify the main constraint graph h.simplify() a.showCounts() stop("HVN") } // ---- constraint-specific rules ---- // dst := &src func (c *addrConstraint) presolve(h *hvn) { // Each object (src) is an initial PE label. label := peLabel(c.src) // label < N if debugHVNVerbose && h.log != nil { // duplicate log messages are possible fmt.Fprintf(h.log, "\tcreate p%d: {&n%d}\n", label, c.src) } odst := onodeid(c.dst) osrc := onodeid(c.src) // Assign dst this label. h.onodes[odst].peLabels.Insert(int(label)) if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\to%d has p%d\n", odst, label) } h.addImplicitEdge(h.ref(odst), osrc) // *dst ~~> src. } // dst = src func (c *copyConstraint) presolve(h *hvn) { odst := onodeid(c.dst) osrc := onodeid(c.src) h.addEdge(odst, osrc) // dst --> src h.addImplicitEdge(h.ref(odst), h.ref(osrc)) // *dst ~~> *src } // dst = *src + offset func (c *loadConstraint) presolve(h *hvn) { odst := onodeid(c.dst) osrc := onodeid(c.src) if c.offset == 0 { h.addEdge(odst, h.ref(osrc)) // dst --> *src } else { // We don't interpret load-with-offset, e.g. results // of map value lookup, R-block of dynamic call, slice // copy/append, reflection. h.markIndirect(odst, "load with offset") } } // *dst + offset = src func (c *storeConstraint) presolve(h *hvn) { odst := onodeid(c.dst) osrc := onodeid(c.src) if c.offset == 0 { h.onodes[h.ref(odst)].edges.Insert(int(osrc)) // *dst --> src if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\to%d --> o%d\n", h.ref(odst), osrc) } } // We don't interpret store-with-offset. // See discussion of soundness at markIndirectNodes. } // dst = &src.offset func (c *offsetAddrConstraint) presolve(h *hvn) { // Give each distinct (addr, offset) pair a fresh PE label. // The cache performs CSE, effectively. key := offsetAddr{c.src, c.offset} label, ok := h.offsetAddrLabels[key] if !ok { label = h.nextLabel() h.offsetAddrLabels[key] = label if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\tcreate p%d: {&n%d.#%d}\n", label, c.src, c.offset) } } // Assign dst this label. h.onodes[c.dst].peLabels.Insert(int(label)) if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\to%d has p%d\n", c.dst, label) } } // dst = src.(typ) where typ is an interface func (c *typeFilterConstraint) presolve(h *hvn) { h.markIndirect(onodeid(c.dst), "typeFilter result") } // dst = src.(typ) where typ is concrete func (c *untagConstraint) presolve(h *hvn) { odst := onodeid(c.dst) for end := odst + onodeid(h.a.sizeof(c.typ)); odst < end; odst++ { h.markIndirect(odst, "untag result") } } // dst = src.method(c.params...) func (c *invokeConstraint) presolve(h *hvn) { // All methods are address-taken functions, so // their formal P-blocks were already marked indirect. // Mark the caller's targets node as indirect. sig := c.method.Type().(*types.Signature) id := c.params h.markIndirect(onodeid(c.params), "invoke targets node") id++ id += nodeid(h.a.sizeof(sig.Params())) // Mark the caller's R-block as indirect. end := id + nodeid(h.a.sizeof(sig.Results())) for id < end { h.markIndirect(onodeid(id), "invoke R-block") id++ } } // markIndirectNodes marks as indirect nodes whose points-to relations // are not entirely captured by the offline graph, including: // // (a) All address-taken nodes (including the following nodes within // the same object). This is described in the paper. // // The most subtle cause of indirect nodes is the generation of // store-with-offset constraints since the offline graph doesn't // represent them. A global audit of constraint generation reveals the // following uses of store-with-offset: // // (b) genDynamicCall, for P-blocks of dynamically called functions, // to which dynamic copy edges will be added to them during // solving: from storeConstraint for standalone functions, // and from invokeConstraint for methods. // All such P-blocks must be marked indirect. // (c) MakeUpdate, to update the value part of a map object. // All MakeMap objects's value parts must be marked indirect. // (d) copyElems, to update the destination array. // All array elements must be marked indirect. // // Not all indirect marking happens here. ref() nodes are marked // indirect at construction, and each constraint's presolve() method may // mark additional nodes. // func (h *hvn) markIndirectNodes() { // (a) all address-taken nodes, plus all nodes following them // within the same object, since these may be indirectly // stored or address-taken. for _, c := range h.a.constraints { if c, ok := c.(*addrConstraint); ok { start := h.a.enclosingObj(c.src) end := start + nodeid(h.a.nodes[start].obj.size) for id := c.src; id < end; id++ { h.markIndirect(onodeid(id), "A-T object") } } } // (b) P-blocks of all address-taken functions. for id := 0; id < h.N; id++ { obj := h.a.nodes[id].obj // TODO(adonovan): opt: if obj.cgn.fn is a method and // obj.cgn is not its shared contour, this is an // "inlined" static method call. We needn't consider it // address-taken since no invokeConstraint will affect it. if obj != nil && obj.flags&otFunction != 0 && h.a.atFuncs[obj.cgn.fn] { // address-taken function if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "n%d is address-taken: %s\n", id, obj.cgn.fn) } h.markIndirect(onodeid(id), "A-T func identity") id++ sig := obj.cgn.fn.Signature psize := h.a.sizeof(sig.Params()) if sig.Recv() != nil { psize += h.a.sizeof(sig.Recv().Type()) } for end := id + int(psize); id < end; id++ { h.markIndirect(onodeid(id), "A-T func P-block") } id-- continue } } // (c) all map objects' value fields. for _, id := range h.a.mapValues { h.markIndirect(onodeid(id), "makemap.value") } // (d) all array element objects. // TODO(adonovan): opt: can we do better? for id := 0; id < h.N; id++ { // Identity node for an object of array type? if tArray, ok := h.a.nodes[id].typ.(*types.Array); ok { // Mark the array element nodes indirect. // (Skip past the identity field.) for range h.a.flatten(tArray.Elem()) { id++ h.markIndirect(onodeid(id), "array elem") } } } } func (h *hvn) markIndirect(oid onodeid, comment string) { h.onodes[oid].indirect = true if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\to%d is indirect: %s\n", oid, comment) } } // Adds an edge dst-->src. // Note the unusual convention: edges are dependency (contraflow) edges. func (h *hvn) addEdge(odst, osrc onodeid) { h.onodes[odst].edges.Insert(int(osrc)) if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\to%d --> o%d\n", odst, osrc) } } func (h *hvn) addImplicitEdge(odst, osrc onodeid) { h.onodes[odst].implicit.Insert(int(osrc)) if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\to%d ~~> o%d\n", odst, osrc) } } // visit implements the depth-first search of Tarjan's SCC algorithm. // Precondition: x is canonical. func (h *hvn) visit(x onodeid) { h.checkCanonical(x) xo := h.onodes[x] xo.index = h.index xo.lowlink = h.index h.index++ h.stack = append(h.stack, x) // push assert(xo.scc == 0, "node revisited") xo.scc = -1 var deps []int deps = xo.edges.AppendTo(deps) deps = xo.implicit.AppendTo(deps) for _, y := range deps { // Loop invariant: x is canonical. y := h.find(onodeid(y)) if x == y { continue // nodes already coalesced } xo := h.onodes[x] yo := h.onodes[y] switch { case yo.scc > 0: // y is already a collapsed SCC case yo.scc < 0: // y is on the stack, and thus in the current SCC. if yo.index < xo.lowlink { xo.lowlink = yo.index } default: // y is unvisited; visit it now. h.visit(y) // Note: x and y are now non-canonical. x = h.find(onodeid(x)) if yo.lowlink < xo.lowlink { xo.lowlink = yo.lowlink } } } h.checkCanonical(x) // Is x the root of an SCC? if xo.lowlink == xo.index { // Coalesce all nodes in the SCC. if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "scc o%d\n", x) } for { // Pop y from stack. i := len(h.stack) - 1 y := h.stack[i] h.stack = h.stack[:i] h.checkCanonical(x) xo := h.onodes[x] h.checkCanonical(y) yo := h.onodes[y] if xo == yo { // SCC is complete. xo.scc = 1 h.labelSCC(x) break } h.coalesce(x, y) } } } // Precondition: x is canonical. func (h *hvn) labelSCC(x onodeid) { h.checkCanonical(x) xo := h.onodes[x] xpe := &xo.peLabels // All indirect nodes get new labels. if xo.indirect { label := h.nextLabel() if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\tcreate p%d: indirect SCC\n", label) fmt.Fprintf(h.log, "\to%d has p%d\n", x, label) } // Remove pre-labeling, in case a direct pre-labeled node was // merged with an indirect one. xpe.Clear() xpe.Insert(int(label)) return } // Invariant: all peLabels sets are non-empty. // Those that are logically empty contain zero as their sole element. // No other sets contains zero. // Find all labels coming in to the coalesced SCC node. for _, y := range xo.edges.AppendTo(nil) { y := h.find(onodeid(y)) if y == x { continue // already coalesced } ype := &h.onodes[y].peLabels if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\tedge from o%d = %s\n", y, ype) } if ype.IsEmpty() { if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\tnode has no PE label\n") } } assert(!ype.IsEmpty(), "incoming node has no PE label") if ype.Has(0) { // {0} represents a non-pointer. assert(ype.Len() == 1, "PE set contains {0, ...}") } else { xpe.UnionWith(ype) } } switch xpe.Len() { case 0: // SCC has no incoming non-zero PE labels: it is a non-pointer. xpe.Insert(0) case 1: // already a singleton default: // SCC has multiple incoming non-zero PE labels. // Find the canonical label representing this set. // We use String() as a fingerprint consistent with Equals(). key := xpe.String() label, ok := h.hvnLabel[key] if !ok { label = h.nextLabel() if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\tcreate p%d: union %s\n", label, xpe.String()) } h.hvnLabel[key] = label } xpe.Clear() xpe.Insert(int(label)) } if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\to%d has p%d\n", x, xpe.Min()) } } // coalesce combines two nodes in the offline constraint graph. // Precondition: x and y are canonical. func (h *hvn) coalesce(x, y onodeid) { xo := h.onodes[x] yo := h.onodes[y] // x becomes y's canonical representative. yo.rep = x if debugHVNVerbose && h.log != nil { fmt.Fprintf(h.log, "\tcoalesce o%d into o%d\n", y, x) } // x accumulates y's edges. xo.edges.UnionWith(&yo.edges) yo.edges.Clear() // x accumulates y's implicit edges. xo.implicit.UnionWith(&yo.implicit) yo.implicit.Clear() // x accumulates y's pointer-equivalence labels. xo.peLabels.UnionWith(&yo.peLabels) yo.peLabels.Clear() // x accumulates y's indirect flag. if yo.indirect { xo.indirect = true } } // simplify computes a degenerate renumbering of nodeids from the PE // labels assigned by the hvn, and uses it to simplify the main // constraint graph, eliminating non-pointer nodes and duplicate // constraints. // func (h *hvn) simplify() { // canon maps each peLabel to its canonical main node. canon := make([]nodeid, h.label) for i := range canon { canon[i] = nodeid(h.N) // indicates "unset" } // mapping maps each main node index to the index of the canonical node. mapping := make([]nodeid, len(h.a.nodes)) for id := range h.a.nodes { id := nodeid(id) if id == 0 { canon[0] = 0 mapping[0] = 0 continue } oid := h.find(onodeid(id)) peLabels := &h.onodes[oid].peLabels assert(peLabels.Len() == 1, "PE class is not a singleton") label := peLabel(peLabels.Min()) canonID := canon[label] if canonID == nodeid(h.N) { // id becomes the representative of the PE label. canonID = id canon[label] = canonID if h.a.log != nil { fmt.Fprintf(h.a.log, "\tpts(n%d) is canonical : \t(%s)\n", id, h.a.nodes[id].typ) } } else { // Link the solver states for the two nodes. assert(h.a.nodes[canonID].solve != nil, "missing solver state") h.a.nodes[id].solve = h.a.nodes[canonID].solve if h.a.log != nil { // TODO(adonovan): debug: reorganize the log so it prints // one line: // pe y = x1, ..., xn // for each canonical y. Requires allocation. fmt.Fprintf(h.a.log, "\tpts(n%d) = pts(n%d) : %s\n", id, canonID, h.a.nodes[id].typ) } } mapping[id] = canonID } // Renumber the constraints, eliminate duplicates, and eliminate // any containing non-pointers (n0). addrs := make(map[addrConstraint]bool) copys := make(map[copyConstraint]bool) loads := make(map[loadConstraint]bool) stores := make(map[storeConstraint]bool) offsetAddrs := make(map[offsetAddrConstraint]bool) untags := make(map[untagConstraint]bool) typeFilters := make(map[typeFilterConstraint]bool) invokes := make(map[invokeConstraint]bool) nbefore := len(h.a.constraints) cc := h.a.constraints[:0] // in-situ compaction for _, c := range h.a.constraints { // Renumber. switch c := c.(type) { case *addrConstraint: // Don't renumber c.src since it is the label of // an addressable object and will appear in PT sets. c.dst = mapping[c.dst] default: c.renumber(mapping) } if c.ptr() == 0 { continue // skip: constraint attached to non-pointer } var dup bool switch c := c.(type) { case *addrConstraint: _, dup = addrs[*c] addrs[*c] = true case *copyConstraint: if c.src == c.dst { continue // skip degenerate copies } if c.src == 0 { continue // skip copy from non-pointer } _, dup = copys[*c] copys[*c] = true case *loadConstraint: if c.src == 0 { continue // skip load from non-pointer } _, dup = loads[*c] loads[*c] = true case *storeConstraint: if c.src == 0 { continue // skip store from non-pointer } _, dup = stores[*c] stores[*c] = true case *offsetAddrConstraint: if c.src == 0 { continue // skip offset from non-pointer } _, dup = offsetAddrs[*c] offsetAddrs[*c] = true case *untagConstraint: if c.src == 0 { continue // skip untag of non-pointer } _, dup = untags[*c] untags[*c] = true case *typeFilterConstraint: if c.src == 0 { continue // skip filter of non-pointer } _, dup = typeFilters[*c] typeFilters[*c] = true case *invokeConstraint: if c.params == 0 { panic("non-pointer invoke.params") } if c.iface == 0 { continue // skip invoke on non-pointer } _, dup = invokes[*c] invokes[*c] = true default: // We don't bother de-duping advanced constraints // (e.g. reflection) since they are uncommon. // Eliminate constraints containing non-pointer nodeids. // // We use reflection to find the fields to avoid // adding yet another method to constraint. // // TODO(adonovan): experiment with a constraint // method that returns a slice of pointers to // nodeids fields to enable uniform iteration; // the renumber() method could be removed and // implemented using the new one. // // TODO(adonovan): opt: this is unsound since // some constraints still have an effect if one // of the operands is zero: rVCall, rVMapIndex, // rvSetMapIndex. Handle them specially. rtNodeid := reflect.TypeOf(nodeid(0)) x := reflect.ValueOf(c).Elem() for i, nf := 0, x.NumField(); i < nf; i++ { f := x.Field(i) if f.Type() == rtNodeid { if f.Uint() == 0 { dup = true // skip it break } } } } if dup { continue // skip duplicates } cc = append(cc, c) } h.a.constraints = cc if h.log != nil { fmt.Fprintf(h.log, "#constraints: was %d, now %d\n", nbefore, len(h.a.constraints)) } } // find returns the canonical onodeid for x. // (The onodes form a disjoint set forest.) func (h *hvn) find(x onodeid) onodeid { // TODO(adonovan): opt: this is a CPU hotspot. Try "union by rank". xo := h.onodes[x] rep := xo.rep if rep != x { rep = h.find(rep) // simple path compression xo.rep = rep } return rep } func (h *hvn) checkCanonical(x onodeid) { if debugHVN { assert(x == h.find(x), "not canonical") } } func assert(p bool, msg string) { if debugHVN && !p { panic("assertion failed: " + msg) } }