Skip to content

Commit

Permalink
Add modules for deterministic total ordering derivation from partial …
Browse files Browse the repository at this point in the history
…ord (#1335)

The intention of this logic is to allow us to specify partial orderings
when orderings are needed (e.g. beginblock, endblock, upgrade orders),
and then have an automatic derivation of the relevant total ordering.

partialord_test.go gives a sense of how the API would look if we went with
this.

Co-authored-by: Roman <roman@osmosis.team>
Co-authored-by: Matt, Park <45252226+mattverse@users.noreply.github.com>
  • Loading branch information
3 people authored Apr 25, 2022
1 parent 66ebf33 commit a572cb3
Show file tree
Hide file tree
Showing 7 changed files with 623 additions and 0 deletions.
1 change: 1 addition & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -49,6 +49,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0

### Minor improvements & Bug Fixes

* [#1335](https://github.com/osmosis-labs/osmosis/pull/1335) Add utility for deriving total orderings from partial orderings.
* [#1308](https://github.com/osmosis-labs/osmosis/pull/1308) Make panics inside of epochs no longer chain halt by default.
* [#1286](https://github.com/osmosis-labs/osmosis/pull/1286) Fix release build scripts.
* [#1203](https://github.com/osmosis-labs/osmosis/pull/1203) cleanup Makefile and ci workflows
Expand Down
320 changes: 320 additions & 0 deletions osmoutils/partialord/internal/dag/dag.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,320 @@
package dag

import (
"fmt"
"sort"
)

// DAG struct maintains a directed acyclic graph, using adjacency lists to track edges.
type DAG struct {
// there is a directed edge from u -> v, if directedEdgeList[u][v] = 1
// there is a directed edge from v -> u, if directedEdgeList[u][v] = -1
directedEdgeList []map[int]int8
nodeNameToId map[string]int
idToNodeNames map[int]string
}

func NewDAG(nodes []string) DAG {
nodeNameToId := make(map[string]int, len(nodes))
idToNodeNames := make(map[int]string, len(nodes))
directedEdgeList := make([]map[int]int8, len(nodes))
for i, node := range nodes {
nodeNameToId[node] = i
idToNodeNames[i] = node
directedEdgeList[i] = map[int]int8{}
}
if len(nodeNameToId) != len(nodes) {
panic("provided multiple nodes with the same name")
}
return DAG{
directedEdgeList: directedEdgeList,
nodeNameToId: nodeNameToId,
idToNodeNames: idToNodeNames,
}
}

// Copy returns a new dag struct that is a copy of the original dag.
// Edges can be mutated in the copy, without altering the original.
func (dag DAG) Copy() DAG {
directedEdgeList := make([]map[int]int8, len(dag.nodeNameToId))
for i := 0; i < len(dag.nodeNameToId); i++ {
originalEdgeList := dag.directedEdgeList[i]
directedEdgeList[i] = make(map[int]int8, len(originalEdgeList))
for k, v := range originalEdgeList {
directedEdgeList[i][k] = v
}
}
// we re-use nodeNameToId and idToNodeNames as these are fixed at dag creation.
return DAG{
directedEdgeList: directedEdgeList,
nodeNameToId: dag.nodeNameToId,
idToNodeNames: dag.idToNodeNames,
}
}

func (dag DAG) hasDirectedEdge(u, v int) bool {
uAdjacencyList := dag.directedEdgeList[u]
_, exists := uAdjacencyList[v]
return exists
}

// addEdge adds a directed edge from u -> v.
func (dag *DAG) addEdge(u, v int) error {
if u == v {
return fmt.Errorf("can't make self-edge")
}
if dag.hasDirectedEdge(v, u) {
return fmt.Errorf("dag has conflicting edge")
}
dag.directedEdgeList[u][v] = 1
dag.directedEdgeList[v][u] = -1
return nil
}

// replaceEdge adds a directed edge from u -> v.
// it removes any edge that may already exist between the two.
func (dag *DAG) replaceEdge(u, v int) error {
if u == v {
return fmt.Errorf("can't make self-edge")
}

dag.directedEdgeList[u][v] = 1
dag.directedEdgeList[v][u] = -1
return nil
}

// resetEdges deletes all edges directed to or from node `u`
func (dag *DAG) resetEdges(u int) {
edges := dag.directedEdgeList[u]
for v := range edges {
delete(dag.directedEdgeList[v], u)
}
dag.directedEdgeList[u] = map[int]int8{}
}

// deleteEdge deletes edges between u and v.
func (dag *DAG) deleteEdge(u, v int) {
delete(dag.directedEdgeList[u], v)
delete(dag.directedEdgeList[v], u)
}

// AddEdge checks if either edge between u and v exists and adds a directed edge from u -> v
func (dag *DAG) AddEdge(u, v string) error {
uIndex, uExists := dag.nodeNameToId[u]
vIndex, vExists := dag.nodeNameToId[v]
if !uExists || !vExists {
return fmt.Errorf("one of %s, %s does not exist in dag", u, v)
}
return dag.addEdge(uIndex, vIndex)
}

// ReplaceEdge adds a directed edge from u -> v.
// it removes any edge that may already exist between the two.
func (dag *DAG) ReplaceEdge(u, v string) error {
uIndex, uExists := dag.nodeNameToId[u]
vIndex, vExists := dag.nodeNameToId[v]
if !uExists || !vExists {
return fmt.Errorf("one of %s, %s does not exist in dag", u, v)
}
return dag.replaceEdge(uIndex, vIndex)
}

// AddFirstElements sets the provided elements to be first in all orderings.
// So if were making an ordering over {A, B, C, D, E}, and elems provided is {D, B, A}
// then we are guaranteed that the total ordering will begin with {D, B, A}
func (dag *DAG) AddFirstElements(nodes ...string) error {
nodeIds, err := dag.namesToIds(nodes)
if err != nil {
return err
}

return dag.addFirst(nodeIds)
}

func (dag *DAG) addFirst(nodes []int) error {
nodeMap := map[int]bool{}
for i := 0; i < len(nodes); i++ {
nodeMap[nodes[i]] = true
}
// First we add an edge from nodes[-1] to every node in the graph aside from the provided first nodes.
// then we make nodes[-1] depend on nodes[-2], etc.
// We also clear all other edges from nodes[-2], to override previous settings.
lastOfFirstNodes := nodes[len(nodes)-1]
for i := 0; i < len(dag.nodeNameToId); i++ {
// skip any node in the 'first set'
_, inMap := nodeMap[i]
if inMap {
continue
}
// We make everything on `lastOfFirstNodes`, and therefore have an edge from `lastOfFirstNodes` to it
err := dag.replaceEdge(lastOfFirstNodes, i)
// can't happen by above check
if err != nil {
return err
}
}

// Make nodes[i+1] depend on nodes[i]
for i := len(nodes) - 2; i >= 0; i-- {
dag.resetEdges(nodes[i])
err := dag.replaceEdge(nodes[i], nodes[i+1])
// can't happen by above check
if err != nil {
return err
}
}
return nil
}

// AddLastElements sets the provided elements to be last in all orderings.
// So if were making an ordering over {A, B, C, D, E}, and elems provided is {D, B, A}
// then we are guaranteed that the total ordering will end with {D, B, A}
func (dag *DAG) AddLastElements(nodes ...string) error {
nodeIds, err := dag.namesToIds(nodes)
if err != nil {
return err
}

return dag.addLast(nodeIds)
}

func (dag *DAG) addLast(nodes []int) error {
nodeMap := map[int]bool{}
for i := 0; i < len(nodes); i++ {
nodeMap[nodes[i]] = true
}
// First we add an edge from every node in the graph aside from the provided last nodes, to nodes[0]
// then we make nodes[1] depend on nodes[0], etc.
// We also clear all other edges from nodes[1], to override previous settings.
firstOfLastNodes := nodes[0]
for i := 0; i < len(dag.nodeNameToId); i++ {
// skip any node in the 'last set'
_, inMap := nodeMap[i]
if inMap {
continue
}
// We make `firstOfLastNodes` depend on every node, and therefore have an edge from each node to `firstOfLastNodes`
err := dag.replaceEdge(i, firstOfLastNodes)
// can't happen by above check
if err != nil {
return err
}
}

// Make nodes[i] depend on nodes[i-1], and clear all other edges from nodes[i]
for i := 1; i < len(nodes); i++ {
dag.resetEdges(nodes[i])
err := dag.replaceEdge(nodes[i-1], nodes[i])
// can't happen by above check
if err != nil {
return err
}
}
return nil
}

func (dag DAG) hasEdges() bool {
for _, m := range dag.directedEdgeList {
if len(m) > 0 {
return true
}
}
return false
}

func (dag *DAG) namesToIds(names []string) ([]int, error) {
nodeIds := []int{}
for _, name := range names {
nodeIndex, nodeExists := dag.nodeNameToId[name]
if !nodeExists {
return []int{}, fmt.Errorf("%s does not exist in dag", name)
}
nodeIds = append(nodeIds, nodeIndex)
}
return nodeIds, nil
}

func (dag DAG) idsToNames(ids []int) []string {
sortedNames := make([]string, 0, len(ids))
for i := 0; i < len(dag.nodeNameToId); i++ {
id := ids[i]
sortedNames = append(sortedNames, dag.idToNodeNames[id])
}
return sortedNames
}

func (dag DAG) hasIncomingEdge(u int) bool {
adjacencyList := dag.directedEdgeList[u]
for _, v := range adjacencyList {
if v == -1 {
return true
}
}
return false
}

// returns nodes with no incoming edges.
func (dag *DAG) topologicalTopLevelNodes() []int {
topLevelNodes := []int{}

for i := 0; i < len(dag.nodeNameToId); i++ {
if !dag.hasIncomingEdge(i) {
topLevelNodes = append(topLevelNodes, i)
}
}

return topLevelNodes
}

// Returns a Topological Sort of the DAG, using Kahn's algorithm.
// https://en.wikipedia.org/wiki/Topological_sorting#Kahn's_algorithm
func (dag DAG) TopologicalSort() []string {
// G is the mutable graph we work on, which we remove edges from.
G := dag.Copy()
// L in pseudocode
sortedIDs := make([]int, 0, len(dag.nodeNameToId))
topLevelNodes := dag.topologicalTopLevelNodes()

// while len(topLevelNodes) != 0
for {
if len(topLevelNodes) == 0 {
break
}
// pop a node `n`` off of topLevelNodes
n := topLevelNodes[0]
topLevelNodes = topLevelNodes[1:]
// add it to the sorted list
sortedIDs = append(sortedIDs, n)
nEdgeList := G.directedEdgeList[n]

// normally we'd do map iteration, but because we need cross-machine determinism,
// we gather all the nodes M for which there is an edge n -> m, sort that list,
// and then iterate over it.
nodesM := make([]int, 0, len(nEdgeList))
for m, direction := range nEdgeList {
if direction != 1 {
panic("dag: topological sort correctness error. " +
"Popped node n was expected to have no incoming edges")
}
nodesM = append(nodesM, m)
}

sort.Ints(nodesM)

for _, m := range nodesM {
// remove edge from n -> m
G.deleteEdge(n, m)
// if m has no incomingEdges, add to topLevelNodes
if !G.hasIncomingEdge(m) {
topLevelNodes = append(topLevelNodes, m)
}
}
}

if G.hasEdges() {
fmt.Println(G)
panic("dag: invalid construction, attempted to topologically sort a tree that is not a dag. A cycle exists")
}

return dag.idsToNames(sortedIDs)
}
Loading

0 comments on commit a572cb3

Please sign in to comment.