diff options
| author | Gustav Sörnäs <gusso230@student.liu.se> | 2020-12-15 17:52:58 +0100 |
|---|---|---|
| committer | Gustav Sörnäs <gusso230@student.liu.se> | 2020-12-15 17:52:58 +0100 |
| commit | 6c8acb4f4eabb20da41b941158bf52038035699f (patch) | |
| tree | ef680ba06131b77d82b6dafc3c9750b58b256c14 /store.py | |
| parent | ace809ebf6f38b1d4fc9f4ec59890d738b7ca583 (diff) | |
| parent | 21a531eac5b953aeab14e4e8ae887695e8a4c4aa (diff) | |
| download | tdde25-6c8acb4f4eabb20da41b941158bf52038035699f.tar.gz | |
Merge remote-tracking branch 'origin/union-find'
Diffstat (limited to 'store.py')
| -rw-r--r-- | store.py | 66 |
1 files changed, 64 insertions, 2 deletions
@@ -9,6 +9,35 @@ class Node: self.lng = float(lng) self.neighbours = [] + self.parent = None + self.size = 1 + + def find_root(self): + """ Recursively find the root of this node. """ + if not self.parent: + return self + else: + return self.parent.find_root() + + def union(self, other): + """ Mark this node and some other node as part of the same tree. """ + this = self.find_root() + other = other.find_root() + + # If we share the same root we are already part of the same tree + if this == other: + return + + # Minimize tree size. This ensures optimal complexity. + # We could also store the rank instead. + if this.size < other.size: + this, other = other, this + + # This is safe since other is a root node and currently doesn't have a + # parent. + other.parent = this + this.size += other.size + def coord_tuple(self): return self.lat, self.lng @@ -29,6 +58,8 @@ def add_neighbours(nodes): nodes[node1].neighbours.append(nodes[node2]) nodes[node2].neighbours.append(nodes[node1]) + # These two are neighbours and should be part of the same tree. + nodes[node1].union(nodes[node2]) return nodes @@ -45,11 +76,42 @@ def extract_osm_nodes(f_name): add_neighbours(nodes) - # remove nodes without neighbours. + # Remove nodes without neighbours for node_id, node in nodes.copy().items(): if not node.neighbours: del nodes[node_id] + # Construct a forest of disjoint trees. + # The forest is a { root: tree }-dict. If we construct a relation where + # two nodes relate to each other if they are a part of the same tree, + # this can be shown to be an equivalence relation where the equivalence + # class is some node in the tree. In our case, the equivalence class + # becomes the root of each node since it will be the same for all nodes + # in the same tree due our use of union-find. + forest = defaultdict(dict) + for node_id, node in nodes.items(): + forest[node.find_root().id][node_id] = node + + # Find the largest disjoint tree. + # We store the root so we can easily test if a node is part of this + # tree or not. + best_size = 0 + best_tree = None + best_root = None + for root in forest: + tree = forest[root] + size = len(tree) + if size > best_size: + best_size = size + best_tree = tree + best_root = root + + unconnected_nodes = [] + for _, node in nodes.items(): + if node.find_root().id != best_root: + unconnected_nodes.append(node) + + nodes = best_tree # create a "grid" by grouping nearby nodes. for node in nodes.copy().values(): @@ -62,7 +124,7 @@ def extract_osm_nodes(f_name): else: grid[key] = [node] - return nodes, grid + return nodes, grid, unconnected_nodes def select_nodes_in_rectangle(nodes, min_lat, max_lat, min_long, max_long): |
