-
Notifications
You must be signed in to change notification settings - Fork 121
/
Copy path032_TREE.py
53 lines (43 loc) · 1.58 KB
/
032_TREE.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
#!/usr/bin/env python
'''
A solution to a ROSALIND bioinformatics problem.
Problem Title: Completing a Tree
Rosalind ID: TREE
Rosalind #: 032
URL: http://rosalind.info/problems/tree/
'''
with open('data/rosalind_tree.txt') as input_data:
edges = input_data.read().strip().split('\n')
n = int(edges.pop(0))
edges = [map(int,edge.split()) for edge in edges]
# List of sets of nodes which are connected to eachother.
# Initially start with completely disconnected nodes.
connected_nodes = [{i} for i in range(1,n+1)]
for edge in edges:
temp_nodes = set()
del_nodes = []
for nodes in connected_nodes:
# If both nodes in the edge are already connected, we're done.
if (edge[0] in nodes) and (edge[1] in nodes):
break
# Check if only one end of the edge is in a given set of node. If so, store the nodes.
elif (edge[0] in nodes) or (edge[1] in nodes):
# Add all the nodes to a temporary set. Store the connected nodes for deletion.
temp_nodes.update(nodes)
del_nodes.append(nodes)
# If we've found matches in two separate nodes, we're guaranteed to be done searching.
if len(del_nodes) == 2:
break
# Check if an update is necessary.
if len(del_nodes) != 0:
# Make sure both nodes in the edge get added.
temp_nodes.add(edge[0])
temp_nodes.add(edge[1])
# Remove the old connected nodes.
for nodes in del_nodes:
connected_nodes.remove(nodes)
# Add one new connected node containing all the nodes.
connected_nodes.append(temp_nodes)
print len(connected_nodes)-1
with open('output/032_TREE.txt', 'w') as output_data:
output_data.write(str(len(connected_nodes)-1))