-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathNussinov.py
More file actions
103 lines (87 loc) · 2.94 KB
/
Copy pathNussinov.py
File metadata and controls
103 lines (87 loc) · 2.94 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
'''
included for reference
this is an early version of our Nussinov algorithm
which has since been replaced by the file energy_min.py
''''
import sys
import matplotlib.pyplot as plt
import forgi.visual.mplotlib as fvm
import forgi
def build_matrix(sequence):
size = len(sequence)
matrix = []
matrix.append([" "] + sequence)
for i in range(size):
matrix.append([sequence[i]])
for j in range(size):
matrix[i+1].append(0)
return matrix
def complement(n1, n2):
if n1 == "a" and n2 in "ut":
return 1
elif n1 in "tu" and n2 == "a":
return 1
elif n1 in "ut" and n2 == "g":
return 1
elif n1 == "g" and n2 in "ut":
return 1
elif n1 == "c" and n2 == "g":
return 1
else:
return 1 if (n1 == "g" and n2 == "c") else 0
def fill_matrix(matrix):
counter = 1
for i in range(1, len(matrix)):
for j in range(i + 1, len(matrix)):
matrix[j-i][j] = nuss_func(matrix, j-i, j)
def traceback(results, matrix, i, j):
# print("in", i, j)
if j <= i:
return
elif matrix[i][j] == matrix[i][j-1]:
traceback(results, matrix, i, j-1)
return
else:
for k in range(i, j):
if complement(matrix[0][k], matrix[0][j]):
if k > 1:
if matrix[i][j] == matrix[i][k-1] + matrix[k+1][j-1] + 1:
results.append((k, j))
traceback(results, matrix, i, k-1)
traceback(results, matrix, k+1, j-1)
return
# print("out3")
elif matrix[i][j] == matrix[k+1][j-1] + 1:
results.append((k, j))
traceback(results, matrix, i, k-1)
traceback(results, matrix, k+1, j-1)
return
# print("out3")
def nuss_func(matrix, i, j):
# hanging_i = matrix[1+1][j]
hanging_j = matrix[i][j-1]
# joined = matrix[i+1][j-1] + complement(matrix[0][j], matrix[i][0])
sub_structures = get_max_substructures(matrix, i, j)
# return max(hanging_i, hanging_j, joined, sub_structures)
return max(hanging_j, sub_structures)
def get_max_substructures(matrix, i, j):
max = 0
temp = 0
for k in range(i, j):
if complement(matrix[0][k], matrix[0][j]):
if k > 1 :
temp = matrix[i][k-1] + matrix[k+1][j-1] + 1
else:
temp = matrix[k+1][j-1] + 1
if temp > max:
max = temp
return max
def nussinov(sequence):
# print(sequence)
matrix = build_matrix(sequence)
fill_matrix(matrix)
results = []
traceback(results, matrix, 1, len(matrix[0])-1)
return results
def print_matrix(matrix):
print('\n'.join([''.join(['%4s' % item for item in row])for row in matrix]))