-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathmain.py
99 lines (82 loc) · 3.08 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
from misc import *
from prediction import *
from mix_bag import *
import argparse
import networkx as nx
def main():
# Load the data first
data = load_data()
# Create two graph using networkx
hgraph = nx.Graph(data.humanppi)
fgraph = nx.Graph(data.functions)
if args.classifier == 'spl':
flagged = get_shortest_path(hgraph)
else:
flagged = []
# If chosen to test, run the below.
if args.test2:
print('run predictions on test2 set')
proteins_test2 = data.test2
# Run the prediction on test2
predictions = predict_cps(proteins_test2, hgraph, fgraph)
print(zip(proteins_test2, predictions))
# Write results to file.
write_test2_prediction(proteins_test2, predictions)
else:
# take sample if no arguments were provided and test this on test1
# and predict the cancer-relatedness of each of the proteins
sampler = Sampler(data.test1, args.samplesize)
results = []
for i in range(args.kfoldcross):
sample = zip(*sampler.remainder)[0]
predictions = predict_cps(sample, hgraph, fgraph)
# Add remainder of sample and results to empty array and resample
result = Results(sampler.remainder, predictions)
results.append(result)
sampler.resample()
if args.verbose:
result.print_results()
result.print_confusion_matrix()
# evaluate the performance
f_measures = [i.f_measure for i in results]
avg_f_measure = sum(f_measures) / float(len(f_measures))
print("\n\nAverage F-Measure:", avg_f_measure)
# Exit
pause = raw_input("Presss any key to continue..")
return 0
def get_options():
parser = argparse.ArgumentParser()
parser.add_argument('-v', '--verbose',
action='store_true',
help='Increases verbosity. ')
parser.add_argument('-k', '--kfoldcross', type=int, default=10,
help='Cross validation in K times')
parser.add_argument('-s', '--samplesize', type=float, default=0.9,
help='Percentage of test1 to train on. Example:\
-s 0.9 will use 90 percent of test1 to train on.')
parser.add_argument('-t', '--test2', default=False,
action='store_true',
help='Run predictions on trainingset Test2.txt.')
parser.add_argument('-c', '--classifier', default='wnc',
help='Classifier to use in the prediction task. :\
wnc - weighted neighbor counting classifier,\
spl - shortest path length classifier')
args = parser.parse_args()
return args
if __name__ == '__main__':
args = get_options()
assert 0 < args.samplesize < 1
print(args)
try:
import networkx
import colorama
import h5py
import numpy
import matplotlib
main()
except Exception as e:
raise
else:
pass
finally:
pass