-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathextract_cluster_centers.py
executable file
·91 lines (70 loc) · 2.5 KB
/
extract_cluster_centers.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
#!/usr/bin/python
from sys import argv,exit
from os import popen, system
import string
def Help():
    """Print the command-line usage message and terminate the program.

    Every line is written with the single-argument call form of ``print``,
    which produces the same output under Python 2 and Python 3 (a bare
    ``print`` statement emits nothing under Python 3).  The function never
    returns: it finishes by calling ``exit()``.
    """
    print('')
    print('Usage: '+argv[0]+' <.info file> <number of cluster centers> ')
    print(' The .info file needs to be of the format created by the')
    print(' clustering program cluster_info_silent.out. ')
    print(' This utility needs to be run from the same directory as where the')
    print(' clustering program was run. (Its a paths thing.)')
    print('')
    exit()
def short_tag(fulltag):
    """Return fulltag with everything before its 'S' or 'F' marker removed.

    The tag is cut at the first 'S' when it contains one, otherwise at the
    first 'F'.  A tag containing neither letter is returned unchanged.
    Slicing keeps the remainder of the tag intact (the previous code
    re-joined the 'F' case with 'S', altering tags with several 'F's).
    """
    for marker in ('S', 'F'):
        start = fulltag.find(marker)
        if start > -1:
            return fulltag[start:]
    return fulltag


def group_cluster_centers(cluster_lines, nstruct):
    """Group cluster centers by the output file named in each line.

    cluster_lines: lines whose fourth whitespace-separated column has the
        form '<outfilename>:<fulltag>'.
    nstruct: stop after this many lines have been taken.  The limit is
        checked after a line is processed, so the first line is always
        taken.

    Returns a dict mapping outfilename -> list of (tag, index) pairs, where
    index is the zero-based position of the line in cluster_lines.  The
    index is stored next to its tag so that identical tags coming from
    different output files cannot overwrite each other's index.
    """
    centers = {}
    for count, line in enumerate(cluster_lines):
        fields = line.split()[3].split(':')
        outfilename, fulltag = fields[0], fields[1]
        centers.setdefault(outfilename, []).append((short_tag(fulltag), count))
        if count + 1 >= nstruct:
            break
    return centers


def is_rna_sequence(sequence_line):
    """Return True when the line contains a lowercase a, c, g or u."""
    return any(base in sequence_line for base in 'acgu')


def needs_fa_input(outfilename):
    """Return True when the 8th line of outfilename has more than 10 columns.

    A file shorter than 8 lines yields False instead of raising IndexError
    (readline() returns '' once the end of the file is reached).
    """
    with open(outfilename, 'r') as fid:
        head = [fid.readline() for _ in range(8)]
    return len(head[7].split()) > 10


def extract_cluster_centers(infile, nstruct):
    """Extract up to nstruct cluster-center PDBs listed in one .info file.

    For every output file referenced by the CLUSTER_RMSDS lines of infile,
    writes a temporary '<outfile>.list' of tags, runs the extraction
    command on it, renames each '<tag>.pdb' to
    '<infile>.cluster<NNN>.1.pdb' and removes the temporary list.  Each
    shell command is printed before it is run.

    Raises ValueError if infile does not end in 'info'; open() errors
    propagate if infile or a referenced output file cannot be read.
    """
    # Only output of the clustering program (a *.info file) is accepted.
    if infile[-4:] != 'info':
        raise ValueError('expected a .info file, got: ' + infile)

    with open(infile, 'r') as fid:
        info_lines = fid.readlines()

    cluster_lines = [line for line in info_lines if 'CLUSTER_RMSDS' in line]
    centers = group_cluster_centers(cluster_lines, nstruct)

    # The first line of the .info file should be the sequence; lowercase
    # a/c/g/u there marks an RNA run.  Read once, not once per output file.
    rna_run = bool(info_lines) and is_rna_sequence(info_lines[0])

    for outfilename, tagged in centers.items():
        templist = outfilename+'.list'
        with open(templist, 'w') as fid:
            for tag, _ in tagged:
                fid.write(tag+'\n')

        # NOTE(review): commands are assembled by string concatenation and
        # run through the shell, so file names containing spaces or shell
        # metacharacters are not handled.
        command = '/work/rhiju/rosetta++/rosetta.gcc -extract -l '+templist+' -paths /work/rhiju/paths.txt -s '+outfilename
        if rna_run:
            command += ' -enable_dna -enable_rna '
        if needs_fa_input(outfilename):
            command += ' -fa_input'
        print(command)
        system(command)

        for tag, index in tagged:
            command = 'mv %s.pdb %s.cluster%03d.1.pdb' % (tag, infile, index)
            print(command)
            system(command)

        command = 'rm '+templist
        print(command)
        system(command)


def main():
    """Parse the command line and process every .info file given.

    A trailing integer argument is taken as the number of cluster centers
    to extract; without one the limit defaults to 9999999.
    """
    if len(argv) < 2:
        Help()

    args = argv[1:]
    try:
        nstruct = int(args[-1])
    except (ValueError, IndexError):
        nstruct = 9999999
    else:
        args = args[:-1]

    for infile in args:
        extract_cluster_centers(infile, nstruct)


if __name__ == '__main__':
    main()