forked from LondonLab/PRosettaC
-
Notifications
You must be signed in to change notification settings - Fork 0
/
utils.py
91 lines (82 loc) · 4.35 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
import os,sys
import glob
import shutil
PatchDock = os.environ["PATCHDOCK"]
OB = os.environ["OB"]
SCRIPTS_FOL = os.environ["SCRIPTS_FOL"]
ROSETTA_FOL = os.environ["ROSETTA_FOL"]
#adding hydrogens to an sdf file is done by converting it to pdb, and then back to sdf using openbabel
def addH_sdf(sdf_file, new_sdf = None):
tmp_pdb = sdf_file.split('.')[0] + '.pdb'
os.system(OB + '/babel ' + sdf_file + ' ' + tmp_pdb + ' -h')
if new_sdf == None:
os.system(OB + '/babel ' + tmp_pdb + ' ' + sdf_file)
else:
os.system(OB + '/babel ' + tmp_pdb + ' ' + new_sdf)
os.remove(tmp_pdb)
#openbabel conversion of pdb to sdf
def pdb2sdf(pdb_file, sdf_file):
os.system(OB + '/babel ' + pdb_file + ' ' + sdf_file)
def sdf2sdf(sdf_file):
os.system(OB + '/babel ' + sdf_file + ' ' + sdf_file)
#merge a virtual atom sdf file into an input sdf file
def add_virtual_atoms(input_sdf, v_atoms_sdf, output_sdf):
with open(input_sdf, 'r') as f:
confs = f.read().split('$$$$')
confs[0] = '\n' + confs[0]
confs = [[l + '\n' for l in line.split('\n') + ['$$$$']][1:] for line in confs][:-1]
with open(v_atoms_sdf, 'r') as f:
v_atoms = f.readlines()[4:7]
header = confs[0][3]
num_atoms = int(header[:3])
num_bonds = int(header[3:6])
new_header = '%03d' % (num_atoms + 3) + '%03d' % (num_bonds + 3) + header[6:]
v_index = ['%03d' % (num_atoms + 1), '%03d' % (num_atoms + 2), '%03d' % (num_atoms + 3)]
v_bonds = [v_index[0] + v_index[1] + ' 1 0\n', v_index[1] + v_index[2] + ' 1 0\n', ' 1' + v_index[0] + ' 1 0\n']
for i, conf in enumerate(confs):
confs[i] = conf[:3] + [new_header] + conf[4:4 + num_atoms] + v_atoms + conf[4 + num_atoms:4 + num_atoms + num_bonds] + v_bonds + conf[4 + num_atoms + num_bonds:-4] + [' 0 0 0 0 0 0 0 0 ' + '%03d' % (num_atoms + 3) + ' 0 ' + '%03d' % (num_atoms + 3) + ' 0'] + conf[-3:]
with open(output_sdf, 'w') as f:
for conf in confs:
for c in conf:
f.write(c)
return num_atoms + 2
#run PatchDock
def patchdock(structs, anchors, min_dist, max_dist, num_results=1000, threshold=4.0):
[structA, structB] = structs
[anchorA, anchorB] = anchors
with open('Patchdock_cst', 'w') as f:
f.write(' '.join([str(s) for s in [anchorA, anchorB, min_dist, max_dist]]) + '\n')
os.system(PatchDock + '/buildParams.pl ' + structA + ' ' + structB + ' ; mv params.txt Patchdock_params.txt')
os.system('sed -i \'s/#distanceConstraintsFile file_name/distanceConstraintsFile Patchdock_cst/g\' Patchdock_params.txt')
os.system('sed -i \'s/clusterParams 0.1 4 2.0 4.0/clusterParams 0.1 4 2.0 ' + str(threshold) + '/g\' Patchdock_params.txt')
os.system(PatchDock + '/patch_dock.Linux Patchdock_params.txt Patchdock_output')
os.system(PatchDock + '/transOutput.pl Patchdock_output 1 ' + str(num_results))
os.mkdir('Patchdock_Results')
results = [int(line.split('.')[1]) for line in glob.glob('Patchdock_output.*')]
if len(results) == 0:
return None
Num_Results = max(results)
for i in range(Num_Results):
os.system('mv Patchdock_output.' + str(i + 1) + '.pdb Patchdock_Results/pd.' + str(i + 1) + '.pdb')
os.system('sed -i \'s/PT1 X/PT1 Y/g\' Patchdock_Results/pd.' + str(i + 1) + '.pdb')
return Num_Results
def read_params(config_file: str) -> dict:
"""
Reads given config file and parses its content. Returns a dictionary with the parameter names as keys. Parameters
not set in the config file are set to their default value.
"""
# Lines must be formatted as "key: value". Ignore empty lines.
with open(config_file) as f:
lines = [l.strip() for l in f.readlines() if l.strip() != '']
params = {k.strip(): v.strip() for k, v in [l.split(':') for l in lines]}
# Set defaults if missing
try:
params['RosettaDockMemory'] = int(params.get('RosettaDockMemory', 8000))
except ValueError:
sys.exit(f'Could not interpret RosettaDockMemory from {config_file} as megabyte (int): {params["RosettaDockMemory"]}')
try:
params['ProtacModelMemory'] = int(params.get('ProtacModelMemory', 4000))
except ValueError:
sys.exit(f'Could not interpret ProtacModelMemory from {config_file} as megabyte (int): {params["ProtacModelMemory"]}')
params['ClusterName'] = params.get('ClusterName', 'PBS')
return params