-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathDNAFlexRB.py
136 lines (113 loc) · 4.67 KB
/
DNAFlexRB.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
# File: DNAFlexRB.py
#
# Copyright (C) 2016 Marco Pasi <[email protected]>
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
#"DNAFlexRB.py v0.1 (C) 2016 Marco Pasi"
#
#
from mug import datatypes as mug_datatypes
from DNAFlexibility import DNAFlexibility
from pycompss.api.task import task
from pycompss.api.constraint import constraint
from pycompss.api.parameter import IN, OUT
from subprocess import Popen, PIPE
import tempfile, sys
import numpy as np
#------------------------------------------------------------------------------
__doc__ = """\
Predict the flexibility of a canonical B-form DNA oligomer of
arbitrary sequence by using the cgDNA tool. cgDNA uses an MD-derived
parameter set to predict stiffness matrices as a function of the
Curves+ intra-base-pair and inter-base-pair helical parameters. For
more information see the following references. If you find this
software useful, please cite the following references. Requires a
working installation of GNU Octave, and of cgDNA in the Octave path.
Usage:
DNAFlexRB.py [options] <SEQUENCE>
Options:
-h (--help) Display this help.
References:
[1] Gonzalez,O., Petkeviciute,D. and Maddocks,J.H. (2013) A
sequence-dependent rigid-base model of DNA. J Chem Phys, 138, 055102.
[2] Petkeviciute,D., Pasi,M., Gonzalez,O., and Maddocks,J.H. (2014)
cgDNA: a software package for the prediction of sequence-dependent
coarse-grain free energies of B-form DNA. Nucleic Acids Res., 42, e153-
"""
#------------------------------------------------------------------------------
class DNAFlexRB(DNAFlexibility):
output_data_type = mug_datatypes.Matrix
"""Configuration: the name of the parameter file."""
configuration = {
'cgDNApath': None,
'cgDNAparamset': 'cgDNAparamset2.mat'
}
def _is_error(self, stderr):
"""
Parse the standard error stream from an Octave session to assess
whether an error was reported.
"""
for line in stderr.split("\n"):
if line.startswith("error:"): return True
return False
def _get_stiffness_matrix(self, sequence):
"""
Generate the full-oligomer stiffness matrix by running an octave
script that uses the cgDNA code.
"""
with tempfile.NamedTemporaryFile(mode="w", suffix=".m") as octave_script,\
tempfile.NamedTemporaryFile(mode="w", suffix=".dat") as output_matrix:
if self.configuration['cgDNApath'] is not None:
octave_script.write(
"addpath {}\n".format(self.configuration['cgDNApath']))
octave_script.write("""\
sequence = '{sequence}';
params = load('{paramset}');
[nondimshapes, stiff] = constructSeqParms(sequence, params);
save -ascii {output} stiff;""".format(
sequence = sequence,
paramset = self.configuration['cgDNAparamset'],
output = output_matrix.name))
octave_script.flush()
predict = Popen(['octave',
'--no-gui',
octave_script.name],
stdout=PIPE, stderr=PIPE,
shell=False)
predict.wait()
err = predict.stderr.read()
if self._is_error(err):
with open(octave_script.name) as error_script:
sys.stderr.write("SCRIPT:\n"+error_script.read())
err = "Octave Error! Standard error stream content starts on next line:\n"+err
raise Exception(err)
return np.loadtxt(output_matrix.name)
@task(sequence = IN, stiffness_matrix = OUT)
@constraint(AppSoftware="octave,numpy,cgDNA")
def run(self, sequence):
"""
Return the full-oligomer stiffness matrix built using cgDNA in octave.
"""
stiffness_matrix = self._get_stiffness_matrix(sequence)
return stiffness_matrix
#------------------------------------------------------------------------------
def main():
try:
opts, args = getopt.getopt(sys.argv[1:], "h", ["help"])
except getopt.error, msg:
sys.stderr.write(msg+"\nSee --help\n")
sys.exit(1)
for o, a in opts:
if o in ("-h", "--help"):
print __doc__
sys.exit(0)
if len(args) < 1:
print __doc__
sys.exit(1)
print DNAFlexRB().run(args[0])
if __name__ == "__main__":
main()