-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathmdlr2mdl.py
156 lines (122 loc) · 6.32 KB
/
mdlr2mdl.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
import argparse
import readMDL
import writeMDL
from subprocess import call
import splitBNGXML
import re
from nfsim_python import NFSim
import os
import readBNGXML
import writeBNGXMLe as writeBXe
import yaml
import sys
def defineConsole():
parser = argparse.ArgumentParser(description='SBML to BNGL translator')
parser.add_argument('-i', '--input', type=str, help='input MDLr file', required=True)
parser.add_argument('-n', '--nfsim', action='store_true', help='mcell-nfsim mode')
parser.add_argument('-o', '--output', type=str, help='output MDL file')
parser.add_argument('-b', '--bng-executable', type=str, help='file path pointing to the BNG2.pl file')
return parser
def getScriptPath():
return os.path.dirname(os.path.realpath(sys.argv[0]))
class MDLR2MDL(object):
'''
given an mdlr definition this script will get a set of mdl files compatible with an nfsim bng-xml definition
'''
def __init__(self, configpath):
with open(configpath, 'r') as f:
self.config = yaml.load(f.read())
self.nfsim = NFSim(os.path.join(self.config['libpath'], 'libnfsim_c.so'))
def processMDLR(self, mdlrPath):
'''
main method. extracts species definition, creates bng-xml, creates mdl definitions
'''
nautyDict = self.xml2HNautySpeciesDefinitions(mdlrPath)
#append extended bng-xml to the bng-xml definition (the one that doesn't include seed information)
bngxmlestr = writeBXe.mergeBXBXe(namespace.input + '_total.xml', namespace.input + '_extended.xml')
with open(mdlrPath + '_total.xml', 'w') as f:
f.write(bngxmlestr)
xmlspec = readBNGXML.parseFullXML(namespace.input + '.xml')
# write out the equivalent plain mdl stuffs
mdlDict = writeMDL.constructMCell(xmlspec, namespace.input, finalName.split(os.sep)[-1], nautyDict)
writeMDL.writeMDL(mdlDict, finalName)
def tokenizeSeedElements(self, seed):
#extract species names
seedKeys = re.findall('concentration="[0-9a-zA-Z_]+" name="[_0-9a-zA-Z@:(~!),.]+"', seed)
seedKeys = [re.sub('concentration="([0-9a-zA-Z_]+)" name="([_0-9a-zA-Z@:(~!),.]+)"', '\g<2>;\g<1>', x) for x in seedKeys]
seedList = seed.split('</Species>')
seedList = [x.strip() for x in seedList if x != '']
seedList = [x + '</Species>' for x in seedList]
seedList = [re.sub('"S[0-9]+"', "S1", x) for x in seedList]
seedList = [re.sub('concentration="[0-9a-zA-Z_]+"', 'concentration="1"', x) for x in seedList]
seedList = ['<Model><ListOfSpecies>{0}</ListOfSpecies></Model>'.format(x) for x in seedList]
#seedDict = {x:y for x,y in zip(seedKeys,seedList)}
seedDict = {x.split(';')[0]:y for x, y in zip(seedKeys, seedList) if x.split(';')[1] != '0'}
#print '---', seedDict.keys()
return seedDict
def getNamesFromDefinitionString(self, defStr):
speciesNames = re.findall('[0-9a-zA-Z_]+\(',defStr)
return [x[:-1] for x in speciesNames]
def xml2HNautySpeciesDefinitions(self, inputMDLRFile):
"""
Temporary function for translating xml bng definitions to nautty species definition strings
it call the nfsim library to get the list of possible complexes in the system, however the function right now
returns the species in question + all molecule types (if we are sending a lone molecule tye as initialization
it still returns all molecule types), which means the list requires filterinng. and the filtering
is not pretty
How to solve: make it so that nfsim returns a more sensible complex list (filtering out unrelated molecule types) or
create a nauty label creation mechanism locally
"""
#get a bng-xml file
call([self.config['bionetgen'], '-xml', '-check', inputMDLRFile + '.bngl'])
#extract seed species defition
seed, rest = splitBNGXML.extractSeedBNG(inputMDLRFile + '.xml')
#store xml with non-seed sections and load up nfsim library
with open(namespace.input + '_total.xml', 'w') as f:
f.write(rest)
#load up nfsim library
self.nfsim.initNFsim(namespace.input + '_total.xml', 0)
# remove encapsulating tags
seed = seed[30:-30]
#get the seed species definitions as a list
seedDict = self.tokenizeSeedElements(seed)
nautyDict = {}
for seed in seedDict:
#initialize nfsim with each species definition and get back a dirty list where one of the entries is the one we want
#XXX: i think i've solved it on the nfsim side, double check
tmpList = self.getNautyString(seedDict[seed])
#and now filter it out...
#get species names from species definition string
speciesNames = self.getNamesFromDefinitionString(seed)
nautyDict[seed] = [x for x in tmpList if all(y in x for y in speciesNames)][0]
return nautyDict
def getNautyString(self, xmlSpeciesDefinition):
self.nfsim.resetSystem()
self.nfsim.initSystemXML(xmlSpeciesDefinition)
result = self.nfsim.querySystemStatus("complex")
return result
if __name__ == "__main__":
parser = defineConsole()
namespace = parser.parse_args()
bnglPath = namespace.input + '.bngl'
finalName = namespace.output if namespace.output else namespace.input
# mdl to bngl
resultDict = readMDL.constructBNGFromMDLR(namespace.input, namespace.nfsim)
outputDir = os.sep.join(namespace.output.split(os.sep)[:-1])
# create bngl file
readMDL.outputBNGL(resultDict['bnglstr'], bnglPath)
# temporaryly store bng-xml information in a separate file for display purposes
with open(namespace.input + '_extended.xml', 'wb') as f:
f.write(resultDict['bngxmlestr'])
#get cannonical label -bngl label dictionary
if not namespace.nfsim:
# bngl 2 sbml 2 json
readMDL.bngl2json(namespace.input + '.bngl')
# json 2 plain mdl
mdlDict = writeMDL.constructMDL(namespace.input + '_sbml.xml.json', namespace.input, finalName)
# create an mdl with nfsim-species and nfsim-reactions
writeMDL.writeMDL(mdlDict, finalName)
else:
mdlr2mdl = MDLR2MDL(os.path.join(getScriptPath(),'mcellr.yaml'))
#get the species definitions
mdlr2mdl.processMDLR(namespace.input)