Mercurial > repos > fubar > brokenandnotdeletablebyowneroradmin
comparison rgDynamicScriptWrapper.py @ 0:fda8032fe989
Initial checkin of dynamic script runner. Goal is to add code to generate a new toolshed entry once the script works correctly
author | ross lazarus ross.lazarus@gmail.com |
---|---|
date | Wed, 30 May 2012 22:36:34 +1000 |
parents | |
children | 0133b97e477e |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:fda8032fe989 |
---|---|
1 # rgDynamicScriptWrapper.py | |
2 # derived from | |
3 # rgBaseScriptWrapper.py | |
4 # to run some user supplied code | |
5 # extremely dangerous | |
6 # trusted users only - private site only | |
7 # a list in the xml is searched - only users in the list can run this tool. | |
8 # | |
9 # copyright ross lazarus (ross.lazarus@gmail.com) May 2012 | |
10 # | |
11 # all rights reserved | |
12 # Licensed under the LGPL for your pleasure | |
13 # Derived from rgDGE.py in May 2012 | |
14 # generalized to run required interpreter | |
15 # to make your own tools based on a given script and interpreter such as perl or python | |
16 # clone this and the corresponding xml wrapper | |
17 # replace the parameters/inputs/outputs and the configfile contents with your script | |
18 # Use the $foo syntax to place your parameter values inside the script to assign them - at run time, the script will be used as a template | |
19 # and returned as part of the output to the user - with the right values for all the parameters. | |
20 # Note that this assumes you want all the outputs arranged as a single Html file output | |
21 # after this generic script runner runs your script with the specified interpreter, | |
22 # it will collect all output files into the specified output_html, making thumbnails for all the pdfs it finds and making links for all the other files. | |
23 | |
24 import sys | |
25 import shutil | |
26 import subprocess | |
27 import os | |
28 import time | |
29 import tempfile | |
30 import optparse | |
31 | |
# Module-level settings shared by the rest of the wrapper.
# progname is the file name this script was invoked as, without its directory.
progname = os.path.basename(sys.argv[0])
myversion = 'V000.1 May 2012'
# Diagnostic switches; both are off by default.
verbose = False
debug = False
36 | |
# Characters that are allowed in a script but arrive escaped.
# Each key is the text that restore_text() puts back; each value is the
# token that stands in for it in the sanitized script.
# The last entry is a trial sandbox for R system commands: it works the other
# way round, so a literal 'system' in the script is rewritten to
# 'systemCallsAreNotAllowed'.
# Ultimately futile - we need to generate a new tool
# which will have no new security problems!
# NOTE(review): '\t' is listed twice below. A dict literal keeps only the
# last value given for a repeated key, so '\t' ends up mapped to 'Xt' and the
# '__tc__' token is not restored through this table.
mapped_chars = { '>' :'__gt__',
                 '<' :'__lt__',
                 "'" :'__sq__',
                 '"' :'__dq__',
                 '{' :'__oc__',
                 '}' :'__cc__',
                 '@' : '__at__',
                 '\n' : '__cn__',
                 '\r' : '__cr__',
                 '\t' : '__tc__',
                 '#' : '__pd__',
                 '[' :'__ob__',
                 ']' :'__cb__',
                 '\t' : 'Xt',
                 'systemCallsAreNotAllowed' : 'system'
                 }
57 | |
# XHTML page header for the generated report. The single %s lands in the
# "generator" meta tag; ScriptRunner.run() fills it with progname.
galhtmlprefix = """<?xml version="1.0" encoding="utf-8" ?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head> <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
<meta name="generator" content="Galaxy %s tool output - see http://g2.trac.bx.psu.edu/" />
<title></title>
<link rel="stylesheet" href="/static/style/base.css" type="text/css" />
</head>
<body>
<div class="document">
"""
# Attribution line placed near the end of the report. It takes two %s values;
# ScriptRunner.run() supplies (progname, timenow()).
galhtmlattr = """<b><a href="http://rgenetics.org">Galaxy Rgenetics Base Script Wrapper based </a> tool output %s run at %s</b><br/>"""
# Closes the div, body and html elements opened by galhtmlprefix.
galhtmlpostfix = """</div></body></html>\n"""
71 | |
def timenow():
    """Return the current local time as a 'DD/MM/YYYY HH:MM:SS' string."""
    stamp_format = '%d/%m/%Y %H:%M:%S'
    now = time.localtime()
    return time.strftime(stamp_format, now)
76 | |
def restore_text(text, mapping=None):
    """Replace escape tokens in sanitized text with the text they stand for.

    text    -- the sanitized string; an empty string or None is returned
               unchanged.
    mapping -- optional dict of {restored text: token}. Defaults to the
               module-level mapped_chars table.

    Returns the string with every token replaced. Tokens are applied in
    sorted order so the result does not depend on dict iteration order.
    """
    if not text:
        return text
    if mapping is None:
        mapping = mapped_chars
    # Invert the table: we search for the token and substitute its key.
    replacements = dict((token, restored) for restored, token in mapping.items())
    # mapped_chars lists the tab key twice, so the dict only remembers the
    # 'Xt' token and the '__tc__' token would otherwise be left unrestored.
    # setdefault leaves a caller-supplied meaning for '__tc__' untouched.
    replacements.setdefault('__tc__', '\t')
    for token in sorted(replacements):
        text = text.replace(token, replacements[token])
    return text
84 | |
class ScriptRunner(object):
    """Run a user-supplied script through an interpreter and report on it.

    The script text is fed to the interpreter on stdin. When an output
    directory is configured, the files found there afterwards are listed in
    a single HTML report, with a thumbnail for each PDF.
    """

    def __init__(self, opts=None):
        """Read and un-escape the script and build the command line.

        opts -- parsed options object. This method reads tool_name,
                script_path, output_dir, interpreter, input_tab and
                output_tab from it; run() also reads output_html.

        cheetah/galaxy will provide an escaped string, for example:
            __pd__ your script goes here
            __cr____cn__ourargs __lt__- commandArgs(TRUE)
            __cr____cn__inf = ourargs[1]
            __cr____cn__outf = ourargs[2]
            __cr____cn__inp = read.table(inf,head=T,rownames=F,sep=__sq__Xt__sq__)
            __cr____cn__ write.table(inp,outf, quote=FALSE, sep=__dq__Xt__dq__,row.names=F)
            __cr____cn__sessionInfo()
            __cr____cn__
        """
        self.thumbformat = 'jpg'
        self.opts = opts
        self.toolname = opts.tool_name.replace(' ', '_')
        with open(self.opts.script_path, 'r') as script_file:
            self.script = restore_text(script_file.read())
        # Always defined, so run() can tell whether a log file exists.
        self.tlog = None
        if opts.output_dir:  # may not want these complexities if a simple script
            self.tlog = os.path.join(opts.output_dir, "%s_runner.log" % self.toolname)
            # Keep a copy of the restored script alongside the outputs.
            artifactpath = os.path.join(opts.output_dir, '%s_run.script' % self.toolname)
            with open(artifactpath, 'w') as artifact:
                artifact.write(self.script)
                artifact.write('\n')
        # '-' tells the interpreter to read the script from stdin.
        self.cl = [opts.interpreter, '-', opts.input_tab, opts.output_tab]

    def compressPDF(self, inpdf=None, thumbformat='png'):
        """Compress a PDF in place with gs and make a thumbnail with convert.

        inpdf       -- absolute path to the PDF.
        thumbformat -- file extension of the thumbnail image to create.

        Returns 0 when both external commands succeed, otherwise the first
        non-zero exit status. Raises AssertionError if inpdf is not a file.
        """
        assert os.path.isfile(inpdf), "## Input %s supplied to %s compressPDF not found" % (inpdf, self.toolname)
        log_fd, log_path = tempfile.mkstemp(suffix="%s.log" % self.toolname)
        outpdf = '%s_compressed' % inpdf
        thumb_path = '%s.%s' % (os.path.splitext(inpdf)[0], thumbformat)
        gs_cl = ["gs", "-sDEVICE=pdfwrite", "-dNOPAUSE", "-dBATCH", "-sOutputFile=%s" % outpdf, inpdf]
        convert_cl = ['convert', inpdf, thumb_path]
        # Wrap the descriptor mkstemp already opened instead of opening the
        # path a second time, so no descriptor is leaked.
        sto = os.fdopen(log_fd, 'w')
        try:
            retval1 = subprocess.call(gs_cl, stdout=sto, stderr=sto, cwd=self.opts.output_dir)
            if retval1 == 0:
                # Swap the compressed copy in for the original.
                os.unlink(inpdf)
                shutil.move(outpdf, inpdf)
            retval2 = subprocess.call(convert_cl, stdout=sto, stderr=sto, cwd=self.opts.output_dir)
        finally:
            sto.close()
        retval = retval1 or retval2
        if retval == 0:
            # Nothing to diagnose; on failure the log is kept for inspection.
            os.unlink(log_path)
        return retval

    def getfSize(self, fpath, outpath):
        """Format a nice file size string for fpath inside outpath.

        Returns e.g. ' (1.5 MB)', ' (2.0 KB)' or ' (10 B)'; an empty string
        if the file does not exist or is empty.
        """
        size = ''
        fp = os.path.join(outpath, fpath)
        if os.path.isfile(fp):
            n = float(os.path.getsize(fp))
            if n > 2**20:
                size = ' (%1.1f MB)' % (n / 2**20)
            elif n > 2**10:
                size = ' (%1.1f KB)' % (n / 2**10)
            elif n > 0:
                size = ' (%d B)' % (int(n))
        return size

    def _run_script(self, **popen_kwargs):
        """Feed self.script to the interpreter on stdin; return its exit status."""
        # NOTE(review): the command is joined into one string and run through
        # the shell, so option values containing spaces or shell
        # metacharacters are interpreted by the shell.
        p = subprocess.Popen(' '.join(self.cl), shell=True, stdin=subprocess.PIPE, **popen_kwargs)
        payload = self.script
        if not isinstance(payload, bytes):
            # The pipe is binary; Python 3 text must be encoded first.
            payload = payload.encode('utf-8')
        p.communicate(payload)
        return p.returncode

    def run(self):
        """Run the script and, if an output directory is set, write the report.

        Returns the exit status of the interpreter. Without an output
        directory the script is run and nothing else is done.
        """
        if not self.opts.output_dir:
            return self._run_script()
        with open(self.tlog, 'w') as sto:
            retval = self._run_script(stdout=sto, stderr=sto, cwd=self.opts.output_dir)
        # NOTE(review): the runner log and the script copy live in this
        # directory too, so the listing is normally not empty.
        flist = sorted(x for x in os.listdir(self.opts.output_dir) if x != 'Rplots.pdf')
        html = [galhtmlprefix % progname]
        html.append('<h2>Galaxy %s outputs run at %s</h2><br/>Click on a thumbnail below to download the original PDF<br/>\n' % (self.toolname, timenow()))
        fhtml = []
        if flist:
            html.append('<table cellpadding="3" cellspacing="3">\n')
            for fname in flist:
                dname, ext = os.path.splitext(fname)
                if ext.lower() == '.pdf':  # compress and make a thumbnail
                    thumb = '%s.%s' % (dname, self.thumbformat)
                    pdff = os.path.join(self.opts.output_dir, fname)
                    # Kept apart from retval so the script's own exit status
                    # is what gets returned to the caller.
                    pdf_status = self.compressPDF(inpdf=pdff, thumbformat=self.thumbformat)
                    if pdf_status == 0:
                        s = '<tr><td><a href="%s"><img src="%s" title="Click to download a PDF of %s" hspace="10" width="600"></a></td></tr>\n' % (fname, thumb, fname)
                        html.append(s)
                # Measured after any compression so the size matches the
                # file the link points at.
                sfsize = self.getfSize(fname, self.opts.output_dir)
                fhtml.append('<li><a href="%s">%s %s</a></li>' % (fname, fname, sfsize))
            html.append('</table>\n')
            # The plain link list goes after the thumbnail table.
            fhtml.insert(0, '<ul>')
            fhtml.append('</ul>')
            html += fhtml
        else:
            html.append('<h2>### Error - %s returned no files - please confirm that parameters are sane</h2>' % self.opts.interpreter)
        html.append('<h3>%s log follows below</h3><hr><pre>\n' % self.opts.interpreter)
        with open(self.tlog, 'r') as log_file:
            html += log_file.readlines()
        html.append('%s CL = %s<br/>\n' % (self.toolname, ' '.join(sys.argv)))
        html.append('CL = %s<br/>\n' % (' '.join(self.cl)))
        html.append('</pre>\n')
        html.append(galhtmlattr % (progname, timenow()))
        html.append(galhtmlpostfix)
        if self.opts.output_html:
            with open(self.opts.output_html, 'w') as htmlf:
                htmlf.write('\n'.join(html))
                htmlf.write('\n')
        return retval
214 | |
215 | |
def main():
    """Parse the command line, run the script and exit non-zero on failure.

    Exits with a message on stderr and status 1 when --bad_user is set or
    when the tool name, interpreter or script path is missing. This function
    only reacts to --bad_user; per the file header, the decision about who
    may run the tool is made by the XML wrapper - verify against that file.
    If the script itself fails, its exit status is passed on via sys.exit.
    """
    u = """
This is a Galaxy wrapper. It expects to be called by a special purpose tool.xml as:
<command interpreter="python">rgBaseScriptWrapper.py --script_path "$scriptPath" --tool_name "foo" --interpreter "Rscript"
</command>
"""
    op = optparse.OptionParser(usage=u)
    a = op.add_option
    a('--script_path', default=None)
    a('--tool_name', default=None)
    a('--interpreter', default=None)
    a('--output_dir', default=None)
    a('--output_html', default=None)
    a('--input_tab', default='NONE')
    a('--output_tab', default='NONE')
    a('--user_email', default=None)
    a('--bad_user', default=None)
    opts, args = op.parse_args()
    # Explicit checks rather than assert, so they still run under python -O.
    # sys.exit(message) prints the message to stderr and exits with status 1.
    if opts.bad_user:
        sys.exit('%s is NOT authorized to use this tool. Please ask your friendly admin' % opts.bad_user)
    if not opts.tool_name:
        sys.exit('## Dynamic script wrapper expects a tool name - eg --tool_name=DESeq')
    if not opts.interpreter:
        sys.exit('## Dynamic script wrapper expects an interpreter - eg --interpreter=Rscript')
    if not (opts.script_path and os.path.isfile(opts.script_path)):
        sys.exit('## Dynamic script wrapper expects a script path - eg --script_path=foo.R')
    if opts.output_dir:
        try:
            os.makedirs(opts.output_dir)
        except OSError:
            # An existing directory is fine; anything else is a real error.
            if not os.path.isdir(opts.output_dir):
                raise
    r = ScriptRunner(opts)
    retcode = r.run()
    if retcode:
        sys.exit(retcode)  # indicate failure to job runner


if __name__ == "__main__":
    main()
252 | |
253 |