# HG changeset patch
# User dfornika
# Date 1560553685 14400
# Node ID 350da4807491f7158db5f9541616227cd0e0d938
# Parent a6b8ec872e3c560fbcd025b9765d63010d7feef4
planemo upload for repository https://github.com/dfornika/galaxytools/tree/master/data_managers/data_manager_build_mash_sketch/ commit 34a1400396f10e63e79511a4b28501fdaa03e77d-dirty
diff -r a6b8ec872e3c -r 350da4807491 data_manager/mash_build_sketch.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/data_manager/mash_build_sketch.py Fri Jun 14 19:08:05 2019 -0400
@@ -0,0 +1,109 @@
+#!/usr/bin/env python
+
+from __future__ import print_function
+
+import argparse
+import datetime
+import errno
+import json
+import os
+import string
+import subprocess
+import sys
+
+
+DATA_TABLE_NAME = "mash_sketches"  # default key under 'data_tables' that new entries are appended to
+
+def run(args, cwd):
+    """Run ``args`` in ``cwd``; exit with the child's status if it is non-zero."""
+    exit_status = subprocess.Popen(args=args, shell=False, cwd=cwd).wait()
+    if exit_status:
+        print("Error building sketch.", file=sys.stderr)
+        sys.exit(exit_status)
+
+def mash_build_sketch(data_manager_dict, mash_args, target_directory, data_table_name=DATA_TABLE_NAME):
+    """Run ``mash sketch`` in ``target_directory`` and record the result.
+
+    ``mash_args`` supplies 'threads', 'kmer_size' and 'sketch_size'; missing or
+    None values fall back to mash's defaults (1 thread, k=21, s=1000).  One
+    entry (value/name/path) is appended to ``data_manager_dict`` under
+    ``data_table_name``.  Raises subprocess.CalledProcessError if mash fails.
+
+    NOTE(review): no input sequence files are passed to ``mash sketch`` here;
+    confirm where they are meant to come from.
+    """
+    now = datetime.datetime.utcnow().strftime("%Y-%m-%dT%H%M%SZ")
+    threads = mash_args.get('threads') or 1
+    kmer_size = mash_args.get('kmer_size') or 21
+    sketch_size = mash_args.get('sketch_size') or 1000
+
+    # Was built from an undefined ``sketch_type`` (NameError) with a fixed
+    # "k21.s1000" label; describe the parameters actually used instead.
+    sketch_label = "sketch.k%s.s%s" % (kmer_size, sketch_size)
+    output_prefix = now + "_" + sketch_label
+    database_value = output_prefix + ".msh"
+    database_name = "%s.msh (Created: %s)" % (sketch_label, now)
+    # mash appends ".msh" to the -o prefix, so this is the file it writes.
+    database_path = database_value
+
+    # Popen needs string arguments, and the working directory must be passed
+    # as ``cwd`` (the second positional argument of check_call is bufsize).
+    args = [
+        '-p', str(threads),
+        '-k', str(kmer_size),
+        '-s', str(sketch_size),
+        '-o', output_prefix,
+    ]
+    subprocess.check_call(['mash', 'sketch'] + args, cwd=target_directory)
+
+    data_table_entry = {"value": database_value, "name": database_name, "path": database_path}
+    _add_data_table_entry(data_manager_dict, data_table_entry, data_table_name)
+
+
+def _add_data_table_entry(data_manager_dict, data_table_entry, data_table_name=DATA_TABLE_NAME):
+    """Append ``data_table_entry`` to the named table, creating containers as needed; return the dict."""
+    tables = data_manager_dict.setdefault('data_tables', {})
+    tables.setdefault(data_table_name, []).append(data_table_entry)
+    return data_manager_dict
+
+
+def main():
+    """Parse the command line, build the sketch, and write the data manager JSON.
+
+    Reads the JSON file given as ``data_manager_json`` to find the output
+    directory, creates that directory if needed, runs ``mash_build_sketch``
+    and overwrites the same JSON file with the resulting data table entries.
+    """
+    parser = argparse.ArgumentParser()
+    parser.add_argument('data_manager_json')
+    parser.add_argument('--kmer-size', dest='kmer_size', help='K-mer size')
+    parser.add_argument('--sketch-size', dest='sketch_size', help='Sketch size')
+    parser.add_argument('--threads', dest='threads', default=1, help='threads')
+    args = parser.parse_args()
+
+    # Context managers close the file promptly instead of leaking the handle.
+    with open(args.data_manager_json) as json_in:
+        data_manager_input = json.load(json_in)
+    target_directory = data_manager_input['output_data'][0]['extra_files_path']
+
+    mash_args = {
+        'kmer_size': args.kmer_size,
+        'sketch_size': args.sketch_size,  # was args.kmer_size (copy-paste slip)
+        'threads': args.threads,
+    }
+
+    try:
+        os.mkdir(target_directory)
+    except OSError as exc:
+        # An already-existing directory is fine; anything else is a real error.
+        if not (exc.errno == errno.EEXIST and os.path.isdir(target_directory)):
+            raise
+    data_manager_output = {}
+    mash_build_sketch(data_manager_output, mash_args, target_directory)
+    # Text mode: json.dumps returns str, which a 'wb' handle rejects on Python 3.
+    with open(args.data_manager_json, 'w') as json_out:
+        json_out.write(json.dumps(data_manager_output))
+
+
+if __name__ == "__main__":  # run main() only when executed as a script, not on import
+ main()
diff -r a6b8ec872e3c -r 350da4807491 data_manager/mash_build_sketch.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/data_manager/mash_build_sketch.xml Fri Jun 14 19:08:05 2019 -0400
@@ -0,0 +1,30 @@
+
+
+ mash sketch builder
+
+ mash
+
+ mash --version
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ 10.1186/gb-2014-15-3-r46
+
+
diff -r a6b8ec872e3c -r 350da4807491 data_manager/mash_build_sketch_refseq.py
--- a/data_manager/mash_build_sketch_refseq.py Wed Mar 06 19:52:04 2019 -0500
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
@@ -1,99 +0,0 @@
-#!/usr/bin/env python
-
-from __future__ import print_function
-
-import argparse
-import datetime
-import errno
-import json
-import os
-import string
-import subprocess
-import sys
-
-
-DATA_TABLE_NAME = "mash_sketches"
-
-def run(args, cwd):
- proc = subprocess.Popen(args=args, shell=False, cwd=cwd)
- return_code = proc.wait()
- if return_code:
- print("Error building sketch.", file=sys.stderr)
- sys.exit( return_code )
-
-def mash_build_sketch_refseq(data_manager_dict, sketch_type, target_directory, data_table_name=DATA_TABLE_NAME):
-
- now = datetime.datetime.utcnow().strftime("%Y-%m-%dT%H%M%SZ")
-
- database_value = "_".join([
- now,
- "refseq" + "." +
- sketch_type + "." +
- "k21.s1000.msh",
- ])
-
- database_name = " ".join([
- "refseq" + "." +
- sketch_type + "." +
- "k21.s1000.msh"
- "(Created:",
- now + ")"
- ])
-
- database_path = database_value
-
- args = [
- 'https://gembox.cbcb.umd.edu/mash/refseq.' + sketch_type + '.k21s1000.msh'
- ]
-
- run(['wget'] + args, target_directory)
-
- data_table_entry = {
- "value": database_value,
- "name": database_name,
- "path": database_path,
- }
-
- _add_data_table_entry(data_manager_dict, data_table_entry)
-
-
-def _add_data_table_entry(data_manager_dict, data_table_entry, data_table_name=DATA_TABLE_NAME):
- data_manager_dict['data_tables'] = data_manager_dict.get( 'data_tables', {} )
- data_manager_dict['data_tables'][data_table_name] = data_manager_dict['data_tables'].get( data_table_name, [] )
- data_manager_dict['data_tables'][data_table_name].append( data_table_entry )
- return data_manager_dict
-
-
-def main():
- parser = argparse.ArgumentParser()
- parser.add_argument('data_manager_json')
- parser.add_argument('--sketch-type', dest='sketch_type', help='Sketch Type (genome or plasmid or genome+plasmid)' )
- parser.add_argument( '-t', '--threads', dest='threads', default=1, help='threads' )
-
- args = parser.parse_args()
-
- data_manager_input = json.loads(open(args.data_manager_json).read())
-
- target_directory = data_manager_input['output_data'][0]['extra_files_path']
-
- try:
- os.mkdir( target_directory )
- except OSError as exc:
- if exc.errno == errno.EEXIST and os.path.isdir( target_directory ):
- pass
- else:
- raise
-
- data_manager_output = {}
-
- mash_build_sketch_refseq(
- data_manager_output,
- args.sketch_type,
- target_directory,
- )
-
- open(args.data_manager_json, 'wb').write(json.dumps(data_manager_output))
-
-
-if __name__ == "__main__":
- main()
diff -r a6b8ec872e3c -r 350da4807491 data_manager/mash_build_sketch_refseq.xml
--- a/data_manager/mash_build_sketch_refseq.xml Wed Mar 06 19:52:04 2019 -0500
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
@@ -1,31 +0,0 @@
-
-
- database builder
-
- mash
-
- mash --version
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- 10.1186/gb-2014-15-3-r46
-
-