Mercurial > repos > greg > assembly_post_processor
comparison assembly_post_processor.py @ 65:baf10f7f3d4a draft
Uploaded
| author | greg |
|---|---|
| date | Wed, 24 May 2017 13:22:28 -0400 |
| parents | e7f264e21d9a |
| children | 9da5dc4b99cc |
comparison
equal
deleted
inserted
replaced
| 64:45aa928ed5df | 65:baf10f7f3d4a |
|---|---|
| 1 #!/usr/bin/env python | 1 #!/usr/bin/env python |
| 2 import argparse | 2 import argparse |
| 3 import os | 3 import os |
| 4 import shutil | |
| 4 | 5 |
| 5 import utils | 6 import utils |
| 6 | 7 |
| 7 OUTPUT_DIR = 'assemblyPostProcessing_dir' | 8 OUTPUT_DIR = 'assemblyPostProcessing_dir' |
| 8 | 9 |
| 12 parser.add_argument('--gene_family_search', dest='gene_family_search', default=None, help='Targeted gene families') | 13 parser.add_argument('--gene_family_search', dest='gene_family_search', default=None, help='Targeted gene families') |
| 13 parser.add_argument('--method', dest='method', default=None, help='Protein clustering method') | 14 parser.add_argument('--method', dest='method', default=None, help='Protein clustering method') |
| 14 parser.add_argument('--min_length', dest='min_length', type=int, default=0, help='Minimum sequence length') | 15 parser.add_argument('--min_length', dest='min_length', type=int, default=0, help='Minimum sequence length') |
| 15 parser.add_argument('--num_threads', dest='num_threads', type=int, help='Number of processors') | 16 parser.add_argument('--num_threads', dest='num_threads', type=int, help='Number of processors') |
| 16 parser.add_argument('--output_pttgf', dest='output_pttgf', default=None, help='Primary targeted gene families dataset') | 17 parser.add_argument('--output_pttgf', dest='output_pttgf', default=None, help='Primary targeted gene families dataset') |
| 18 parser.add_argument('--output_cds', dest='output_cds', help='Output transcripts.cds') | |
| 19 parser.add_argument('--output_cleaned_cds', dest='output_cleaned_cds', help='Output transcripts.cleaned.cds') | |
| 20 parser.add_argument('--output_cleaned_nr_cds', dest='output_cleaned_nr_cds', default=None, help='Output transcripts.cleaned.nr.cds') | |
| 21 parser.add_argument('--output_cleaned_nr_pep', dest='output_cleaned_nr_pep', default=None, help='Output transcripts.cleaned.nr.pep') | |
| 22 parser.add_argument('--output_cleaned_pep', dest='output_cleaned_pep', help='Output transcripts.cleaned.pep') | |
| 23 parser.add_argument('--output_pep', dest='output_pep', help='Output transcripts.pep') | |
| 17 parser.add_argument('--output_pttgf_dir', dest='output_pttgf_dir', default=None, help='Directory hierarchy of targeted gene family datasets') | 24 parser.add_argument('--output_pttgf_dir', dest='output_pttgf_dir', default=None, help='Directory hierarchy of targeted gene family datasets') |
| 18 parser.add_argument('--prediction_method', dest='prediction_method', help='Coding regions prediction method') | 25 parser.add_argument('--prediction_method', dest='prediction_method', help='Coding regions prediction method') |
| 19 parser.add_argument('--scaffold', dest='scaffold', default=None, help='Gene family scaffold') | 26 parser.add_argument('--scaffold', dest='scaffold', default=None, help='Gene family scaffold') |
| 20 parser.add_argument('--score_matrices', dest='score_matrices', default=None, help='Scores matrices') | 27 parser.add_argument('--score_matrices', dest='score_matrices', default=None, help='Scores matrices') |
| 21 parser.add_argument('--strand_specific', dest='strand_specific', default=None, help='Strand-specific assembly') | 28 parser.add_argument('--strand_specific', dest='strand_specific', default=None, help='Strand-specific assembly') |
| 46 cmd += ' --transcripts %s' % args.transcripts | 53 cmd += ' --transcripts %s' % args.transcripts |
| 47 # Run the command. | 54 # Run the command. |
| 48 utils.run_command(cmd) | 55 utils.run_command(cmd) |
| 49 | 56 |
| 50 # Handle outputs. | 57 # Handle outputs. |
| 58 shutil.move(os.path.join(OUTPUT_DIR, 'transcripts.cds'), args.output_cds) | |
| 59 shutil.move(os.path.join(OUTPUT_DIR, 'transcripts.cleaned.cds'), args.output_cleaned_cds) | |
| 60 if args.output_cleaned_nr_cds is not None: | |
| 61 shutil.move(os.path.join(OUTPUT_DIR, 'transcripts.cleaned.nr.cds'), args.output_cleaned_nr_cds) | |
| 62 if args.output_cleaned_nr_pep is not None: | |
| 63 shutil.move(os.path.join(OUTPUT_DIR, 'transcripts.cleaned.nr.pep'), args.output_cleaned_nr_pep) | |
| 64 shutil.move(os.path.join(OUTPUT_DIR, 'transcripts.cleaned.pep'), args.output_cleaned_pep) | |
| 65 shutil.move(os.path.join(OUTPUT_DIR, 'transcripts.pep'), args.output_pep) | |
| 51 if args.output_pttgf is not None and args.output_pttgf_dir is not None: | 66 if args.output_pttgf is not None and args.output_pttgf_dir is not None: |
| 52 src_output_dir = os.path.join(OUTPUT_DIR, 'targeted_gene_families') | 67 src_output_dir = os.path.join(OUTPUT_DIR, 'targeted_gene_families') |
| 53 utils.move_directory_files(src_output_dir, args.output_pttgf_dir) | 68 utils.move_directory_files(src_output_dir, args.output_pttgf_dir) |
| 54 utils.write_html_output(args.output_pttgf, 'Targeted gene families', args.output_pttgf_dir) | 69 utils.write_html_output(args.output_pttgf, 'Targeted gene families', args.output_pttgf_dir) |
