comparison assembly_post_processor.py @ 54:9a105e8f08e5 draft

Uploaded
author greg
date Mon, 22 May 2017 10:11:50 -0400
parents 9d58af3e459d
children ee5edbfd99c3
comparison
equal deleted inserted replaced
53:0f65703d5bb8 54:9a105e8f08e5
1 #!/usr/bin/env python 1 #!/usr/bin/env python
2 import argparse 2 import argparse
3 import os
3 4
4 import utils 5 import utils
6
7 OUTPUT_DIR = 'assemblyPostProcessing_dir'
5 8
6 parser = argparse.ArgumentParser() 9 parser = argparse.ArgumentParser()
7 parser.add_argument('--dereplicate', dest='dereplicate', default=None, help='Remove duplicate sequences') 10 parser.add_argument('--dereplicate', dest='dereplicate', default=None, help='Remove duplicate sequences')
8 parser.add_argument('--gap_trimming', dest='gap_trimming', type=float, default=0, help='Trim alignments') 11 parser.add_argument('--gap_trimming', dest='gap_trimming', type=float, default=0, help='Trim alignments')
9 parser.add_argument('--gene_family_search', dest='gene_family_search', default=None, help='Targeted gene families') 12 parser.add_argument('--gene_family_search', dest='gene_family_search', default=None, help='Targeted gene families')
10 parser.add_argument('--method', dest='method', default=None, help='Protein clustering method') 13 parser.add_argument('--method', dest='method', default=None, help='Protein clustering method')
11 parser.add_argument('--min_length', dest='min_length', type=int, default=0, help='Minimum sequence length') 14 parser.add_argument('--min_length', dest='min_length', type=int, default=0, help='Minimum sequence length')
12 parser.add_argument('--num_threads', dest='num_threads', type=int, help='Number of processors') 15 parser.add_argument('--num_threads', dest='num_threads', type=int, help='Number of processors')
16 parser.add_argument('--output_pttgf', dest='output_pttgf', default=None, help='Primary targeted gene families dataset')
17 parser.add_argument('--output_pttgf_dir', dest='output_pttgf_dir', default=None, help='Directory hierarchy of targeted gene family datasets')
13 parser.add_argument('--prediction_method', dest='prediction_method', help='Coding regions prediction method') 18 parser.add_argument('--prediction_method', dest='prediction_method', help='Coding regions prediction method')
14 parser.add_argument('--scaffold', dest='scaffold', default=None, help='Gene family scaffold') 19 parser.add_argument('--scaffold', dest='scaffold', default=None, help='Gene family scaffold')
15 parser.add_argument('--score_matrices', dest='score_matrices', default=None, help='Scores matrices') 20 parser.add_argument('--score_matrices', dest='score_matrices', default=None, help='Scores matrices')
16 parser.add_argument('--strand_specific', dest='strand_specific', default=None, help='Strand-specific assembly') 21 parser.add_argument('--strand_specific', dest='strand_specific', default=None, help='Strand-specific assembly')
17 parser.add_argument('--transcripts', dest='transcripts', help='Transcriptome assembly fasta file') 22 parser.add_argument('--transcripts', dest='transcripts', help='Transcriptome assembly fasta file')
39 if args.strand_specific is not None: 44 if args.strand_specific is not None:
40 cmd += ' --strand_specific' 45 cmd += ' --strand_specific'
41 cmd += ' --transcripts %s' % args.transcripts 46 cmd += ' --transcripts %s' % args.transcripts
42 # Run the command. 47 # Run the command.
43 utils.run_command(cmd) 48 utils.run_command(cmd)
49
50 # Handle outputs.
51 if args.output_pttgf is not None and args.output_pttgf_dir is not None:
52 src_output_dir = os.path.join(OUTPUT_DIR, 'targeted_gene_families')
53 utils.move_directory_files(src_output_dir, args.output_pttgf_dir)