Mercurial > repos > geert-vandeweyer > cufflinks
comparison cufflinks_wrapper.py @ 5:261425bba55d draft
corrected syntax error in wrapper.py
| author | geert-vandeweyer |
|---|---|
| date | Fri, 01 Aug 2014 08:54:01 -0400 |
| parents | ae8ad9d17e34 |
| children | 82f0d5660884 |
comparison
equal
deleted
inserted
replaced
| 4:03fdfb596475 | 5:261425bba55d |
|---|---|
| 19 parser.add_option( '-j', '--pre-mrna-fraction', dest='pre_mrna_fraction', help='Some RNA-Seq protocols produce a significant amount of reads that originate from incompletely spliced transcripts, and these reads can confound the assembly of fully spliced mRNAs. Cufflinks uses this parameter to filter out alignments that lie within the intronic intervals implied by the spliced alignments. The minimum depth of coverage in the intronic region covered by the alignment is divided by the number of spliced reads, and if the result is lower than this parameter value, the intronic alignments are ignored. The default is 5%.' ) | 19 parser.add_option( '-j', '--pre-mrna-fraction', dest='pre_mrna_fraction', help='Some RNA-Seq protocols produce a significant amount of reads that originate from incompletely spliced transcripts, and these reads can confound the assembly of fully spliced mRNAs. Cufflinks uses this parameter to filter out alignments that lie within the intronic intervals implied by the spliced alignments. The minimum depth of coverage in the intronic region covered by the alignment is divided by the number of spliced reads, and if the result is lower than this parameter value, the intronic alignments are ignored. The default is 5%.' ) |
| 20 parser.add_option( '-p', '--num-threads', dest='num_threads', help='Use this many threads to align reads. The default is 1.' ) | 20 parser.add_option( '-p', '--num-threads', dest='num_threads', help='Use this many threads to align reads. The default is 1.' ) |
| 21 parser.add_option( '-G', '--GTF', dest='GTF', help='Tells Cufflinks to use the supplied reference annotation to estimate isoform expression. It will not assemble novel transcripts, and the program will ignore alignments not structurally compatible with any reference transcript.' ) | 21 parser.add_option( '-G', '--GTF', dest='GTF', help='Tells Cufflinks to use the supplied reference annotation to estimate isoform expression. It will not assemble novel transcripts, and the program will ignore alignments not structurally compatible with any reference transcript.' ) |
| 22 parser.add_option ("--compatible-hits-norm",dest='compatible_hits_norm',help='Count hits compatible with reference RNAs only') | 22 parser.add_option ("--compatible-hits-norm",dest='compatible_hits_norm',help='Count hits compatible with reference RNAs only') |
| 23 parser.add_option( '-g', '--GTF-guide', dest='GTFguide', help='use reference transcript annotation to guide assembly' ) | 23 parser.add_option( '-g', '--GTF-guide', dest='GTFguide', help='use reference transcript annotation to guide assembly' ) |
| 24 parser.add_option("--3-overhang-tolerance",dest='3_overhang_tolerance', help='The number of bp allowed to overhang the 3prime end of a reference transcript when determining if an assembled transcript should be merged with it (ie, the assembled transcript is not novel). The default is 600 bp.') | 24 parser.add_option("--3-overhang-tolerance",dest='three_overhang_tolerance', help='The number of bp allowed to overhang the 3prime end of a reference transcript when determining if an assembled transcript should be merged with it (ie, the assembled transcript is not novel). The default is 600 bp.') |
| 25 parser.add_option("--intron-overhang-tolerance",dest='intron_overhang_tolerance',help='The number of bp allowed to enter the intron of a reference transcript when determining if an assembled transcript should be merged with it (ie, the assembled transcript is not novel). The default is 50 bp.') | 25 parser.add_option("--intron-overhang-tolerance",dest='intron_overhang_tolerance',help='The number of bp allowed to enter the intron of a reference transcript when determining if an assembled transcript should be merged with it (ie, the assembled transcript is not novel). The default is 50 bp.') |
| 26 parser.add_option("--no-faux-reads", dest='no_faux_reads',help='This option disables tiling of the reference transcripts with faux reads. Use this if you only want to use sequencing reads in assembly but do not want to output assembled transcripts that lay within reference transcripts. All reference transcripts in the input annotation will also be included in the output.') | 26 parser.add_option("--no-faux-reads", dest='no_faux_reads',help='This option disables tiling of the reference transcripts with faux reads. Use this if you only want to use sequencing reads in assembly but do not want to output assembled transcripts that lay within reference transcripts. All reference transcripts in the input annotation will also be included in the output.') |
| 27 parser.add_option( '-u', '--multi-read-correct', dest='multi_read_correct', action="store_true", help='Tells Cufflinks to do an initial estimation procedure to more accurately weight reads mapping to multiple locations in the genome') | 27 parser.add_option( '-u', '--multi-read-correct', dest='multi_read_correct', action="store_true", help='Tells Cufflinks to do an initial estimation procedure to more accurately weight reads mapping to multiple locations in the genome') |
| 28 | 28 |
| 29 # Normalization options. | 29 # Normalization options. |
| 52 parser.add_option( '--overhang-tolerance', dest='overhang_tolerance', help='The number of bp allowed to enter the intron of a transcript when determining if a \ | 52 parser.add_option( '--overhang-tolerance', dest='overhang_tolerance', help='The number of bp allowed to enter the intron of a transcript when determining if a \ |
| 53 read or another transcript is mappable to/compatible with it. The default is 8 bp based on the default bowtie/TopHat parameters.' ) | 53 read or another transcript is mappable to/compatible with it. The default is 8 bp based on the default bowtie/TopHat parameters.' ) |
| 54 parser.add_option( '--max-bundle-length', dest='max_bundle_length', help='Maximum genomic length of a given bundle" help="Default: 3,500,000bp' ) | 54 parser.add_option( '--max-bundle-length', dest='max_bundle_length', help='Maximum genomic length of a given bundle" help="Default: 3,500,000bp' ) |
| 55 parser.add_option( '--max-bundle-frags', dest='max_bundle_frags', help='Sets the maximum number of fragments a locus may have before being skipped. Skipped loci are listed in skipped.gtf. Default: 1,000,000' ) | 55 parser.add_option( '--max-bundle-frags', dest='max_bundle_frags', help='Sets the maximum number of fragments a locus may have before being skipped. Skipped loci are listed in skipped.gtf. Default: 1,000,000' ) |
| 56 parser.add_option( '--min-intron-length', dest='min_intron_length', help='Minimal allowed intron size. Default: 50' ) | 56 parser.add_option( '--min-intron-length', dest='min_intron_length', help='Minimal allowed intron size. Default: 50' ) |
| 57 parser.add_option( '--trim-3-avgcov-thresh', dest='trim_3_avgcov_thresh', help='Minimum average coverage required to attempt 3prime trimming. Default: 10' ) | 57 parser.add_option( '--trim-3-avgcov-thresh', dest='trim_three_avgcov_thresh', help='Minimum average coverage required to attempt 3prime trimming. Default: 10' ) |
| 58 parser.add_option( '--trim-3-dropoff-frac', dest='trim_3_dropoff_frac', help='The fraction of average coverage below which to trim the 3prime end of an assembled transcript. Default: 0.1' ) | 58 parser.add_option( '--trim-3-dropoff-frac', dest='trim_three_dropoff_frac', help='The fraction of average coverage below which to trim the 3prime end of an assembled transcript. Default: 0.1' ) |
| 59 | 59 |
| 60 | 60 |
| 61 # Bias correction options. | 61 # Bias correction options. |
| 62 parser.add_option( '-b', dest='do_bias_correction', action="store_true", help='Providing Cufflinks with a multifasta file via this option instructs it to run our new bias detection and correction algorithm which can significantly improve accuracy of transcript abundance estimates.') | 62 parser.add_option( '-b', dest='do_bias_correction', action="store_true", help='Providing Cufflinks with a multifasta file via this option instructs it to run our new bias detection and correction algorithm which can significantly improve accuracy of transcript abundance estimates.') |
| 63 parser.add_option( '', '--index', dest='index', help='The path of the reference genome' ) | 63 parser.add_option( '', '--index', dest='index', help='The path of the reference genome' ) |
| 117 cmd += ( " -G %s" % options.GTF ) | 117 cmd += ( " -G %s" % options.GTF ) |
| 118 if options.compatible_hits_norm: | 118 if options.compatible_hits_norm: |
| 119 cmd += ( " --compatible-hits-norm" ) | 119 cmd += ( " --compatible-hits-norm" ) |
| 120 if options.GTFguide: | 120 if options.GTFguide: |
| 121 cmd += ( " -g %s" % options.GTFguide ) | 121 cmd += ( " -g %s" % options.GTFguide ) |
| 122 cmd += ( " --3-overhang-tolerance %i" % int ( options.3_overhang_tolerance ) ) | 122 cmd += ( " --3-overhang-tolerance %i" % int ( options.three_overhang_tolerance ) ) |
| 123 cmd += ( " --intron-overhang-tolerance %i" % int ( options.intron_overhang_tolerance ) ) | 123 cmd += ( " --intron-overhang-tolerance %i" % int ( options.intron_overhang_tolerance ) ) |
| 124 if options.no_faux_reads: | 124 if options.no_faux_reads: |
| 125 cmd += ( " --no-faux-reads" ) | 125 cmd += ( " --no-faux-reads" ) |
| 126 if options.multi_read_correct: | 126 if options.multi_read_correct: |
| 127 cmd += ( " -u" ) | 127 cmd += ( " -u" ) |
| 146 cmd += ( " --max-bundle-length %i" % int ( options.max_bundle_length ) ) | 146 cmd += ( " --max-bundle-length %i" % int ( options.max_bundle_length ) ) |
| 147 if options.max_bundle_frags: | 147 if options.max_bundle_frags: |
| 148 cmd += ( " --max-bundle-frags %i" % int ( options.max_bundle_frags ) ) | 148 cmd += ( " --max-bundle-frags %i" % int ( options.max_bundle_frags ) ) |
| 149 if options.min_intron_length: | 149 if options.min_intron_length: |
| 150 cmd += ( " --min-intron-length %i" % int ( options.min_intron_length ) ) | 150 cmd += ( " --min-intron-length %i" % int ( options.min_intron_length ) ) |
| 151 if options.trim_3_avgcov_thresh: | 151 if options.trim_three_avgcov_thresh: |
| 152 cmd += ( " --trim-3-avgcov-thresh %i" % int ( options.trim_3_avgcov_thresh ) ) | 152 cmd += ( " --trim-3-avgcov-thresh %i" % int ( options.trim_three_avgcov_thresh ) ) |
| 153 if options.trim_3_dropoff_frac: | 153 if options.trim_three_dropoff_frac: |
| 154 cmd += ( " --trim-3-dropoff-frac %f" % float ( options.trim_3_dropoff_frac ) ) | 154 cmd += ( " --trim-3-dropoff-frac %f" % float ( options.trim_three_dropoff_frac ) ) |
| 155 | 155 |
| 156 if options.do_bias_correction: | 156 if options.do_bias_correction: |
| 157 cmd += ( " -b %s" % seq_path ) | 157 cmd += ( " -b %s" % seq_path ) |
| 158 if options.no_effective_length_correction: | 158 if options.no_effective_length_correction: |
| 159 cmd += ( " --no-effective-length-correction" ) | 159 cmd += ( " --no-effective-length-correction" ) |
