# HG changeset patch # User devteam # Date 1483458644 18000 # Node ID fa69d5a7b8c8c6c1b477a9939d8bc07322d609ee # Parent fed480fea9f0bf5e850dae31df4a177eaff530c0 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/bowtie2 commit d0e857ba2691ca15b6239890baf98dbe7bc3ccbd diff -r fed480fea9f0 -r fa69d5a7b8c8 bowtie2_wrapper.xml --- a/bowtie2_wrapper.xml Fri Dec 18 18:50:22 2015 -0500 +++ b/bowtie2_wrapper.xml Tue Jan 03 10:50:44 2017 -0500 @@ -1,23 +1,22 @@ - + - map reads against reference genome read_group_macros.xml + + bowtie2 + samtools + bowtie2 --version - - bowtie2 - samtools - - - + '$mapping_stats' #end if ## output file #if ( str( $analysis_type.analysis_type_selector ) != "full" or str( $analysis_type.sam_opt ) != "true" ): - | samtools view -Su - | samtools sort -o - - > $output + | samtools sort -O bam -o '$output' #else - > $output_sam + > '$output_sam' #end if ## rename unaligned sequence files #if $library.type == "paired" and $output_unaligned_reads_l and $output_unaligned_reads_r: #from os.path import splitext #set _unaligned_root, _unaligned_ext = splitext( str( $output_unaligned_reads_l ) ) - && mv "${ _unaligned_root }.1${_unaligned_ext}" "${ output_unaligned_reads_l }" - && mv "${ _unaligned_root }.2${_unaligned_ext}" "${ output_unaligned_reads_r }" + && mv "${ _unaligned_root }.1${_unaligned_ext}" '$output_unaligned_reads_l' + && mv "${ _unaligned_root }.2${_unaligned_ext}" '$output_unaligned_reads_r' + #end if + #if $library.type == "paired" and $output_aligned_reads_l and $output_aligned_reads_r: + #from os.path import splitext + #set _aligned_root, _aligned_ext = splitext( str( $output_aligned_reads_l ) ) + && mv "${ _aligned_root }.1${_aligned_ext}" '$output_aligned_reads_l' + && mv "${ _aligned_root }.2${_aligned_ext}" '$output_aligned_reads_r' #end if - - - - - - + ]]> @@ -205,11 +211,13 @@ + + @@ -237,6 +245,7 @@ + @@ -262,7 +271,7 @@ - + @@ -278,10 +287,10 @@ - + - + @@ -336,10 +345,10 @@ - - - - + + + + @@ -404,7 +413,7 @@ - + @@ -439,9 +448,9 @@ - + - + library['unaligned_file'] is True @@ -464,6 +473,45 @@ + + library['aligned_file'] is True + + + + + + + + + + + + + + + + + + + ( library['type'] == "paired" or library['type'] == "paired_collection" ) and library['aligned_file'] is True + + + + + + + + + + + + + ( library['type'] == "paired" or library['type'] == "paired_collection" ) and library['unaligned_file'] is True @@ -481,7 +529,7 @@ - + analysis_type['analysis_type_selector'] == "simple" or analysis_type['sam_opt'] is False @@ -576,10 +624,10 @@ - - + Support** link at the top of the interface and let us know that an index needs to be added @@ -619,18 +667,18 @@ **Input options**:: - -s/--skip <int> - Skip (i.e. do not align) the first `<int>` reads or pairs in the input. + -s/--skip + Skip (i.e. do not align) the first `` reads or pairs in the input. - -u/--qupto <int> - Align the first `<int>` reads or read pairs from the input (after the + -u/--qupto + Align the first `` reads or read pairs from the input (after the `-s`/`--skip` reads or pairs have been skipped), then stop. Default: no limit. - -5/--trim5 <int> - Trim `<int>` bases from 5' (left) end of each read before alignment (default: 0). + -5/--trim5 + Trim `` bases from 5' (left) end of each read before alignment (default: 0). - -3/--trim3 <int> - Trim `<int>` bases from 3' (right) end of each read before alignment (default: 0). + -3/--trim3 + Trim `` bases from 3' (right) end of each read before alignment (default: 0). --phred33 Input qualities are ASCII chars equal to the Phred quality plus 33. This is @@ -650,7 +698,7 @@ Quality values are represented in the read input file as space-separated ASCII integers, e.g., `40 40 30 40`..., rather than ASCII characters, e.g., `II?I`.... Integers are treated as being on the Phred quality scale unless `--solexa-quals` is also specified. Default: off. - + ------ **Presets in `--end-to-end` mode**:: @@ -660,7 +708,7 @@ --fast Same as: `-D 10 -R 2 -N 0 -L 22 -i S,0,2.50` - + --sensitive Same as: `-D 15 -R 2 -L 22 -i S,1,1.15` (default in `--end-to-end` mode) @@ -682,23 +730,23 @@ --very-sensitive-local Same as: `-D 20 -R 3 -N 0 -L 20 -i S,1,0.50` - + ------ **Alignment options**:: - -N <int> + -N Sets the number of mismatches to allowed in a seed alignment during multiseed alignment. Can be set to 0 or 1. Setting this higher makes alignment slower (often much slower) but increases sensitivity. Default: 0. - -L <int> + -L Sets the length of the seed substrings to align during multiseed alignment. Smaller values make alignment slower but more sensitive. Default: the `--sensitive` preset is used by default, which sets `-L` to 22 in `--end-to-end` mode and to 20 in `--local` mode. - -i <func> + -i Sets a function governing the interval between seed substrings to use during multiseed alignment. For instance, if the read has 30 characers, and seed length is 10, and the seed interval is 6, the seeds extracted will be: @@ -722,24 +770,24 @@ default, which sets `-i` to `S,1,1.15` in `--end-to-end` mode to `-i S,1,0.75` in `--local` mode. - --n-ceil <func> + --n-ceil Sets a function governing the maximum number of ambiguous characters (usually `N`s and/or `.`s) allowed in a read as a function of read length. For instance, specifying `-L,0,0.15` sets the N-ceiling function `f` to `f(x) = 0 + 0.15 * x`, where x is the read length. Reads exceeding this ceiling are filtered out. Default: `L,0,0.15`. - --dpad <int> - "Pads" dynamic programming problems by `<int>` columns on either side to allow + --dpad + "Pads" dynamic programming problems by `` columns on either side to allow gaps. Default: 15. - --gbar <int> - Disallow gaps within `<int>` positions of the beginning or end of the read. + --gbar + Disallow gaps within `` positions of the beginning or end of the read. Default: 4. --ignore-quals When calculating a mismatch penalty, always consider the quality value at the - mismatched position to be the highest possible, regardless of the actual value. + mismatched position to be the highest possible, regardless of the actual value. I.e. input is treated as though all quality values are high. This is also the default behavior when the input doesn't specify quality values (e.g. in `-f`, `-r`, or `-c` modes). @@ -751,7 +799,7 @@ reference strand. In paired-end mode, `--nofw` and `--norc` pertain to the fragments; i.e. specifying `--nofw` causes `bowtie2` to explore only those paired-end configurations corresponding to fragments from the reverse-complement - (Crick) strand. Default: both strands enabled. + (Crick) strand. Default: both strands enabled. --no-1mm-upfront By default, Bowtie 2 will attempt to find either an exact or a 1-mismatch @@ -782,13 +830,13 @@ and one of the presets (e.g. `--local --very-fast`) is equivalent to specifying the local version of the preset (`--very-fast-local`). This is mutually exclusive with `--end-to-end`. `--end-to-end` is the default mode. - + ----- **Scoring options**:: - --ma <int> - Sets the match bonus. In `--local` mode `<int>` is added to the alignment + --ma + Sets the match bonus. In `--local` mode `` is added to the alignment score for each position where a read character aligns to a reference character and the characters match. Not used in `--end-to-end` mode. Default: 2. @@ -801,31 +849,31 @@ Otherwise, the number subtracted is `MN + floor( (MX-MN)(MIN(Q, 40.0)/40.0) )` where Q is the Phred quality value. Default: `MX` = 6, `MN` = 2. - --np <int> + --np Sets penalty for positions where the read, reference, or both, contain an ambiguous character such as `N`. Default: 1. - --rdg <int1>,<int2> - Sets the read gap open (`<int1>`) and extend (`<int2>`) penalties. A read gap of - length N gets a penalty of `<int1>` + N * `<int2>`. Default: 5, 3. + --rdg , + Sets the read gap open (``) and extend (``) penalties. A read gap of + length N gets a penalty of `` + N * ``. Default: 5, 3. - --rfg <int1>,<int2> - Sets the reference gap open (`<int1>`) and extend (`<int2>`) penalties. A - reference gap of length N gets a penalty of `<int1>` + N * `<int2>`. Default: + --rfg , + Sets the reference gap open (``) and extend (``) penalties. A + reference gap of length N gets a penalty of `` + N * ``. Default: 5, 3. - --score-min <func> + --score-min Sets a function governing the minimum alignment score needed for an alignment to be considered "valid" (i.e. good enough to report). This is a function of read length. For instance, specifying `L,0,-0.6` sets the minimum-score function `f` to `f(x) = 0 + -0.6 * x`, where `x` is the read length. The default in `--end-to-end` mode is `L,-0.6,-0.6` and the default in `--local` mode is `G,20,8`. - ------ + +----- **Reporting options**:: - -k <int> + -k By default, `bowtie2` searches for distinct, valid alignments for each read. When it finds a valid alignment, it continues looking for alignments that are nearly as good or better. The best alignment found is reported (randomly @@ -834,15 +882,15 @@ `AS:i` and `XS:i`. When `-k` is specified, however, `bowtie2` behaves differently. Instead, it - searches for at most `<int>` distinct, valid alignments for each read. The + searches for at most `` distinct, valid alignments for each read. The search terminates when it can't find more distinct valid alignments, or when it - finds `<int>`, whichever happens first. All alignments found are reported in + finds ``, whichever happens first. All alignments found are reported in descending order by alignment score. The alignment score for a paired-end alignment equals the sum of the alignment scores of the individual mates. Each reported read or pair alignment beyond the first has the SAM 'secondary' bit (which equals 256) set in its FLAGS field. For reads that have more than - `<int>` distinct, valid alignments, `bowtie2` does not guarantee that the - `<int>` alignments reported are the best possible in terms of alignment score. + `` distinct, valid alignments, `bowtie2` does not guarantee that the + `` alignments reported are the best possible in terms of alignment score. `-k` is mutually exclusive with `-a`. Note: Bowtie 2 is not designed with large values for `-k` in mind, and when @@ -854,30 +902,30 @@ Note: Bowtie 2 is not designed with `-a` mode in mind, and when aligning reads to long, repetitive genomes this mode can be very, very slow. - + ----- **Effort options**:: - -D <int> - Up to `<int>` consecutive seed extension attempts can "fail" before Bowtie 2 + -D + Up to `` consecutive seed extension attempts can "fail" before Bowtie 2 moves on, using the alignments found so far. A seed extension "fails" if it does not yield a new best or a new second-best alignment. This limit is automatically adjusted up when -k or -a are specified. Default: 15. - -R <int> - `<int>` is the maximum number of times Bowtie 2 will "re-seed" reads with + -R + `` is the maximum number of times Bowtie 2 will "re-seed" reads with repetitive seeds. When "re-seeding," Bowtie 2 simply chooses a new set of reads (same length, same number of mismatches allowed) at different offsets and searches for more alignments. A read is considered to have repetitive seeds if the total number of seed hits divided by the number of seeds that aligned at least once is greater than 300. Default: 2. - + ----- **Paired-end options**:: - -I/--minins <int> + -I/--minins The minimum fragment length for valid paired-end alignments. E.g. if `-I 60` is specified and a paired-end alignment consists of two 20-bp alignments in the appropriate orientation with a 20-bp gap between them, that alignment is @@ -891,9 +939,9 @@ For typical fragment length ranges (200 to 400 nucleotides), Bowtie 2 is very efficient. - Default: 0 (essentially imposing no minimum) + Default: 0 (essentially imposing no minimum) - -X/--maxins <int> + -X/--maxins The maximum fragment length for valid paired-end alignments. E.g. if `-X 100` is specified and a paired-end alignment consists of two 20-bp alignments in the proper orientation with a 60-bp gap between them, that alignment is considered @@ -945,19 +993,19 @@ --no-overlap If one mate alignment overlaps the other at all, consider that to be non-concordant. Default: mates can overlap in a concordant alignment. - + ------ **SAM options**:: - --rg-id <text> - Set the read group ID to `<text>`. This causes the SAM `@RG` header line to be - printed, with `<text>` as the value associated with the `ID:` tag. It also + --rg-id + Set the read group ID to ``. This causes the SAM `@RG` header line to be + printed, with `` as the value associated with the `ID:` tag. It also causes the `RG:Z:` extra field to be attached to each SAM output record, with - value set to `<text>`. + value set to ``. - --rg <text> - Add `<text>` (usually of the form `TAG:VAL`, e.g. `SM:Pool1`) as a field on the + --rg + Add `` (usually of the form `TAG:VAL`, e.g. `SM:Pool1`) as a field on the `@RG` header line. Note: in order for the `@RG` line to appear, `--rg-id` must also be specified. This is because the `ID` tag is required by the SAM Specification. Specify `--rg` multiple times to set multiple fields. See the @@ -967,7 +1015,7 @@ When printing secondary alignments, Bowtie 2 by default will write out the `SEQ` and `QUAL` strings. Specifying this option causes Bowtie 2 to print an asterix in those fields instead. - + ----- **Other options**:: @@ -980,8 +1028,8 @@ not specified. Has no effect if `-p` is set to 1, since output order will naturally correspond to input order in that case. - --seed <int> - Use `<int>` as the seed for pseudo-random number generator. Default: 0. + --seed + Use `` as the seed for pseudo-random number generator. Default: 0. --non-deterministic Normally, Bowtie 2 re-initializes its pseudo-random generator for each read. It @@ -996,7 +1044,7 @@ but might be more appropriate in situations where the input consists of many identical reads. - + ]]> 10.1186/gb-2009-10-3-r25 10.1038/nmeth.1923 diff -r fed480fea9f0 -r fa69d5a7b8c8 tool_dependencies.xml --- a/tool_dependencies.xml Fri Dec 18 18:50:22 2015 -0500 +++ b/tool_dependencies.xml Tue Jan 03 10:50:44 2017 -0500 @@ -4,6 +4,6 @@ - +