Mercurial > repos > bgruening > text_processing
comparison unsorted_uniq.xml @ 0:ec66f9d90ef0 draft
initial uploaded
| author | bgruening |
|---|---|
| date | Thu, 05 Sep 2013 04:58:21 -0400 |
| parents | |
| children | a4ad586d1403 |
comparison
equal
deleted
inserted
replaced
| -1:000000000000 | 0:ec66f9d90ef0 |
|---|---|
| 1 <tool id="unixtools_sorted_uniq" name="Unique" version="0.3"> | |
| 2 <description>occurrences of each record</description> | |
| 3 <requirements> | |
| 4 <requirement type="package" version="8.21">gnu_coreutils</requirement> | |
| 5 </requirements> | |
| 6 <command interpreter='python'> | |
| 7 unique_lines.py | |
| 8 $ignore_case | |
| 9 $is_numeric | |
| 10 #if $adv_opts.adv_opts_selector=="advanced": | |
| 11 $adv_opts.column_start | |
| 12 $adv_opts.column_end | |
| 13 #end if | |
| 14 $outfile | |
| 15 $infile | |
| 16 </command> | |
| 17 <inputs> | |
| 18 <param name="infile" type="data" format="tabular,text" label="from query" /> | |
| 19 <param name="ignore_case" type="boolean" label="ignore differences in case when comparing (-f)" truevalue="-f" falsevalue="false" checked="false" help="ignore differences in case when comparing"/> | |
| 20 <param name="is_numeric" type="boolean" label="column only contains numeric values (-n)" truevalue="-n" falsevalue="false" checked="false" help="did the calumn have numeric values"/> | |
| 21 <conditional name="adv_opts"> | |
| 22 <param name="adv_opts_selector" type="select" label="Advanced Options"> | |
| 23 <option value="basic" selected="True">Hide Advanced Options</option> | |
| 24 <option value="advanced">Show Advanced Options</option> | |
| 25 </param> | |
| 26 <when value="basic" /> | |
| 27 <when value="advanced"> | |
| 28 <param name="column_start" label="Column start" type="data_column" data_ref="infile" help="Unique on specific column range"/> | |
| 29 <param name="column_end" label="Column end" type="data_column" data_ref="infile" help="Unique on specific column range"/> | |
| 30 </when> | |
| 31 </conditional> | |
| 32 </inputs> | |
| 33 <outputs> | |
| 34 <data format="infile" name="outfile" metadata_source="infile"/> | |
| 35 </outputs> | |
| 36 <tests> | |
| 37 <test> | |
| 38 </test> | |
| 39 </tests> | |
| 40 <help> | |
| 41 | |
| 42 .. class:: infomark | |
| 43 | |
| 44 **Syntax** | |
| 45 | |
| 46 This tool returns all unique lines using the 'sort -u' command. It can be used with unsorted files. | |
| 47 If you need additional options, like grouping or counting your unique results, please use the 'Unique lines from sorted file' tool. | |
| 48 | |
| 49 ----- | |
| 50 | |
| 51 .. class:: infomark | |
| 52 | |
| 53 The input file needs to be tab separated. Please convert your file if necessary. | |
| 54 | |
| 55 ----- | |
| 56 | |
| 57 **Example** | |
| 58 | |
| 59 - Input file:: | |
| 60 | |
| 61 chr1 10 100 gene1 | |
| 62 chr1 105 200 gene2 | |
| 63 chr1 10 100 gene1 | |
| 64 chr2 10 100 gene4 | |
| 65 chr2 1000 1900 gene5 | |
| 66 chr3 15 1656 gene6 | |
| 67 chr2 10 100 gene4 | |
| 68 | |
| 69 - Unique lines will result in:: | |
| 70 | |
| 71 chr1 10 100 gene1 | |
| 72 chr1 105 200 gene2 | |
| 73 chr2 10 100 gene4 | |
| 74 chr2 1000 1900 gene5 | |
| 75 chr3 15 1656 gene6 | |
| 76 | |
| 77 | |
| 78 </help> | |
| 79 </tool> |
