Mercurial > repos > bgruening > text_processing
diff sorted_uniq.xml @ 0:ec66f9d90ef0 draft
initial uploaded
author | bgruening |
---|---|
date | Thu, 05 Sep 2013 04:58:21 -0400 |
parents | |
children | a4ad586d1403 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/sorted_uniq.xml Thu Sep 05 04:58:21 2013 -0400
@@ -0,0 +1,67 @@
+<tool id="unixtools_uniq_tool" name="Unique lines">
+    <!--
+        Galaxy wrapper around GNU coreutils "uniq". uniq compares only
+        neighbouring lines, so the input dataset has to be sorted first.
+    -->
+    <description>from sorted file</description>
+    <requirements>
+        <requirement type="package" version="8.21">gnu_coreutils</requirement>
+    </requirements>
+    <!--
+        Every boolean parameter expands to its flag or to an empty string.
+        Dataset paths are single-quoted so the shell cannot word-split them,
+        and CDATA keeps the output redirection free of entity escaping.
+    -->
+    <command><![CDATA[
+        uniq
+            -f $skipfields
+            $count
+            $repeated
+            $ignorecase
+            $uniqueonly
+            '$input'
+
+        ## feature is not yet released, it will be in the next 8.22 version
+        ##--group=$group
+            > '$output'
+    ]]></command>
+
+    <inputs>
+        <param format="txt" name="input" type="data" label="File to scan for unique values" help="Make sure you have sorted this file" />
+
+        <!-- NOTE(review): with both "repeated" and "unique only" enabled uniq prints nothing; confirm whether the form should warn about it. -->
+        <param name="count" type="boolean" label="count [-c]" help="Prefix lines by the number of occurrences" truevalue="-c" falsevalue="" />
+        <param name="repeated" type="boolean" label="repeated [-d]" help="Only print duplicate lines" truevalue="-d" falsevalue="" />
+        <param name="ignorecase" type="boolean" label="ignore case [-i]" help="Ignore differences in case when comparing" truevalue="-i" falsevalue="" />
+        <param name="uniqueonly" type="boolean" label="unique only [-u]" help="Only print unique lines" truevalue="-u" falsevalue="" />
+        <!-- min="0" rejects negative counts in the form; uniq would refuse them at run time. -->
+        <param name="skipfields" type="integer" label="skip fields [-f]" help="Avoid comparing the first N fields. (use zero to start from the first field)" size="2" value="0" min="0" />
+
+        <!-- Disabled: the grouping option is not available in coreutils 8.21, the version this tool requires. -->
+        <!--
+        <param name="group" type="select" label="Output all lines, and delimit each unique group.">
+            <option value="separate">Separate unique groups with a single delimiter</option>
+            <option value="prepend">Output a delimiter before each group of unique items</option>
+            <option value="append">Output a delimiter after each group of unique items.</option>
+            <option value="both">Output a delimiter around each group of unique items.</option>
+        </param>
+        -->
+    </inputs>
+
+    <outputs>
+        <!-- The output takes its datatype and metadata from the input dataset. -->
+        <data format_source="input" name="output" metadata_source="input"/>
+    </outputs>
+    <help>
+This tool takes a sorted file and looks for lines that are unique.
+
+.. class:: warningmark
+
+Please make sure your file is sorted, or else this tool will give you an erroneous output.
+
+.. class:: infomark
+
+You can sort your file using either the "Sort" tool in "Filter and Sort", or the "Sort" tool in "Unix Tools".
+
+    </help>
+</tool>