annotate kmersvm/nullseq.xml @ 0:66088269713e draft

Uploaded all files tracked by git
author test-svm
date Sun, 05 Aug 2012 15:32:16 -0400
parents
children 5b3d8ca0bf20
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
1 <tool id="kmersvm_nullseq" name="Generate Null Sequence">
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
2 <description>using random sampling from genomic DNA</description>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
3 <command interpreter="python">scripts/nullseq_generate.py -q
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
4 #if str($excluded) !="None":
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
5 -e $excluded
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
6 #end if
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
7 -x $fold -r $rseed -g $gc_err -t $rpt_err $input $dbkey ${indices_path.fields.path}
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
8 </command>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
9 <inputs>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
10 <param name="fold" type="integer" value="1" label="# of Fold-Increase" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
11 <param name="gc_err" type="float" value="0.02" label="Allowable GC Error" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
12 <param name="rpt_err" type="float" value="0.02" label="Allowable Repeat Error" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
13 <param name="rseed" type="integer" value="1" label="Random Number Seed" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
14 <param format="interval" name="input" type="data" label="BED File of Positive Regions"><!-- validators must be children of the param they check -->
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
15 <validator type="unspecified_build" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
16 <validator type="dataset_metadata_in_file" filename="nullseq_indices.loc" metadata_name="dbkey" metadata_column="0" message="Sequences are currently unavailable for the specified build." /></param>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
17 <param name="excluded" optional="true" format="interval" type="data" value="None" label="Excluded Regions (optional)" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
18 <param name="indices_path" type="select" label="Available Datasets">
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
19 <options from_file="nullseq_indices.loc">
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
20 <column name="dbkey" index="0"/>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
21 <column name="value" index="0"/>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
22 <column name="name" index="1"/>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
23 <column name="path" index="2"/>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
24 <!--filter type="data_meta" ref="input" key="dbkey" column="0" /-->
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
25 </options>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
26 </param>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
27 </inputs>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
28 <outputs>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
29 <data format="interval" name="nullseq_output" from_work_dir="nullseq_output.bed" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
30 </outputs>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
31 <tests>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
32 <test>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
33 <param name="input" value="nullseq_test.bed" ftype="bed" dbkey="hg19" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
34 <param name="fold" value="1" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
35 <param name="gc_err" value="0.02" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
36 <param name="rpt_err" value="0.02" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
37 <param name="rseed" value="1" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
38 <param name="indices_path" value="hg19" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
39 <output name="nullseq_output" file="nullseq_output.bed" />
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
40 </test>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
41 </tests>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
42 <help>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
43
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
44 **What it does**
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
45
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
46 Takes an input BED file and generates a set of sequences, similar to the input in length, GC content and repeat fraction, for use as negative data (null sequences) in Train SVM. Uses random sampling for efficiency.
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
47
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
48 **Parameters**
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
49
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
50 Fold-Increase: Size of desired null sequence data set expressed as multiple of the size of the input data set.
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
51
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
52 GC Error, Repeat Error: Acceptable difference between a positive sequence and its corresponding null sequence in terms of GC content, repeat content.
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
53
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
54 Random Number Seed: Seed for random number generator.
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
55
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
56 Excluded Regions: Submitted regions will be excluded from null sequence generation.
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
57
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
58 ----
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
59
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
60 **Example**
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
61
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
62 Given a BED file containing::
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
63
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
64 chr1 10212203 10212303
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
65 chr1 103584748 103584848
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
66 chr1 105299130 105299230
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
67 chr1 106367772 106367872
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
68
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
69 The tool will output a BED file matched in length, GC content and repeat content::
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
70
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
71 chr1 3089935 3090035
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
72 chr1 5031335 5031435
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
73 chr1 5103742 5103842
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
74 chr1 5650372 5650472
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
75
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
76 </help>
66088269713e Uploaded all files tracked by git
test-svm
parents:
diff changeset
77 </tool>