comparison summarize_poliovirus_alignment.xml @ 3:09b98e40ab59 draft

planemo upload for repository https://github.com/pvanheus/polio_report commit a99e10fec2fac5aae70974c977eb3b362a1a8429-dirty
author sanbi-uwc
date Fri, 22 Jul 2022 09:56:33 +0000
parents 5c8dfc4d9d68
children eae57366bc55
comparison
equal deleted inserted replaced
2:5c8dfc4d9d68 3:09b98e40ab59
18 <inputs> 18 <inputs>
19 <!-- input is list of reports for poliovirus sabin 1, 2 and 3 --> 19 <!-- input is list of reports for poliovirus sabin 1, 2 and 3 -->
20 <param name="alignment_assessments" format="json" type="data_collection" collection_type="list" label="Poliovius alignment assessments" help="Input is a list of JSON reports from the assess_poliovirus_alignment tool" /> 20 <param name="alignment_assessments" format="json" type="data_collection" collection_type="list" label="Poliovius alignment assessments" help="Input is a list of JSON reports from the assess_poliovirus_alignment tool" />
21 </inputs> 21 </inputs>
22 <outputs> 22 <outputs>
23 <data name="output1" format="tabular" label="Poliovirus variant summary on ${on_string}" /> 23 <data name="output1" format="tabular" label="Poliovirus variant summary on ${on_string}">
24 <actions>
25 <action name="column_names" type="metadata" default="sample name,best matching reference,num variants,perc variants,quality,variant list" />
26 </actions>
27 </data>
24 <collection name="variant_list" type="list" label="Poliovirus variant lists on ${on_string}" structured_like="alignment_assessments" format="tabular"> 28 <collection name="variant_list" type="list" label="Poliovirus variant lists on ${on_string}" structured_like="alignment_assessments" format="tabular">
25 <!-- todo - find a way to set the metadata columns for the tabular datasets --> 29 <!-- todo - find a way to set the metadata columns for the tabular datasets -->
26 </collection> 30 </collection>
27 </outputs> 31 </outputs>
28 <tests> 32 <tests>
41 <element name="sample1" file="sample1_variants.tabular" ftype="tabular" /> 45 <element name="sample1" file="sample1_variants.tabular" ftype="tabular" />
42 </output_collection> 46 </output_collection>
43 </test> 47 </test>
44 </tests> 48 </tests>
45 <help><![CDATA[ 49 <help><![CDATA[
46 Given a list of outputs of the assess_poliovirus_alignment tool, make a final summary. 50 Given a list of outputs of the assess_poliovirus_alignment tool, make a summary and per sample variant list.
51
52 In the summary file the columns are:
53
54 1. sample name
55
56 2. best matching reference: the workflow compares sequences against Sabin 1, 2 and 3 poliovirus reference sequences and select the one that is the closest matching
57
58 3. number of variants relative to the best matching reference
59
60 4. percentage of variation: variants are only counted in the VP1 gene and this percentage is calculated by comparing the number of variants to the length of the VP1 gene in the best matching reference.
61
62 5. quality: this is an attempt at a quality score for the sequences
63
64 6. variant list: a semi-colon separated list of variants. variant positions are in 1-based coordinates counting from the first base of the VP1 gene. A variant list is produced for each sample, these might be more readable.
65
66 In the per-sample variant lists the columns are as follows:
67
68 1. variant position in the genome
69
70 2. variant position in VP1 (in 1-based coordinates)
71
72 3. base in reference
73
74 4. base in sequenced sample
75
47 ]]></help> 76 ]]></help>
48 <citations> 77 <citations>
49 <citation type="bibtex"><![CDATA[ 78 <citation type="bibtex"><![CDATA[
50 @software{van_Heusden_Poliovirus_variation_reporting_2022, 79 @software{van_Heusden_Poliovirus_variation_reporting_2022,
51 author = {van Heusden, Peter}, 80 author = {van Heusden, Peter},