diff gff3_extract_sequence.xml @ 0:f678e282b320 draft default tip

"planemo upload"
author cpt_testbed
date Fri, 06 May 2022 07:07:23 +0000
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/gff3_extract_sequence.xml	Fri May 06 07:07:23 2022 +0000
@@ -0,0 +1,71 @@
+<?xml version="1.0"?>
+<tool id="edu.tamu.cpt.gff3.export_seq" name="GFF3 Feature Sequence Export" version="19.1.0.0">
+  <description>Export corresponding sequence in genome from GFF3</description>
+  <macros>
+    <import>macros.xml</import>
+		<import>cpt-macros.xml</import>
+  </macros>
+  <expand macro="requirements"/>
+  <command detect_errors="aggressive"><![CDATA[
+@GENOME_SELECTOR_PRE@
+
+$__tool_directory__/gff3_extract_sequence.py
+@GENOME_SELECTOR@
+
+@INPUT_GFF@
+
+#if $feature_filter and $feature_filter is not None:
+--feature_filter $feature_filter
+#end if
+$nodesc
+> $default]]></command>
+  <inputs>
+    <expand macro="genome_selector" />
+    <expand macro="gff3_input" />
+	<param label="Filter for specific feature types" name="feature_filter" type="text"
+		help="Use 'nice_cds' if your features are coming from Apollo, however this will fail on non-Apollo data"/>
+    <param label="Remove description (use if blasting)" name="nodesc" type="boolean" truevalue="--nodesc" falsevalue=""/>
+  </inputs>
+  <outputs>
+    <data format="fasta" hidden="false" name="default"/>
+  </outputs>
+  <tests>
+		<test>
+			<param name="reference_genome_source" value="history" />
+			<param name="genome_fasta" value="T7_ExtSeqIn.fasta" />
+			<param name="gff3_data" value="T7_ExtSeqIn.gff3" />
+			<param name="nodesc" value="" />
+			<param name="feature_filter" value="CDS" />
+			<output name="output" file="T7_ExtSeqOut.fasta" />
+		</test>
+                <test>
+			<param name="reference_genome_source" value="history" />
+			<param name="genome_fasta" value="Miro_ExtSeqIn.fa" />
+			<param name="gff3_data" value="Miro_ExtSeqIn.gff3" />
+			<param name="nodesc" value="" />
+			<param name="feature_filter" value="CDS" />
+			<output name="output" file="Miro_ExtSeqOut1.fa" />
+		</test>
+		<test>
+			<param name="reference_genome_source" value="history" />
+			<param name="genome_fasta" value="Miro_ExtSeqIn.fa" />
+			<param name="gff3_data" value="Miro_ExtSeqIn.gff3" />
+			<param name="feature_filter" value="CDS" />
+			<param name="nodesc" value="--nodesc" />
+			<output name="output" file="Miro_ExtSeqOut2.fa" />
+		</test>
+  </tests>
+  <help><![CDATA[
+**What it does**
+
+From the FASTA sequence for a genome, extracts the *nucleotide* sequences for 
+all CDSs in an input GFF3 and outputs them as a multi-FASTA formatted file.
+
+The filter for specific feature types was designed for data retrieved from Apollo. 
+Using ‘unique_cds’ extracts the sequence for all CDS. Using ‘nice_cds’ will extract 
+the sequence only for CDS features with a start codon (recommended). If a gene from
+Apollo has multiple CDSs, the tool will append a "_##" to the end of subsequent genes.
+
+      ]]></help>
+		<expand macro="citations" />
+</tool>