changeset 0:13a9ae9ef940 draft

planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 38545eb765e0df7fcc6b8130e8e5f87cf4481122
author abims-sbr
date Thu, 13 Apr 2017 05:45:50 -0400
parents
children 2bd29709310f
files CHANGELOG.md filter_assembly.xml macros.xml test-data/test_01_input_Trinity_filter_oase.zip test-data/test_01_input_Velvet_filter_oase.zip test-data/test_01_output_(trinity)filter_oase.zip test-data/test_01_output_(velvet)filter_oase.zip test-data/test_06.out test-data/test_06bis.out
diffstat 9 files changed, 244 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/CHANGELOG.md	Thu Apr 13 05:45:50 2017 -0400
@@ -0,0 +1,7 @@
+Changelog
+
+Version 1.0 - 13/04/2017
+
+  - Add functional test with planemo
+  - Planemo test with conda dependencies for cap3, fastaformatter and python 
+  - Scripts renamed + symlinks to the directory 'scripts'
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/filter_assembly.xml	Thu Apr 13 05:45:50 2017 -0400
@@ -0,0 +1,168 @@
+<?xml version="1.0"?>
+
+<tool name="Filter assemblies" id="filter_assemblies" version="1.0">	
+
+	<description>
+		Filter the outputs of Velvet or Trinity assemblies
+	</description>
+
+	<macros>
+		<import>macros.xml</import>
+	</macros>
+	<!-- Runtime dependencies: Python via the python_required macro, fastx_toolkit pinned to 0.0.14. NOTE(review): cap3 carries no version attribute; consider pinning it. -->
+	<requirements>
+		<expand macro="python_required" />
+		<requirement type="package" version="0.0.14">fastx_toolkit</requirement>
+		<requirement type="package">cap3</requirement>
+	</requirements>
+	<!-- Symlinks the helper scripts into the current directory, then runs S01_script_to_choose.py with stdout captured in the summary output; every path is single-quoted so spaces or shell metacharacters cannot split an argument. -->
+	<command>
+	<![CDATA[
+		ln -s '$__tool_directory__/scripts/S02a_remove_redondancy_from_velvet_oases.py' .
+		&&
+		ln -s '$__tool_directory__/scripts/S02b_format_fasta_name_trinity.py' .
+		&&
+		ln -s '$__tool_directory__/scripts/S03_choose_one_variants_per_locus_trinity.py' .
+		&&
+		ln -s '$__tool_directory__/scripts/S04_find_orf.py' .
+		&&
+		ln -s '$__tool_directory__/scripts/S05_filter.py' .
+		&&
+		python '$__tool_directory__/scripts/S01_script_to_choose.py'
+
+		#if $input.input_type_choice == "velvet"
+			velvet '${input.zip_velvet}'
+		#else
+			trinity '${input.zip_trinity}'
+		#end if
+		$length_seq_max $percent_identity $overlap_length
+		> '${output}'
+	]]>
+	</command>
+	<!-- Assembly archive selector (Velvet Oases or Trinity) followed by the three integers handed positionally to the script: sequence length, CAP3 percent identity, CAP3 overlap length. -->
+	<inputs>
+		<conditional name="input">
+			<param name="input_type_choice" type="select" label="What is the type of your inputs? ">
+				<option value="velvet">Velvet Oases</option>
+				<option value="trinity">Trinity</option>
+			</param>
+			<when value="velvet">
+				<param name="zip_velvet" type="data" format="no_unzip.zip,zip" label="Choose your ZIP file" help="A zip file containing all your files" />
+			</when>
+			<when value="trinity">
+				<param name="zip_trinity" type="data" format="no_unzip.zip,zip" label="Choose your ZIP file" help="A zip file containing all your files" />
+			</when>
+		</conditional>
+		<param name="percent_identity" type="integer" value="100" label="Overlap percent identity cutoff" help="Cap3 parameter -p  N  specify overlap percent identity cutoff N &gt; 65 " />
+		<param name="overlap_length" type="integer" value="60" label="Overlap length cutoff" help="Cap3 parameter -o  N  specify overlap length cutoff &gt; 15 " />
+		<param name="length_seq_max" type="integer" value="100" label="Minimum sequence length" help="Keep sequences which length is higher than the minimum sequence length  " />
+	</inputs>
+	<!-- output_zip is picked up from sequences_filtered.zip in the working directory; output receives the stdout redirected by the command. -->
+	<outputs>
+		<data format="no_unzip.zip" name="output_zip" label="Filter_oase_zip" from_work_dir="sequences_filtered.zip" />
+		<data format="txt" name="output" label="Filter_Assemblies_Summary"/>
+	</outputs>
+	<!-- One functional test per assembler; each compares the text summary with a stored CAP3 log. Conditional members are addressed with the qualified input|name form throughout. -->
+	<tests>
+		<test>
+			<param name="input|input_type_choice" value="trinity" />
+			<param name="input|zip_trinity" ftype="zip" value="test_01_input_Trinity_filter_oase.zip" />
+			<param name="percent_identity" value="100" />
+			<param name="overlap_length" value="60" />
+			<param name="length_seq_max" value="100" />
+			<output name="output" value="test_06.out" />
+		</test>
+		<test>
+			<param name="input|input_type_choice" value="velvet" />
+			<param name="input|zip_velvet" ftype="zip" value="test_01_input_Velvet_filter_oase.zip" />
+			<param name="percent_identity" value="100" />
+			<param name="overlap_length" value="60" />
+			<param name="length_seq_max" value="100" />
+			<output name="output" value="test_06bis.out" />
+		</test>
+
+	</tests>
+
+	<help>
+
+.. class:: infomark
+
+**Authors**  Eric Fontanillas created the scripts of this pipeline.
+
+.. class:: infomark
+
+**Galaxy integration** Julie Baffard and ABIMS TEAM
+
+ | Contact support.abims@sb-roscoff.fr for any questions or concerns about the Galaxy implementation of this tool.
+
+---------------------------------------------------
+
+===========
+Filter Oase
+===========
+
+-----------
+Description
+-----------
+
+
+This script reformats Velvet Oases or Trinity assemblies for the AdaptSearch galaxy suite and selects only one variant per gene according to its length and quality check.
+
+
+
+.. class:: infomark
+
+
+**Important part of this tool (the inputs format)**
+
+--------
+
+
+
+============
+Input format
+============
+
+
+---------------------------------
+For Velvet Oases assemblies input
+---------------------------------
+
+Because of putative changes in the sequence names of the assemblies associated with the upgrade of the Velvet/Oases software, the script will only work if:
+
+(1)sequences are in the sequential format:
+	| e.g.
+	| &gt;seqname
+	| AAAGAGAGAVCACATGTCAGTAGC
+	| &gt;seqname
+	| AAAGAGAGAVCACATGTCAGTAGC
+		
+(2)The name of each transcript must start with a species abbreviation of two letters, unique for each assembly. The file name of the assembly file must also begin with these same two letters.
+
+(3)The syntax of the sequence name must be constructed as: &gt;fh1_2/3_4_5 where fh are the two chosen letters, 1 is the number of the locus, 2/3 is the transcript variant among all versions of the transcript, 4 is the confidence value and 5 is the length of the transcript. In this case, the file name should thus begin with fh.
+
+-----------------------------
+For Trinity assemblies inputs
+-----------------------------
+
+Because of putative changes in the sequence names of the assemblies associated with the upgrade of the Trinity software, the script will only work if:
+
+(1)Sequences are in the sequential format:
+	| e.g.
+	| &gt;seqname
+	| AAAGAGAGAVCACATGTCAGTAGC
+	| &gt;seqname
+	| AAAGAGAGAVCACATGTCAGTAGC
+		
+(2)The name of each transcript must start with &gt;comp, e.g. &gt;comp10020 instead of &gt;c10020 or &gt;transcript, etc...
+
+(3)The syntax of the sequence name should avoid spaces and must contain _len:, e.g. &gt;comp1_g1_it1_len:1000_path=[.....]
+
+(4)A prefix of two letters abbreviating the species name must be chosen, e.g. Homo sapiens -&gt; Hs. The file name of the assembly file must begin with this prefix. Each prefix should be unique among the n analyzed transcriptomes.
+e.g. if the file name is Hs_trinity_22000_transcripts.fasta, the prefix abbreviation must be Hs and all sequence names must begin with &gt;Hs.
+Alternatively, if the file name is Homosapiens_trinity_22000_transcripts.fasta, the prefix must thus be Ho.
+	</help>		
+
+    <expand macro="citations" />
+
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml	Thu Apr 13 05:45:50 2017 -0400
@@ -0,0 +1,16 @@
+<macros>
+	<!-- Shared macros: the Python 2.7 requirement and the credits block. NOTE(review): the citations are typed "bibtex" but hold free text, not BibTeX records; confirm Galaxy renders them as intended. -->
+	<xml name="python_required">
+			<requirement type="package" version="2.7">python</requirement>
+	</xml>
+
+	<xml name="citations">
+		<citations>
+			<citation type="bibtex">Credits : ABIMS team, Roscoff Marine Station</citation>
+			<citation type="bibtex">Contact support.abims@sb-roscoff.fr for any questions or concerns about the Galaxy implementation of this tool.</citation>
+			<citation type="bibtex">Version 1 : Scripts by Eric Fontanillas -- Galaxy integration by Julie Baffard</citation>
+			<citation type="bibtex">Version 2 : improvements by Victor Mataigne, Gildas le Corguillé, Misharl Monsoor</citation>
+		</citations>
+	</xml>
+
+</macros>
Binary file test-data/test_01_input_Trinity_filter_oase.zip has changed
Binary file test-data/test_01_input_Velvet_filter_oase.zip has changed
Binary file test-data/test_01_output_(trinity)filter_oase.zip has changed
Binary file test-data/test_01_output_(velvet)filter_oase.zip has changed
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_06.out	Thu Apr 13 05:45:50 2017 -0400
@@ -0,0 +1,32 @@
+20
+Number of segment pairs = 380; number of pairwise comparisons = 3
+'+' means given segment; '-' means reverse complement
+
+Overlaps            Containments  No. of Constraints Supporting Overlap
+
+
+DETAILED DISPLAY OF CONTIGS
+21
+Number of segment pairs = 380; number of pairwise comparisons = 3
+'+' means given segment; '-' means reverse complement
+
+Overlaps            Containments  No. of Constraints Supporting Overlap
+
+
+DETAILED DISPLAY OF CONTIGS
+20
+Number of segment pairs = 380; number of pairwise comparisons = 3
+'+' means given segment; '-' means reverse complement
+
+Overlaps            Containments  No. of Constraints Supporting Overlap
+
+
+DETAILED DISPLAY OF CONTIGS
+22
+Number of segment pairs = 342; number of pairwise comparisons = 2
+'+' means given segment; '-' means reverse complement
+
+Overlaps            Containments  No. of Constraints Supporting Overlap
+
+
+DETAILED DISPLAY OF CONTIGS
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_06bis.out	Thu Apr 13 05:45:50 2017 -0400
@@ -0,0 +1,21 @@
+Number of segment pairs = 4032; number of pairwise comparisons = 0
+'+' means given segment; '-' means reverse complement
+
+Overlaps            Containments  No. of Constraints Supporting Overlap
+
+
+DETAILED DISPLAY OF CONTIGS
+Number of segment pairs = 4160; number of pairwise comparisons = 0
+'+' means given segment; '-' means reverse complement
+
+Overlaps            Containments  No. of Constraints Supporting Overlap
+
+
+DETAILED DISPLAY OF CONTIGS
+Number of segment pairs = 4422; number of pairwise comparisons = 1
+'+' means given segment; '-' means reverse complement
+
+Overlaps            Containments  No. of Constraints Supporting Overlap
+
+
+DETAILED DISPLAY OF CONTIGS