changeset 0:5a57280b9125 draft

Imported from capsule None
author sblanck
date Thu, 10 Nov 2016 07:34:57 -0500
parents
children f8a2f1fec8ef
files AffyQCnormalization.xml Analyse.xml GEOQuery.xml ImportDataFromMatrix.xml MetaMA.xml MetaRNAseq.xml repository_dependencies.xml
diffstat 7 files changed, 384 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/AffyQCnormalization.xml	Thu Nov 10 07:34:57 2016 -0500
@@ -0,0 +1,61 @@
+<tool id="QCnormalization" name="QCnormalization" version="0.1.0">
+	<description>Quality control and normalization of affymetrix expression data</description>
+	<requirements>
+	  <container type="docker">sblanck/smat</container>
+	</requirements>
+	<command>
+		<![CDATA[
+		/galaxy-tools/stderr_wrapper.py Rscript 
+		/galaxy-tools/transcriptomics/AffyQCnormalization/AffyQCnormalization.R
+		   	#for $input in $inputs
+                "${input}"
+			    "${input.name}"
+     		#end for
+			"${normalization}"
+			$result_export_eset
+       		$result_html
+			$result_html.files_path
+		/galaxy-tools/transcriptomics/AffyQCnormalization/AffyQCnormalization_tpl.html
+		]]>
+		</command>
+	
+		<inputs>
+	
+		<param name="inputs" type="data" format="cel" multiple="true" label=".CEL files" help=".CEL files to be used"/>
+
+		<param name="normalization" type="select" label="Preprocessing/normalization">
+		
+    		<option value="rma">rma (backgroung correction + quantile normalization + log2)</option>
+            <option value="quantile">quantile normalization + log2</option>
+            <option value="background">background correction + log2</option>
+            <option value="log2">log2 only</option>
+           
+		
+		</param>
+		
+	</inputs>
+	<outputs>
+		<data format="rdata" name="result_export_eset" label="export normalized expressionSet"/>		
+		<data format="html" name="result_html" label="QC result"/>
+	</outputs>
+
+	<help>
+<![CDATA[
+		**What it does** 
+		    	
+The QCnormalization tool offers to ensure the quality of the data and to normalize them. Several normalization methods are available :
+
+* rma normalization 
+* quantile normalization + log2
+* background correction + log2
+* log2 only
+
+**Results**
+
+- Several quality figures : microarray images, boxplots and MA plots
+- Rdata object containing the normalized data for further analysis
+  		
+]]>
+</help>
+
+</tool>
\ No newline at end of file
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/Analyse.xml	Thu Nov 10 07:34:57 2016 -0500
@@ -0,0 +1,92 @@
+<tool id="LimmaAnalyse" name="Limma analysis" version="0.3.0">
+	<description>Perform gene expression analysis thanks to limma</description>
+	<requirements>
+	  	<container type="docker">sblanck/smagexp</container>
+	</requirements>
+	<command>
+		<![CDATA[ 
+		/galaxy-tools/stderr_wrapper.py Rscript
+		/galaxy-tools/transcriptomics/Analyse/Analyse.R
+		   	"${rdataset}"
+			"${conditions}"
+		 	"${selectCondition1}"
+			"${condition1}"
+		    "${selectCondition2}"
+			"${condition2}"
+			"${nbresult}"
+       		$result_export_eset
+       		$result_html 
+			$result_html.files_path
+			$result_tabular
+		/galaxy-tools/transcriptomics/Analyse/Analyse_tpl.html
+		]]>
+	</command>
+	
+	<inputs>
+		<param name="rdataset" type="data" format="rdata" label="RData" help="RData to be used"/>
+		<param name="conditions" type="data" format="cond" label="Conditions" help="conditions associated with the rData file"/>
+		<param name="selectCondition1" type="select" label="condition 1">
+			<options from_dataset="conditions">
+    		<column name="name" index="1"/>
+    		<column name="value" index="1"/>
+    		<filter type="unique_value" column="1"/>
+		</options>
+		</param>
+		<param name="condition1" type="select" display="checkboxes" label="Condition 1" multiple="true">
+			<options from_dataset="conditions">
+    		<column name="name" index="2"/>
+    		<column name="value" index="0"/>
+			<filter  type="param_value" ref="selectCondition1" column="1"/>
+		</options>
+		</param>	
+		<param name="selectCondition2" type="select" label="condition 2">
+			<options from_dataset="conditions">
+    		<column name="name" index="1"/>
+    		<column name="value" index="1"/>
+			<filter type="unique_value" column="1"/>    		
+		</options>
+		</param>	
+		<param name="condition2" type="select" display="checkboxes" label="Condition 2" multiple="true">
+			<options from_dataset="conditions">
+    		<column name="name" index="2"/>
+    		<column name="value" index="0"/>
+			<filter  type="param_value" ref="selectCondition2" column="1"/>
+		</options>
+		</param>	
+		<param name="nbresult" type="integer" value="1000" min="1" label="number of top genes" help="Number of genes to be displayed in result datatable"/>
+	</inputs>
+	<outputs>
+		<data format="html" name="result_html" label="Results of analysis of ${rdataset.name}"/>
+		<data format="rdata" name="result_export_eset" label="Export of expression set of ${rdataset.name}"/>
+		<data format="tabular" name="result_tabular" label="Text Results of analysis of ${rdataset.name}"/>
+		
+	</outputs>
+	<help>
+<![CDATA[ 
+**What it does**
+		
+The Limma analysis tool performs single analysis either of data previously retrieved from GEO database or normalized affymetrix .CEL files data. 
+Given a .cond file, it runs a standard limma differential expression analysis. 
+
+**Example** of .cond file      	
+
+The .cond file should look like this 
+::
+
+ Sample ID 	Condition			Description
+ GSM80460	series of 16 tumors	GSM80460 OSCE-2T SERIES OF 16 TUMORS
+ GSM80461	series of 16 tumors	GSM80461 OSCE-4T Series of 16 Tumors
+ GSM80462	series of 16 tumors	GSM80462 OSCE-6T Series of 16 Tumors
+ GSM80476	series of 4 normals	GSM80476 OSCE-2N Series of 4 Normals
+ GSM80477	series of 4 normals	GSM80477 OSCE-9N Series of 4 Normals
+	
+		
+**Results**
+		
+- Boxplots, p-value histograms and a volcano plot 
+- Table summarizing the differentially expressed genes and their annotations. This table is sortable and requestable.
+- Rdata object to perform further meta-analysis. 
+]]>
+	</help>
+
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/GEOQuery.xml	Thu Nov 10 07:34:57 2016 -0500
@@ -0,0 +1,65 @@
+<tool id="GEOQuery" name="GEOQuery">
+	<description>GEOQuery wrapper</description>
+	<requirements>
+	  	<container type="docker">sblanck/smagexp</container>
+	</requirements>
+	<command>
+		<![CDATA[ 
+			/galaxy-tools/stderr_wrapper.py Rscript 
+			/galaxy-tools/transcriptomics/GEOquery/GEOQuery.R 
+			$GEOQueryID 
+			$GEOQueryData 
+			$GEOQueryRData 
+			$conditions
+			$transformation
+		]]>
+	</command>
+
+	<inputs>
+		<param name="GEOQueryID" type="text" size="12" optional="false" label="GEOQuery ID" help="">
+			<validator type="empty_field"/>
+		</param>
+	<param name="transformation" type="select" label="log2 transformation">
+			<option value="auto">auto</option>
+            <option value="yes">yes</option>
+            <option value="no">no</option>
+        </param>
+	</inputs>
+
+		<outputs>
+		<data format="tabular" name="GEOQueryData" label="GEOQuery Data of ${GEOQueryID}"/>
+		<data format="cond" name="conditions" label="conditions of ${GEOQueryID}"/>
+        <data format="rdata" name="GEOQueryRData" label="GEOQuery RData of ${GEOQueryID}"/>		
+	</outputs>
+	<help>
+<![CDATA[ 
+**What it does**     	
+
+This tool fetches microarray data directly from GEO database, based on the GEOQuery R package. Given a GSE accession ID, it returns an Rdata object containing the data and a text file (.cond file) summarizing the conditions of the experiment. 
+The .cond file is a text file containing one line per sample in the experiment. Each line is made of 3 columns:
+
+	- Sample ID 
+	- Condition of the biological sample
+	- Description of the biological sample
+
+**Example** of .cond file      	
+::
+
+ Sample ID 	Condition			Description
+ GSM80460	series of 16 tumors	GSM80460 OSCE-2T SERIES OF 16 TUMORS
+ GSM80461	series of 16 tumors	GSM80461 OSCE-4T Series of 16 Tumors
+ GSM80462	series of 16 tumors	GSM80462 OSCE-6T Series of 16 Tumors
+ GSM80476	series of 4 normals	GSM80476 OSCE-2N Series of 4 Normals
+ GSM80477	series of 4 normals	GSM80477 OSCE-9N Series of 4 Normals
+    
+**Results**
+	
+- Rdata object containing data for further analysis
+- Condition (.cond) file summarizing conditions of the experiment
+- Tabular (.txt) file containing expression data for each sample
+]]> 		
+
+	</help>
+
+
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/ImportDataFromMatrix.xml	Thu Nov 10 07:34:57 2016 -0500
@@ -0,0 +1,78 @@
+<tool id="importMatrixData" name="Import custom data">
+	<description>Quality control and normalization of a custom matrix expression data</description>
+	<requirements>
+	  	<container type="docker">sblanck/smagexp</container>
+	</requirements>
+	<command>
+		<![CDATA[ 
+		/galaxy-tools/stderr_wrapper.py Rscript 
+		/galaxy-tools/transcriptomics/ImportDataFromMatrix/ImportDataFromMatrix.R
+		    $input
+			$normalization
+			$conditions
+			$annotations
+			$result_export_eset
+       		$result_html
+			$result_html.files_path
+		/galaxy-tools/transcriptomics/ImportDataFromMatrix/ImportDataFromMatrix_tpl.html
+		]]>		
+		</command>
+		
+	
+	<inputs>
+		<param name="input" type="data" format="tabular" label="Input data" help="Input data"/>
+		<param name="normalization" type="select" label="Preprocessing/normalization">
+    		<option value="quantile">quantile normalization + log2</option>
+            <option value="log2">log2 only</option>
+            <option value="none">none</option>
+		</param>
+		<param name="conditions" type="data" format="cond" label="Conditions" help="conditions associated with the input file"/>
+		<param name="annotations" type="text" label="Annotation GPL code" help="GPL code for annotations"/>		
+	</inputs>
+
+	<outputs>
+		<data format="rdata" name="result_export_eset" label="export normalized expressionSet"/>		
+		<data format="html" name="result_html" label="QC result"/>
+	</outputs>
+
+	<help>
+<![CDATA[ 
+**What it does**
+		     	
+This tool imports data stored in a tabular text file. 
+Column titles (chip IDs) must match the IDs of the .cond file.
+GPL annotation code is also required to fetch annotations from GEO.
+
+**Exemple**
+
+Header of input tabular text file
+::
+
+""	"GSM80460"	"GSM80461"	"GSM80462"	"GSM80463"	"GSM80464"
+"1007_s_at"	-0.0513991525066443	0.306845500314283	0.0854246562526777	-0.142417044615852	0.0854246562526777
+"1053_at"	-0.187707155126729	-0.488026018218199	-0.282789700980404	0.160920188181103	0.989865622866287
+"117_at"	0.814755482809874	-2.15842936260448	-0.125006361067033	-0.256700472111743	0.0114956388378294
+"121_at"	-0.0558912008920451	-0.0649174766813385	0.49467161164755	-0.0892673380970874	0.113700499164728
+"1294_at"	0.961993677420255	-0.0320936297098533	-0.169744675832317	-0.0969617298870879	-0.181149439104566
+"1316_at"	0.0454429707611671	0.43616183931445	-0.766111939825723	-0.182786075741673	0.599317793698226
+"1405_i_at"	2.23450132056221	0.369606070031838	-1.06190243892591	-0.190997225060914	0.595503660502742
+
+
+The .cond file should look like this 
+::
+
+ Sample ID 	Condition			Description
+ GSM80460	series of 16 tumors	GSM80460 OSCE-2T SERIES OF 16 TUMORS
+ GSM80461	series of 16 tumors	GSM80461 OSCE-4T Series of 16 Tumors
+ GSM80462	series of 16 tumors	GSM80462 OSCE-6T Series of 16 Tumors
+ GSM80476	series of 4 normals	GSM80476 OSCE-2N Series of 4 Normals
+ GSM80477	series of 4 normals	GSM80477 OSCE-9N Series of 4 Normals
+
+				
+**Results**
+	- Bboxplots and MA plots 
+	- Rdata object containing the data for further analysis.
+]]>
+	</help>
+
+</tool>
\ No newline at end of file
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/MetaMA.xml	Thu Nov 10 07:34:57 2016 -0500
@@ -0,0 +1,50 @@
+<tool id="metaMA" name="Microarray data meta-analysis" version="0.1.0">
+	<description>Perform meta-analysis thanks to metaMA.</description>
+	<requirements>
+	  <container type="docker">sblanck/smagexp</container>
+	</requirements>
+	<command>
+		<![CDATA[ 
+		/galaxy-tools/stderr_wrapper.py Rscript 
+		/galaxy-tools/transcriptomics/MetaMA/MetaMA.R
+		#for $currentInput in $inputList
+        	"${currentInput.rdataset}"
+		 #end for
+       		$result_html 
+			$result_html.extra_files_path
+		/galaxy-tools/transcriptomics/MetaMA/MetaMa_tpl.html
+		]]>
+	</command>
+	
+	<inputs>
+		<repeat name="inputList" title="Datasets">
+			<param name="rdataset" type="data" format="rdata" label="RData" help="RData to be used"/>
+		</repeat>
+	</inputs>
+	
+	<outputs>
+		<data format="html" name="result_html" label="Meta-analysis results"/>
+	</outputs>
+
+	<help>
+<![CDATA[ 
+**What it does**
+		
+Given several Rdata object this tool run a meta-analysis using the metaMA R package.
+		
+**Results**
+		
+- Venn Diagram summarizing the results of the meta-analysis
+- A list of indicators to evaluate the quality of the performance of the meta-analysis
+		
+	- DE : Number of differentially expressed genes 
+	- IDD (Integration Driven discoveries) : number of genes that are declared differentially expressed in the meta-analysis that were not identified in any of the single studies alone
+	- Loss : Number of genes that are identified differentially expressed in single studies but not in meta-analysis 
+	- DR (Integration-driven Discovery Rate) : corresponding proportion of IDD
+	- IRR (Integration-driven Revision) : corresponding proportion of Loss
+		
+- Fully sortable and requestable table, with gene annotations and hypertext links to NCBI gene database.
+]]>
+	</help>
+
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/MetaRNAseq.xml	Thu Nov 10 07:34:57 2016 -0500
@@ -0,0 +1,34 @@
+<tool id="metarnaseq" name="RNA-seq data meta-analysis">
+	<description>perform meta-analysis thanks to metaRNAseq</description>
+	<requirements>
+	  	<container type="docker">sblanck/smagexp</container>
+	</requirements>
+	<command>
+		<![CDATA[ 	
+		/galaxy-tools/stderr_wrapper.py Rscript 
+		/galaxy-tools/transcriptomics/MetaRNASeq/MetaRNASeq.R 
+		#for $currentInput in $inputList
+        	"${currentInput}"
+			"${currentInput.name}"	
+		 #end for	
+			$top_table 
+			$diagnostic_html 
+			"$diagnostic_html.files_path"
+		/galaxy-tools/transcriptomics/MetaRNASeq/MetaRNASeq_tpl.html
+	]]>	
+	</command>
+
+	<inputs>
+		<param format="tabular" name="inputList" multiple="true" type="data" optional="false" label="Counts file" help="Must have the same number of row in each study. The experimental conditions must be specified in the header of each file"/>
+	</inputs>
+
+	<outputs>
+		<data format="tabular" name="top_table" label="Summary of meta-analysis and single studie analysis from ${tool.name} on ${on_string}"/>
+		<data format="html" name="diagnostic_html" label="Charts for ${tool.name} on ${on_string}"/>
+	</outputs>
+
+	<help>
+		
+	</help>
+
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/repository_dependencies.xml	Thu Nov 10 07:34:57 2016 -0500
@@ -0,0 +1,4 @@
+<?xml version="1.0"?>
+<repositories description="smagexp datatypes">
+  <repository changeset_revision="f66f8566fd75" name="smagexp_datatypes" owner="sblanck" toolshed="https://testtoolshed.g2.bx.psu.edu" />
+</repositories>