|
0
|
1 <tool id="export2graphlan" name="export2graphlan" version="1.0.0">
|
|
|
2 <description>Export to Graphlan</description>
|
|
|
<!--
  Command template (Cheetah) for export2graphlan.py.

  * The script name must stay the first token of the template: with
    interpreter="python" Galaxy resolves that first token against the tool
    directory (assumed Galaxy behaviour, to be confirmed for the target release).
  * Every substituted value is single-quoted so that values containing spaces
    (titles, clade lists, colour lists) reach the script as ONE argument and
    cannot be re-interpreted by the shell.
  * The optional text fields (background clades, background colours, title)
    are only passed when they contain something other than whitespace; the
    form default for them is a single space.
  * The most-abundant option is only passed when the integer is positive.
  * Rows 1 and 2 of the input table are always skipped (hard-coded).
-->
<command interpreter="python"><![CDATA[
export2graphlan.py
    -i '$inp_data'
    -o '$out_data'
    -t '$output_tree_file'
    -a '$output_annot_file'

    --annotations '$export_annotations'
    --external_annotations '$export_external_annotations'
    --background_levels '$background_levels'
    #if $str($background_clades).strip() != "":
        --background_clades '$background_clades'
    #end if
    #if $str($background_colors).strip() != "":
        --background_colors '$background_colors'
    #end if
    #if $str($export_title).strip() != "":
        --title '$export_title'
    #end if
    --title_font_size '$title_font_size'
    --def_clade_size '$def_clade_size'
    --min_clade_size '$min_clade_size'
    --max_clade_size '$max_clade_size'
    --def_font_size '$def_font_size'
    --min_font_size '$min_font_size'
    --max_font_size '$max_font_size'
    --annotation_legend_font_size '$annotation_legend_font_size'
    --abundance_threshold '$abundance_threshold'
    #if int(str($most_abundant)) > 0:
        --most_abundant '$most_abundant'
    #end if
    --skip_rows 1,2
]]></command>
|
|
|
36
|
|
|
<inputs>
  <!-- Datasets: the table that was fed to LEfSe and the LEfSe result. -->
  <param format="tabular" name="inp_data" type="data" label="Input used to run Lefse" help="This is the file that was used as input for Lefse"/>
  <param format="lefse_internal_res" name="out_data" type="data" label="Output of Lefse" help="This is the Lefse output file"/>

  <!-- Comma-separated level lists, always passed to the script. -->
  <param name="export_annotations" type="text" label="Annotations" value="2,3"/>
  <param name="export_external_annotations" type="text" label="External Annotations" value="4,5,6"/>
  <param name="background_levels" type="text" label="Background Levels" value="1,2,3"/>

  <!--
    Optional free-text fields. The single-space default is the "unset"
    sentinel: the command template omits the option for that value.
    NOTE(review): Galaxy's default text sanitizer may alter characters such as
    '#' and ';' that the documented colour syntax uses; confirm before relying
    on hex or HSV colours here.
  -->
  <param name="background_clades" type="text" label="Background Clades" value=" "/>
  <param name="background_colors" type="text" label="Background Colors" value=" "/>
  <param name="export_title" type="text" label="Title" value=" "/>

  <!-- Sizes for title, clades and fonts. -->
  <param name="title_font_size" type="integer" size="4" value="15" label="Title font size"/>
  <param name="def_clade_size" type="integer" size="4" value="0" label="Default Clade size"/>
  <param name="min_clade_size" type="integer" size="4" value="20" label="Minimum Clade size that are Biomarkers"/>
  <param name="max_clade_size" type="integer" size="4" value="200" label="Maximum Clade size that are Biomarkers"/>
  <param name="def_font_size" type="integer" size="4" value="10" label="Default font size"/>
  <param name="min_font_size" type="integer" size="4" value="8" label="Minimum font size "/>
  <param name="max_font_size" type="integer" size="4" value="12" label="Maximum font size "/>
  <param name="annotation_legend_font_size" type="integer" size="4" value="10" label="Annotation legend font size "/>

  <!-- Selection thresholds. most_abundant is only passed on when it is > 0. -->
  <param name="abundance_threshold" type="float" value="20.0" label="Abundance threshold: minimum abundance value for a clade to be annotated"/>
  <param name="most_abundant" type="integer" size="4" value="0" label=" When only lefse_input is provided, you can specify how many clades to highlight "/>

  <!--
    least_biomarkers: documented in the help below but not exposed by this
    wrapper; the command template never passes it. It previously appeared here
    as a stray text node instead of a param element.
  -->
</inputs>
|
|
|
<outputs>
  <!--
    Two datasets are produced: the annotation file (script option -a) and the
    tree file (script option -t). Explicit labels keep them distinguishable in
    the history; without them both would receive the same default name.
  -->
  <data name="output_annot_file" format="circl" label="${tool.name} on ${on_string}: annotation"/>
  <data name="output_tree_file" format="circl" label="${tool.name} on ${on_string}: tree"/>
</outputs>
|
|
|
63
|
|
|
64 <help>
|
|
|
65 Overview
|
|
|
66 ========
|
|
1
|
**export2graphlan** is an *OPTIONAL* tool that automatically converts **LEfSe**, **MetaPhlAn2**, and **HUMAnN** input and/or output files into the input files for **GraPhlAn**. The input file can also be given in BIOM format (both versions 1 and 2).
|
|
0
|
68
|
|
1
|
The aim of this tool is to support biologists by automatically providing the tree and the annotation file for GraPhlAn.
|
|
|
70
|
|
|
71 Input files
|
|
|
72 -----------
|
|
|
73
|
|
|
74 As shown in the image below, export2graphlan can work with just one of the following files or with both of them.
|
|
|
75
|
|
|
* **Result of MetaPhlAn or HUMAnN analysis**: As depicted in the image below, this file can be the result of a MetaPhlAn analysis or a HUMAnN analysis. Generally, it is a tab-separated file that has, for each row, a taxonomy and an abundance value.
|
|
|
77
|
|
|
* **Output of LEfSe**: This file is the result of LEfSe executed on the *Result of MetaPhlAn or HUMAnN analysis* file. This file allows GraPhlAn to highlight the biomarkers that were found.
|
|
|
79
|
|
21
|
80 Input parameters
|
|
|
81 ----------------
|
|
3
|
82
|
|
4
|
83 --annotations ANNOTATIONS
|
|
1
|
List which levels should be annotated in the tree. Use
a comma-separated list of values, e.g.,
--annotations 1,2,3. Default is None
|
|
4
|
87 --external_annotations EXTERNAL_ANNOTATIONS
|
|
1
|
List which levels should use the external legend for
the annotation. Use a comma-separated list of values,
e.g., --external_annotations 1,2,3. Default is None
|
|
|
91 --background_levels BACKGROUND_LEVELS
|
|
|
List which levels should be highlighted with a shaded
background. Use a comma-separated list of values, e.g.,
--background_levels 1,2,3
|
|
|
95 --background_clades BACKGROUND_CLADES
|
|
|
Specify the clades that should be highlighted with a
shaded background. Use a comma-separated list of values
and surround the string with " if it contains spaces.
|
|
|
99 Example: --background_clades "Bacteria.Actinobacteria,
|
|
|
100 Bacteria.Bacteroidetes.Bacteroidia,
|
|
|
101 Bacteria.Firmicutes.Clostridia.Clostridiales"
|
|
|
102 --background_colors BACKGROUND_COLORS
|
|
|
103 Set the color to use for the shaded background. Colors
|
|
|
104 can be either in RGB or HSV (using a semi-colon to
|
|
|
105 separate values, surrounded with ()) format. Use a
|
|
|
106 comma separate values form and surround the string
|
|
|
107 with " if it contains spaces. Example:
|
|
|
108 --background_colors "#29cc36, (150; 100; 100), (280;
|
|
|
109 80; 88)"
|
|
|
110 --title TITLE If specified set the title of the GraPhlAn plot.
|
|
|
111 Surround the string with " if it contains spaces,
|
|
|
112 e.g., --title "Title example"
|
|
|
113 --title_font_size TITLE_FONT_SIZE
|
|
|
114 Set the title font size. Default is 15
|
|
|
115 --def_clade_size DEF_CLADE_SIZE
|
|
|
116 Set a default size for clades that are not found as
|
|
|
117 biomarkers by LEfSe. Default is 10
|
|
|
118 --min_clade_size MIN_CLADE_SIZE
|
|
|
119 Set the minimum value of clades that are biomarkers.
|
|
|
120 Default is 20
|
|
|
121 --max_clade_size MAX_CLADE_SIZE
|
|
|
122 Set the maximum value of clades that are biomarkers.
|
|
|
123 Default is 200
|
|
|
124 --def_font_size DEF_FONT_SIZE
|
|
|
125 Set a default font size. Default is 10
|
|
|
126 --min_font_size MIN_FONT_SIZE
|
|
|
127 Set the minimum font size to use. Default is 8
|
|
|
128 --max_font_size MAX_FONT_SIZE
|
|
|
129 Set the maximum font size. Default is 12
|
|
|
130 --annotation_legend_font_size ANNOTATION_LEGEND_FONT_SIZE
|
|
|
131 Set the font size for the annotation legend. Default
|
|
|
132 is 10
|
|
|
133 --abundance_threshold ABUNDANCE_THRESHOLD
|
|
|
Set the minimum abundance value for a clade to be
annotated. Default is 20.0
|
|
|
136 --most_abundant MOST_ABUNDANT
|
|
|
When only lefse_input is provided, you can specify how
many clades to highlight. Since the biomarkers are
missing, they will be chosen from the most abundant
|
|
|
140 --least_biomarkers LEAST_BIOMARKERS
|
|
|
When only lefse_input is provided, you can specify the
minimum number of biomarkers to extract. The taxonomy
is parsed, and the level is chosen in order to have
at least the specified number of biomarkers
|
|
|
--discard_otus  If specified, the OTU ids will be discarded from the
taxonomy. By default, OTU ids are kept in the taxonomy
|
|
|
--internal_levels  If specified, sum up the abundance values from leaf
to root. By default, abundances are not summed up on
the internal nodes
|
|
|
150
|
|
|
151 input parameters:
|
|
21
|
152
|
|
3
|
153 -i LEFSE_INPUT, --lefse_input LEFSE_INPUT
|
|
6
|
154
|
|
1
|
155 -o LEFSE_OUTPUT, --lefse_output LEFSE_OUTPUT
|
|
|
156
|
|
|
157 output parameters:
|
|
13
|
158
|
|
1
|
-t TREE, --tree TREE  Output filename where to save the input tree for GraPhlAn
|
|
13
|
160
|
|
9
|
161 -a ANNOTATION, --annotation ANNOTATION : This is the Output filename where to save GraPhlAn annotation
|
|
7
|
162
|
|
1
|
163 Input data matrix parameters:
|
|
|
164 --sep SEP
|
|
9
|
165 --out_table OUT_TABLE : This is where to write the processed data matrix to file
|
|
12
|
166
|
|
11
|
167 --fname_row FNAME_ROW : Row number containing the names of the features (default 0, specify -1 if no names are present in the matrix)
|
|
12
|
168
|
|
1
|
169 --sname_row SNAME_ROW
|
|
11
|
170 column number containing the names of the samples (default 0, specify -1 if no names are present in the matrix)
|
|
1
|
171 --metadata_rows METADATA_ROWS
|
|
|
Row numbers to use as metadata [default None, meaning
no metadata]
|
|
|
174 --skip_rows SKIP_ROWS
|
|
|
Row numbers to skip (0-indexed, comma separated) from
the input file [default None, meaning no rows skipped]
|
|
|
177 --sperc SPERC Percentile of sample value distribution for sample
|
|
|
178 selection
|
|
|
--fperc FPERC  Percentile of feature value distribution for feature
selection
|
|
|
181 --stop STOP Number of top samples to select (ordering based on
|
|
|
182 percentile specified by --sperc)
|
|
|
183 --ftop FTOP Number of top features to select (ordering based on
|
|
|
184 percentile specified by --fperc)
|
|
|
185 --def_na DEF_NA Set the default value for missing values [default None
|
|
|
186 which means no replacement]
|
|
|
187
|
|
|
188 Integration
|
|
|
189 ===========
|
|
|
190
|
|
|
191 A graphical representation of how **export2graphlan** can be integrated in the analysis pipeline:
|
|
0
|
192
|
|
|
193 .. image:: https://bitbucket.org/repo/oL6bEG/images/3364692296-graphlan_integration.png
|
|
1
|
194 :height: 672
|
|
|
195 :width: 800
|
|
0
|
196
|
|
1
|
197 Want to know more?
|
|
|
198 ==================
|
|
0
|
199
|
|
2
|
200 If you want to know more about **export2graphlan** please have a look at the tutorial
|
|
0
|
201 </help>
|
|
|
202 </tool>
|