44
|
1 <tool id="ctat_genome_resource_libs_data_manager"
|
|
2 name="CTAT Genome Resource Libraries Data Manager"
|
|
3 version="2.0.0" tool_type="manage_data">
|
|
4 <description>Retrieve, and/or specify the location of, a CTAT Genome Resource Library.
|
|
5 </description>
|
|
6 <requirements>
|
|
7 <requirement type="package" version="2.7">python</requirement>
|
|
8 <requirement type="package" version="0.5.0">fusion-filter</requirement>
|
|
9 <requirement type="package" version="2.0.1">ctat-mutations</requirement>
|
|
10 </requirements>
|
|
11 <command detect_errors="exit_code">
|
|
12 <![CDATA[
|
|
13 python $__tool_directory__/add_ctat_resource_lib.py
|
|
14 --output_filename="${out_file}"
|
|
15 --display_name="${display_name}"
|
|
16 #if str( $genome_resource_library.build_type ) == "download_and_build":
|
|
17 --download_url="${genome_resource_library.download_url}"
|
|
18 --download_location="${genome_resource_library.download_destination}"
|
|
19 #if str( $genome_resource_library.force_new_download ) == "true":
|
|
20 --new_archive_download
|
|
21 #end if
|
|
22 #if str( $genome_resource_library.keep_archive ) == "true":
|
|
23 --keep_archive
|
|
24 #end if
|
|
25 #if str( $genome_resource_library.rebuild ) == "true":
|
|
26 --new_library_build
|
|
27 #end if
|
|
28 #if str( $genome_resource_library.specify_build_location.build_location ) == "true":
|
|
29 --build_location="${genome_resource_library.specify_build_location.different_build_location}"
|
|
30 #end if
|
|
31 #elif str( $genome_resource_library.build_type ) == "build_from_source":
|
|
32 --source_location "${genome_resource_library.source_location}"
|
|
33 #if str( $genome_resource_library.rebuild ) == "true":
|
|
34 --new_library_build
|
|
35 #end if
|
|
36 #if str( $genome_resource_library.specify_build_location.build_location ) == "true":
|
|
37 --build_location="${genome_resource_library.specify_build_location.different_build_location}"
|
|
38 #end if
|
|
39 #elif str( $genome_resource_library.build_type ) == "specify_built_location":
|
|
40 --build_location="${genome_resource_library.built_library_location}"
|
|
41 #end if
|
|
42
|
|
43 #if str( $gmap_options.gmap_build ) == "true":
|
|
44 --gmap_build
|
|
45 #if str( $gmap_options.force_gmap_build ) == "true":
|
|
46 --force_gmap_build
|
|
47 #end if
|
|
48 #end if
|
|
49
|
|
50 #if str( $mutation_lib_options.mutation_build ) == "true":
|
|
51 --download_mutation_resources_url="${mutation_lib_options.source_url}"
|
|
52 --cosmic_resources_location="${mutation_lib_options.cosmic_files_location}"
|
|
53 #if str( $mutation_lib_options.force_download ) == "true":
|
|
54 --new_mutation_download
|
|
55 #end if
|
|
56 #if str( $mutation_lib_options.redo_integration ) == "true":
|
|
57 --new_mutation_integration
|
|
58 #end if
|
|
59 #end if
|
|
60 ]]>
|
|
61 </command>
|
|
62 <inputs>
|
|
63 <!-- The following are left in here, just as examples of various ways of doing options.
|
|
64 <param name="force_download" type="boolean" checked="false"
|
|
65 truevalue="- -force_download" falsevalue="" label="Force New Download? (yes/no)" />
|
|
66 <param name="download" type="select" label="Need to Download?">
|
|
67 <option value="single" selected="true">Single Dataset</option>
|
|
68 <option value="paired_collection">Paired Collection</option>
|
|
69 <when value="paired_collection">
|
|
70 <param name="fastq_input" format="fastqsanger" type="data_collection" collection_type="paired" label="Select dataset pair" help="Specify paired dataset collection containing paired reads"/>
|
|
71 </when>
|
|
72 -->
|
|
73 <conditional name="genome_resource_library">
|
|
74 <param name="build_type" type="select" label="Download CTAT Genome Resource Library?">
|
|
75 <option value="download_and_build" selected="true">Download from CTAT and build if needed</option>
|
|
76 <option value="build_from_source">Build library from local source data</option>
|
|
77 <option value="specify_built_location">Specify location of built library</option>
|
|
78 </param>
|
|
79 <when value="download_and_build">
|
|
80 <!-- The use of a code block to get dynamic options is now deprecated and discouraged.
|
|
81 I am still using it here. The only other way I can think of to do this is to
|
|
82 create another data_manager that gets the list of files and puts them into a
|
|
83 data_table, that is then used to get the filenames. That would require the admin
|
|
84 to first run the data_manager that builds the filename data_table before running
|
|
85 this data_manager.
|
|
86 This is the dynamic way to get the options filled.
|
|
87 <param name="filename" type="select" label="Select File" display="radio"
|
|
88 dynamic_options="get_ctat_genome_filenames()"
|
|
89 help="Select a CTAT Genome Resource Library to Download." />
|
|
90 Here is the static method for what is online in April 2017:
|
|
91 <param name="filename" type="select" label="Choose which library to download.">
|
|
92 <option value="https://data.broadinstitute.org/Trinity/CTAT_RESOURCE_LIB/GRCh37_v19_CTAT_lib_Feb092018.plug-n-play.tar.gz">
|
|
93 GRCh37_v19_CTAT_lib_Feb092018.plug-n-play.tar.gz
|
|
94 </option>
|
|
95 <option value="https://data.broadinstitute.org/Trinity/CTAT_RESOURCE_LIB/ GRCh37_v19_CTAT_lib_Feb092018.source_data.tar.gz">
|
|
96 GRCh37_v19_CTAT_lib_Feb092018.source_data.tar.gz
|
|
97 </option>
|
|
98 <option value="https://data.broadinstitute.org/Trinity/CTAT_RESOURCE_LIB/ GRCh38_v27_CTAT_lib_Feb092018.plug-n-play.tar.gz">
|
|
99 GRCh38_v27_CTAT_lib_Feb092018.plug-n-play.tar.gz
|
|
100 </option>
|
|
101 <option value="https://data.broadinstitute.org/Trinity/CTAT_RESOURCE_LIB/ GRCh38_v27_CTAT_lib_Feb092018.source_data.tar.gz">
|
|
102 GRCh38_v27_CTAT_lib_Feb092018.source_data.tar.gz
|
|
103 </option>
|
|
104 <option value="https://data.broadinstitute.org/Trinity/CTAT_RESOURCE_LIB/ Mouse_M16_CTAT_lib_Feb202018.plug-n-play.tar.gz">
|
|
105 Mouse_M16_CTAT_lib_Feb202018.plug-n-play.tar.gz
|
|
106 </option>
|
|
107 <option value="https://data.broadinstitute.org/Trinity/CTAT_RESOURCE_LIB/ Mouse_M16_CTAT_lib_Feb202018.source_data.tar.gz">
|
|
108 Mouse_M16_CTAT_lib_Feb202018.source_data.tar.gz
|
|
109 </option>
|
|
110 -->
|
|
111 <param name="download_url" type="select" label="Select a File"
|
|
112 dynamic_options="get_ctat_genome_urls()"
|
|
113 help="Select a CTAT Genome Resource Library to Download.">
|
|
114 </param>
|
|
115 <param name="download_destination" type="text" label="Download Destination (full path)" />
|
|
116 <param name="force_new_download" type="boolean" checked="false" label="Force New Download?" />
|
|
117 <param name="keep_archive" type="boolean" checked="true" label="Keep downloaded archive rather than deleting after build?" />
|
|
118 <param name="rebuild" type="boolean" checked="false" label="Force new build of Library?" />
|
|
119 <conditional name="specify_build_location">
|
|
120 <param name="build_location" type="boolean" checked="false" label="Is the build location different than the source location?" />
|
|
121 <when value="true">
|
|
122 <param name="different_build_location" type="text" label="Build Location (full path)" />
|
|
123 </when>
|
|
124 </conditional>
|
|
125 </when>
|
|
126 <when value="build_from_source">
|
|
127 <param name="source_location" type="text" label="Location of Source Files (full path)" />
|
|
128 <param name="rebuild" type="boolean" checked="false" label="Force new build of Library?" />
|
|
129 <conditional name="specify_build_location">
|
|
130 <param name="build_location" type="boolean" checked="false" label="Is the build location different than the source location?" />
|
|
131 <when value="true">
|
|
132 <param name="different_build_location" type="text" label="Build Location (full path)" />
|
|
133 </when>
|
|
134 </conditional>
|
|
135 </when>
|
|
136 <when value="specify_built_location">
|
|
137 <param name="built_library_location" type="text" label="Location of the Built Library (full path)" />
|
|
138 </when>
|
|
139 </conditional>
|
|
140 <param name="display_name" type="text" label="Reference Genome Display Name" />
|
|
141 <conditional name="gmap_options">
|
|
142 <param name="gmap_build" type="boolean" checked="true" label="Do a gmap_build on the Library?" />
|
|
143 <when value="true">
|
|
144 <param name="force_gmap_build" type="boolean" checked="false" label="Force a new build even if previously done?" />
|
|
145 </when>
|
|
146 </conditional>
|
|
147 <conditional name="mutation_lib_options">
|
|
148 <param name="mutation_build" type="boolean" checked="false" label="Download and integrate mutation library?">
|
|
149 </param>
|
|
150 <when value="true">
|
|
151 <param name="source_url" type="select" label="Select a File"
|
|
152 dynamic_options="get_mutation_resource_urls()"
|
|
153 help="Select CTAT Mutation Library File to Download.\nMake sure it is the right one for your CTAT Genome Resource Library!">
|
|
154 </param>
|
|
155 <param name="force_download" type="boolean" checked="false" label="Force New Download?" />
|
|
156 <param name="redo_integration" type="boolean" checked="false" label="Redo Library Integration?" />
|
|
157 <param name="cosmic_files_location" type="text" label="Location of the COSMIC files (See Tool Notes)." />
|
|
158 </when>
|
|
159 </conditional>
|
|
160 -->
|
|
161 </inputs>
|
|
162 <outputs>
|
|
163 <data name="out_file" format="data_manager_json" />
|
|
164 </outputs>
|
|
165 <help>
|
|
166 Retrieve, and/or specify the location of, a CTAT Genome Resource Library.
|
|
167
|
|
168 There are three options: 1) Download from CTAT and build if needed; 2) Build library from local source data; 3) Specify location of built library.
|
|
169
|
|
170 1) Download from CTAT and build if needed:
|
|
171 This option uses the files at https://data.broadinstitute.org/Trinity/CTAT_RESOURCE_LIB/
|
|
172 as selectors for the user to choose among.
|
|
173 Specify the Full Path of the location where the CTAT Genome Resource Library should be placed.
|
|
174 The other options should be self-explanatory.
|
|
175 2) Build library from local source data:
|
|
176 This assumes that you have already downloaded the source data for a build and you want to build it.
|
|
177 3) Specify location of built library:
|
|
178 This assumes you already have a build library and need tell galaxy where it is.
|
|
179
|
|
180 All options allow the user to do a gmap_build on the library
|
|
181 and also to integrate ctat-mutation resources into the library.
|
|
182
|
|
183 You will need approximately 62GB of space for this library, once it is built,
|
|
184 but if downloading and building, to be safe provide at least 75GB.
|
|
185
|
|
186 The installation of this tool takes some time, due to building a conda environment for the dependencies.
|
|
187 The "source_data" files download faster, but then must be built.
|
|
188 Building the library from the "source_data" files can take many hours, depending on the resources of your machine.
|
|
189 The "plug-n-play" can take considerable time to download, depending on your internet connection. Even with high speed,
|
|
190 it is about 25GB that is transfered, so plan accordingly.
|
|
191 If you have a good speed internet connection, downloading the plug-n-play will usually be faster than building.
|
|
192
|
|
193 **If a download or a build is interrupted, re-running the job should pick up where it left off.**
|
|
194
|
|
195 Neither the "source_data" nor the "plug-n-play" versions have had their gmap index built. If you are not going to be
|
|
196 using gmap_fusion, then you can uncheck the gmap_build check box and save the space and time building the index consumes.
|
|
197
|
|
198 Neither the "source_data" nor the "plug-n-play" versions have mutation resources included. Those must be downloaded
|
|
199 separately. By default the Mutation Resources are not integrated into the Library. If you are going to be using the
|
|
200 ctat_mutations tool, check the Download Mutation Library check box.
|
|
201
|
|
202 In order to integrate the Mutation Resources into a CTAT Genome Resource Library, you must have previously downloaded
|
|
203 COSMIC resources (See Step 2 from https://github.com/NCIP/ctat-mutations/tree/master/mutation_lib_prep )
|
|
204 You can place them directly into the Genome Resource Library location, or if the Library is
|
|
205 not built yet, or you do not know the full path to it, specify the directory where the COSMIC files are, so they can be
|
|
206 integrated into the Library.
|
|
207
|
|
208 The Mouse genome is not currently supported by ctat_mutations.
|
|
209
|
|
210 If the Reference Genome Display Name is left empty a name will be created,
|
|
211 but any text that will best guide the user can be entered here.
|
|
212 It will be the text that is used for selecting the library in pull down lists
|
|
213 requiring a Genome Reference Library resource (ctat_genome_resource_libs).
|
|
214
|
|
215 For more information on CTAT Genome Resource Libraries,
|
|
216 see https://github.com/FusionFilter/FusionFilter/wiki
|
|
217 </help>
|
|
218 <code file="add_ctat_resource_lib.py" />
|
|
219 </tool>
|