comparison hal_halLodExtract.xml @ 0:d398af42f54a draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/main/tools/haltools commit 6244b9d15a5ad97ae20191e2f8fbafe2050c3cac
author iuc
date Fri, 06 Feb 2026 10:32:18 +0000
parents
children b95d65e23448
comparison
equal deleted inserted replaced
-1:000000000000 0:d398af42f54a
1 <tool id="hal_hallodextract" name="halLodExtract" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
2 <description>generates a new HAL file at a coarser Level of Detail by interpolation</description>
3 <macros>
4 <import>macros.xml</import>
5 </macros>
6 <expand macro="requirements"/>
7 <expand macro="stdio"/>
8 <command detect_errors="aggressive"><![CDATA[
9 halLodExtract
10 #if $backend.format == 'mmap':
11 --format 'mmap'
12 --mmapFileSize $backend.mmapFileSize
13 #end if
14 #if $root:
15 --root '$root'
16 #end if
17 #if $outTree:
18 --outTree '$outTree'
19 #end if
20 --probeFrac $probeFrac
21 --minSeqFrac $minSeqFrac
22 $keepSequences
23 $allSequences
24 '$input_hal' '$output_file' $scale
25 ]]></command>
26 <inputs>
27 <expand macro="input_hal"/>
28 <param name="scale" type="float" min="1" optional="false" label="Scale factor for interpolation"/>
29 <expand macro="params_root_optional"/>
30 <param argument="--outTree" type="text" value="" optional="true" label="Newick tree for new HAL file" help="Specify the Newick tree for the new HAL file. Must contain only genomes from the input HAL file (input's tree used if empty)">
31 <expand macro="sanitizer_default"/>
32 <expand macro="validator_newick"/>
33 </param>
34 <param argument="--probeFrac" type="float" value="0.035" min="0" label="Fraction of bases in step-interval" help="Fraction of bases in step-interval to sample while looking for most aligned column"/>
35 <param argument="--minSeqFrac" type="float" value="0.5" min="0" label="Minumum sequence length to sample (as fraction)" help="Minumum sequence length to sample as fraction of step size: i.e. sequences with length &lt;= floor(minSeqFrac * step) are ignored"/>
36 <param argument="--keepSequences" type="boolean" truevalue="--keepSequences" falsevalue="" checked="false" label="Keep sequences" help="Write the sequence strings to the output file"/>
37 <param argument="--allSequences" type="boolean" truevalue="--allSequences" falsevalue="" checked="false" label="All sequences" help="Sample all sequences (chromsomes / contigs / etc.) no matter how small they are. By default, small sequences may be skipped if they fall within the step size"/>
38 <expand macro="hal_backend_format"/>
39 </inputs>
40 <outputs>
41 <data name="output_file" format="hal" label="${tool.name} on ${on_string}: New HAL"/>
42 </outputs>
43 <tests>
44 <test expect_num_outputs="1">
45 <param name="input_hal" value="halTest.hal"/>
46 <param name="scale" value="10"/>
47 <output name="output_file" ftype="hal">
48 <assert_contents>
49 <has_size min="40000"/>
50 </assert_contents>
51 </output>
52 <assert_stdout>
53 <has_text text="tree ="/>
54 <has_text text="Graph:"/>
55 </assert_stdout>
56 </test>
57 <test expect_num_outputs="1">
58 <param name="input_hal" value="halTest.hal"/>
59 <param name="scale" value="10"/>
60 <output name="output_file" ftype="hal">
61 <assert_contents>
62 <has_size min="40000"/>
63 </assert_contents>
64 </output>
65 <assert_stdout>
66 <has_text text="tree ="/>
67 <has_text text="Graph:"/>
68 </assert_stdout>
69 </test>
70 <test expect_num_outputs="1">
71 <param name="input_hal" value="halTest.hal"/>
72 <param name="scale" value="10"/>
73 <param name="root" value="Genome_0"/>
74 <param name="outTree" value="(Genome_1:1,Genome_2:1,Genome_3:1)Genome_0;"/>
75 <output name="output_file" ftype="hal">
76 <assert_contents>
77 <has_size min="40000"/>
78 </assert_contents>
79 </output>
80 <assert_stdout>
81 <has_text text="tree ="/>
82 <has_text text="Graph:"/>
83 </assert_stdout>
84 </test>
85 <test expect_num_outputs="1">
86 <param name="input_hal" value="halTest.hal"/>
87 <param name="scale" value="10"/>
88 <param name="minSeqFrac" value="1"/>
89 <param name="keepSequences" value="true"/>
90 <param name="allSequences" value="true"/>
91 <output name="output_file" ftype="hal">
92 <assert_contents>
93 <has_size min="50000"/>
94 </assert_contents>
95 </output>
96 <assert_stdout>
97 <has_text text="tree ="/>
98 <has_text text="Graph:"/>
99 </assert_stdout>
100 </test>
101 </tests>
102 <help><![CDATA[
103 halLodExtract generates a reduced resolution HAL file as output from an input HAL file by sampling the alignment at a coarser Level of Detail by interpolation.
104 It needs a scale value that controls how the data is downsampled.
105 The tool can keep or drop short sequences, adjust how sequences are filtered relative to the step size, and optionally retain sequence strings.
106 Choose a different output tree, set a root genome, and tune how many bases are probed when selecting representative columns.
107
108 Use it to create a lighter HAL file for visualization, fast browsing, or downstream analyses that do not require full-resolution data.
109
110 -----
111
112 .. class:: warningmark
113
114 Running the tool on a HAL file in mmap format may fail, while the HDF5 format can run successfully. It is recommended to convert the input to HDF5 format first using halExtract.
115
116 .. class:: warningmark
117
118 At the moment, creating a HAL file in mmap format is disabled. The creation in HDF5 format is enforced.
119 ]]></help>
120 <expand macro="citation"/>
121 <expand macro="creator"/>
122 </tool>