comparison helixer.xml @ 2:7c1dc010a819 draft

planemo upload for repository https://github.com/genouest/galaxy-tools/tree/master/tools/helixer commit 85a0295d96722d39bc249fa3be1145ce2b9801e3
author genouest
date Mon, 26 Feb 2024 09:47:53 +0000
parents 7bc75dd0f782
children e3846dc36c4d
comparison
equal deleted inserted replaced
1:7bc75dd0f782 2:7c1dc010a819
1 <?xml version="1.0"?> 1 <?xml version="1.0"?>
2 <tool id="helixer" name="Helixer" version="@TOOL_VERSION@" profile="21.05"> 2 <tool id="helixer" name="Helixer" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="21.05">
3 <description>gene calling</description> 3 <description>gene calling</description>
4 <macros> 4 <macros>
5 <import>macros.xml</import> 5 <import>macros.xml</import>
6 </macros> 6 </macros>
7 7
13 13
14 /usr/local/bin/fetch_helixer_models.py && 14 /usr/local/bin/fetch_helixer_models.py &&
15 Helixer.py 15 Helixer.py
16 --fasta-path '$input' 16 --fasta-path '$input'
17 --species '$species' 17 --species '$species'
18 --lineage $lineage.lineages 18 --lineage '$lineages'
19 --gff-output-path '$output' 19 --gff-output-path '$output'
20 20
21 --temporary-dir ./ 21 --temporary-dir ./
22 22
23 --subsequence-length $lineage.subsequence_length 23 #set default_subsequence_length = {"fungi": 21384, "land_plant": 106920, "invertebrate": 213840, "vertebrate": 213840}
24 #if str($lineage.option_overlap.use_overlap) == "true": 24 #set subsequence_len = default_subsequence_length.get(str($lineages))
25 --overlap-offset $lineage.option_overlap.overlap_offset 25 #set default_overlap_offset = {"fungi": 10692, "land_plant": 53460, "invertebrate": 106920, "vertebrate": 106920}
26 --overlap-core-length $lineage.option_overlap.overlap_core_length 26 #set overlap_off = default_overlap_offset.get(str($lineages))
27 #set default_overlap_core_length = {"fungi": 16038, "land_plant": 80190, "invertebrate": 160380, "vertebrate": 160380}
28 #set overlap_core_len = default_overlap_core_length.get(str($lineages))
29
30 #if str($subsequence_length) == "":
31 --subsequence-length '$subsequence_len'
27 #else: 32 #else:
28 --no-overlap 33 --subsequence-length '$subsequence_length'
29 #end if 34 #end if
35
36 #if str($option_overlap.use_overlap) == "true":
37 #if str($option_overlap.overlap_offset) == "":
38 --overlap-offset '$overlap_off'
39 #else:
40 --overlap-offset '$overlap_offset'
41 #end if
42
43 #if str($option_overlap.overlap_core_length) == "":
44 --overlap-core-length '$overlap_core_len'
45 #else:
46 --overlap-core-length '$overlap_core_length'
47 #end if
48 #end if
49
30 --batch-size $size 50 --batch-size $size
31 --window-size $post_processing.window_size 51 --window-size $post_processing.window_size
32 --min-coding-length $post_processing.min_coding_length 52 --min-coding-length $post_processing.min_coding_length
33 --edge-threshold $post_processing.edge_threshold 53 --edge-threshold $post_processing.edge_threshold
34 --peak-threshold $post_processing.peak_threshold 54 --peak-threshold $post_processing.peak_threshold
55
35 ]]></command> 56 ]]></command>
36 57
37 <inputs> 58 <inputs>
38 <param argument="--fasta-path" name="input" type="data" format="fasta,fasta.gz" label="Genomic sequence"></param> 59 <param argument="--fasta-path" name="input" type="data" format="fasta,fasta.gz" label="Genomic sequence"></param>
39 <conditional name="lineage"> 60
40 <param argument="--lineage" name="lineages" type="select" label="Available lineages" help="Choose the model to use for the annotation"> 61 <param argument="--lineage" name="lineages" type="select" label="Available lineages" help="Choose the model to use for the annotation">
41 <option value="land_plant">land plant</option> 62 <option value="land_plant">land plant</option>
42 <option value="vertebrate">vertebrate</option> 63 <option value="vertebrate">vertebrate</option>
43 <option value="invertebrate">invertebrate</option> 64 <option value="invertebrate">invertebrate</option>
44 <option value="fungi">fungi</option> 65 <option value="fungi">fungi</option>
45 </param> 66 </param>
46 <when value="land_plant"> 67
47 <expand macro="subseq" length="106920" offset="53460" offsetlen="80190" />
48 </when>
49 <when value="vertebrate">
50 <expand macro="subseq" length="213840" offset="106920" offsetlen="160380" />
51 </when>
52 <when value="invertebrate">
53 <expand macro="subseq" length="213840" offset="106920" offsetlen="160380" />
54 </when>
55 <when value="fungi">
56 <expand macro="subseq" length="21384" offset="10692" offsetlen="16038" />
57 </when>
58 </conditional>
59 <param argument="--species" type="text" optional="true" label="Species name"> 68 <param argument="--species" type="text" optional="true" label="Species name">
60 <sanitizer invalid_char=""> 69 <sanitizer invalid_char="">
61 <valid initial="string.letters,string.digits"> 70 <valid initial="string.letters,string.digits">
62 <add value="_" /> 71 <add value="_" />
63 </valid> 72 </valid>
69 <param argument="--window-size" type="integer" min="0" value="100" label="Window size" help="This determines the number of bases averaged during the sliding window approach"/> 78 <param argument="--window-size" type="integer" min="0" value="100" label="Window size" help="This determines the number of bases averaged during the sliding window approach"/>
70 <param argument="--edge-threshold" type="float" min="0" max="1" value="0.1" label="Edge threshold" help="This threshold specifies the genic score which defines the start / end boundaries of each candidate region"/> 79 <param argument="--edge-threshold" type="float" min="0" max="1" value="0.1" label="Edge threshold" help="This threshold specifies the genic score which defines the start / end boundaries of each candidate region"/>
71 <param argument="--peak-threshold" type="float" min="0" max="1" value="0.8" label="Peak threshold" help="This threshold specifies the minimum peak genic score required to accept the candidate region"/> 80 <param argument="--peak-threshold" type="float" min="0" max="1" value="0.8" label="Peak threshold" help="This threshold specifies the minimum peak genic score required to accept the candidate region"/>
72 <param argument="--min-coding-length" type="integer" min="0" value="100" label="Minimum coding length"/> 81 <param argument="--min-coding-length" type="integer" min="0" value="100" label="Minimum coding length"/>
73 </section> 82 </section>
83
84 <param name="subsequence_length" type="text" label="Subsequence length: how much of the genome the Neural Network can see at once" help="If you do not want to keep the default value, please enter the new value. Default values are 21384 for fungi, 106920 for land plant, and 213840 for vertebrates and invertebrates"/>
85
86 <conditional name="option_overlap">
87 <param name="use_overlap" type="select" label="Enable overlapping step after predictions" help="This step combines predictions made on each subsequences, to improve quality near start and end of subsequences.">
88 <option value="true" selected="true">Yes</option>
89 <option value="false">No</option>
90 </param>
91 <when value="true">
92 <param name="overlap_offset" type="text" label="Overlap offset: Smaller values may lead to better predictions but will take longer" help="If you do not want to keep the default value, please enter the new value. Default values are 10692 for fungi, 53460 for land plant, and 106920 for vertebrates and invertebrates."/>
93 <param name="overlap_core_length" type="text" label="Overlap core length: Predicted subsequences will be cut to this length to increase prediction quality. Smaller values may lead to better predictions but will take longer" help="If you do not want to keep the default value, please enter the new value. Default values are 16038 for fungi, 80190 for land plant, and 160380 for vertebrates and invertebrates."/>
94 </when>
95 <when value="false"/>
96 </conditional>
74 </inputs> 97 </inputs>
75 98
76 <outputs> 99 <outputs>
77 <data name="output" format="gff3"> 100 <data name="output" format="gff3">
78 </data> 101 </data>
79 </outputs> 102 </outputs>
80 <tests> 103 <tests>
81 <test expect_num_outputs="1"> 104 <test expect_num_outputs="1">
82 <!-- Test for species and land_plant--> 105 <!-- Test for species and land_plant-->
83 <param name="input" value="sequence.fasta"/> 106 <param name="input" value="sequence.fasta"/>
107 <param name="lineages" value="land_plant"/>
84 <param name="species" value="Arabidopsis"/> 108 <param name="species" value="Arabidopsis"/>
85 <conditional name="lineage">
86 <param name="lineages" value="land_plant"/>
87 </conditional>
88 <param name="size" value="8"/> 109 <param name="size" value="8"/>
110 <param name="subsequence_length" value=""/>
111 <section name="post_processing">
112 <param name="window_size" value="100"/>
113 <param name="edge_threshold" value="0.1"/>
114 <param name="peak_threshold" value="0.8"/>
115 <param name="min_coding_length" value="100"/>
116 </section>
117 <conditional name="option_overlap">
118 <param name="use_overlap" value="true"/>
119 <param name="overlap_offset" value=""/>
120 <param name="overlap_core_length" value=""/>
121 </conditional>
89 <output name="output" value="ouput_species.gff3" ftype="gff3" compare="sim_size" delta="100"/> 122 <output name="output" value="ouput_species.gff3" ftype="gff3" compare="sim_size" delta="100"/>
90 </test> 123 </test>
124
91 <test expect_num_outputs="1"> 125 <test expect_num_outputs="1">
92 <!-- Test for vertebrates--> 126 <!-- Test for vertebrates-->
93 <param name="input" value="sequence.fasta"/> 127 <param name="input" value="sequence.fasta"/>
94 <conditional name="lineage"> 128 <param name="lineages" value="vertebrate"/>
95 <param name="lineages" value="vertebrate"/>
96 </conditional>
97 <param name="size" value="8"/> 129 <param name="size" value="8"/>
130 <param name="size" value="8"/>
131 <param name="subsequence_length" value=""/>
132 <section name="post_processing">
133 <param name="window_size" value="100"/>
134 <param name="edge_threshold" value="0.1"/>
135 <param name="peak_threshold" value="0.8"/>
136 <param name="min_coding_length" value="100"/>
137 </section>
138 <conditional name="option_overlap">
139 <param name="use_overlap" value="true"/>
140 <param name="overlap_offset" value=""/>
141 <param name="overlap_core_length" value=""/>
142 </conditional>
98 <output name="output" value="vertebrate.gff3" ftype="gff3" lines_diff="2"/> 143 <output name="output" value="vertebrate.gff3" ftype="gff3" lines_diff="2"/>
99 </test>
100 <test expect_num_outputs="1">
101 <!-- Test for invertebrates-->
102 <param name="input" value="sequence.fasta"/>
103 <conditional name="lineage">
104 <param name="lineages" value="invertebrate"/>
105 </conditional>
106 <param name="size" value="8"/>
107 <output name="output" value="invertebrate.gff3" ftype="gff3" lines_diff="2"/>
108 </test>
109 <test expect_num_outputs="1">
110 <!-- Test for fungi-->
111 <param name="input" value="sequence.fasta"/>
112 <conditional name="lineage">
113 <param name="lineages" value="fungi"/>
114 </conditional>
115 <param name="size" value="8"/>
116 <output name="output" value="fungi.gff3" ftype="gff3" lines_diff="2"/>
117 </test> 144 </test>
118 </tests> 145 </tests>
119 146
120 <help><![CDATA[ 147 <help><![CDATA[
121 Helixer_: Gene calling with Deep Neural Networks. 148 Helixer_: Gene calling with Deep Neural Networks.