Mercurial > repos > petr-novak > repeat_annotation_pipeline3
annotate repeat_annotate_custom.xml @ 4:d7bb42f254a2 draft
"planemo upload commit fa6d4eb0c804e873b60bb2ba3d0e85646c9cd764"
author | petr-novak |
---|---|
date | Mon, 14 Mar 2022 10:16:07 +0000 |
parents | 4ea506b39297 |
children | b53f5a456d01 |
rev | line source |
---|---|
4
d7bb42f254a2
"planemo upload commit fa6d4eb0c804e873b60bb2ba3d0e85646c9cd764"
petr-novak
parents:
3
diff
changeset
|
1 <tool id="repeat_annotate" name="Library Based Assembly Annotation" version="0.1.3" python_template_version="3.5"> |
0 | 2 <requirements> |
3 <requirement type="package">repeatmasker</requirement> | |
4 <requirement type="package">bioconductor-rtracklayer</requirement> | |
5 </requirements> | |
6 <command detect_errors="exit_code"><![CDATA[ | |
3 | 7 |
8 #if $sensitivity.value == 'default': | |
9 RepeatMasker -dir \$(pwd) '$input' -pa 32 -lib '$repeat_library' -xsmall -nolow -no_is -e ncbi | |
10 #else: | |
11 RepeatMasker -dir \$(pwd) '$input' -pa 32 -lib '$repeat_library' -xsmall -nolow -no_is -e ncbi $sensitivity | |
12 #end if | |
0 | 13 && |
14 ls -l * >&2 && | |
15 cp `basename $input`.out $output2 | |
16 && | |
17 Rscript ${__tool_directory__}/clean_rm_output.R $output2 $output1 | |
18 | |
19 ]]></command> | |
20 <inputs> | |
21 <param type="data" name="input" format="fasta" label="Genome/ Assembly to annotate" /> | |
22 <param type="data" name="repeat_library" format="fasta" label="RepeatExplorer based Library of Repetitive Sequences" | |
23 help="custom database of repetitive sequences should be provided in fasta format. Sequence header should specify repeat class: | |
24 >sequence_id#classification_level1/classification_level2/..." /> | |
3 | 25 <param type="select" label="sensitivity" name="sensitivity" > |
26 <option value="default" selected="true" >Default sensitivity </option> | |
27 <option value="-s">Slow search, more sensitive </option> | |
28 <option value="-q">Quick search, more sensitive </option> | |
29 </param> | |
0 | 30 </inputs> |
31 <outputs> | |
32 <data name="output1" format="gff3" label="Repeat Annotation on ${on_string}, cleaned gff"/> | |
33 <data name="output2" format="tabular" label="Raw output from RepeatMasker on ${on_string}" /> | |
34 </outputs> | |
35 <help><![CDATA[ | |
3 | 36 This tools uses RepeatMasker to annotate repetitive sequences in the genome assemblies using custom library of repeats created either from RepeatExplorer output or from DANTE_LTR transposable element library. |
37 Library of repeats can be created from RepeatExplorer output from contigs and TAREAN consensus sequences. | |
38 Fasta formatted library of repeats must contain header containing information about classification of repeats as **>sequence_id#classification_level1/classification_level2/...** | |
0 | 39 |
3 | 40 Classification in RepeatExplorer based library follows predetermined classification levels. User can however specify additional classification levels or custom classifications. |
41 Conflicts in annotations are resolved based on classification hierarchy. | |
0 | 42 ]]></help> |
43 </tool> | |
44 |