annotate masurca.xml @ 1:03edd7b30f66 draft

Deleted selected files
author dnbenso
date Mon, 24 Jan 2022 00:00:54 +0000
parents 3f13e9565679
children 1808eaa9d699
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
1 <tool id="masurca" name="MaSuRCA" version="@TOOL_VERSION@+galaxy0">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
2 <description>The MaSuRCA (Maryland Super Read Cabog Assembler) genome assembly and analysis toolkit with config</description>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
3 <macros>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
4 <token name="@TOOL_VERSION@">4.0.6</token>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
5 </macros>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
6 <requirements>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
7 <requirement type="package" version="@TOOL_VERSION@">masurca</requirement>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
8 </requirements>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
9 <command detect_errors="exit_code"><![CDATA[
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
10 cp $__tool_directory__/default-masurca-config config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
11 #if $nanopore_input.np_input == "Yes":
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
12 #if $pacbio_input.pb_input == "Yes":
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
13 cat '$nanopore_input.nano' '$pacbio_input.pacbio' > long.fastq.gz &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
14 #else:
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
15 ln -s '$nanopore_input.nano' long.fastq.gz &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
16 #end if
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
17 sed -i 's|#NANOPORE=INPUTREADLONG|NANOPORE=long.fastq.gz|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
18 #elif $pacbio_input.pb_input == "Yes":
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
19 ln -s '$pacbio_input.pacbio' long.fastq.gz &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
20 sed -i 's|#PACBIO=INPUTREADLONG|PACBIO=long.fastq.gz|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
21 #end if
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
22 #if str( $illumina_input.input_type ) == "single"
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
23 ln -s '$illumina_input.fastq_input1' ill_1.fastq.gz &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
24 sed -i 's|INPUTREAD1|ill_1.fastq.gz|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
25 #elif str( $illumina_input.input_type ) == "paired"
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
26 ln -s '$illumina_input.fastq_input1' ill_1.fastq.gz &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
27 sed -i 's|INPUTREAD1|ill_1.fastq.gz|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
28 ln -s '$illumina_input.fastq_input2' ill_2.fastq.gz &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
29 sed -i 's|INPUTREAD2|ill_2.fastq.gz|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
30 #elif str( $illumina_input.input_type ) == "paired_collection"
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
31 ln -s '$illumina_input.fastq_input1.forward' ill_1.fastq.gz &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
32 sed -i 's|INPUTREAD1|ill_1.fastq.gz|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
33 ln -s '$illumina_input.fastq_input1.reverse' ill_2.fastq.gz &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
34 sed -i 's|INPUTREAD2|ill_2.fastq.gz|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
35 #end if
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
36 #if $reference_input.ref_input == "Yes":
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
37 sed -i 's|#REFERENCE=REF|REFERENCE=$reference_input.ref|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
38 #end if
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
39 sed -i 's|GALAXY_SLOTS|'\${GALAXY_SLOTS:-8}'|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
40 sed -i 's|MEAN|$mean|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
41 sed -i 's|STDDEV|$stddev|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
42 sed -i 's|JELLYFISHSIZE|$jfsize|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
43 sed -i 's|USE_LINKING_MATES = 0|USE_LINKING_MATES = $lnkmts|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
44 sed -i 's|FLYE_ASSEMBLY=0|FLYE_ASSEMBLY=$flye|' config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
45 masurca config.txt &&
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
46 bash assemble.sh
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
47 ]]></command>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
48 <inputs>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
49 <conditional name="illumina_input">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
50 <param name="input_type" type="select" label="Illumina read type" help="Select between single, paired and paired collection">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
51 <option value="single">Single</option>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
52 <option value="paired">Paired</option>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
53 <option value="paired_collection">Paired Collection</option>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
54 </param>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
55 <when value="single">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
56 <param type="data" name="fastq_input1" format="fastqsanger,fastqsanger.gz"
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
57 label="Select unpaired reads" help="Specify dataset with unpaired reads"/>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
58 </when>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
59 <when value="paired">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
60 <param type="data" name="fastq_input1" format="fastqsanger,fastqsanger.gz"
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
61 label="Select first set of reads" help="Specify dataset with forward reads"/>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
62 <param type="data" name="fastq_input2" format="fastqsanger,fastqsanger.gz"
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
63 label="Select second set of reads" help="Specify dataset with reverse reads"/>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
64 </when>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
65 <when value="paired_collection">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
66 <param name="fastq_input1" format="fastqsanger,fastqsanger.gz" type="data_collection" collection_type="paired" label="Select a paired collection" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
67 </when>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
68 </conditional>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
69 <param type="integer" name="mean" value="500" label="Mean size" help="Library insert average length" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
70 <param type="integer" name="stddev" value="50" label="Standard deviation"
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
71 help="Library insert standard deviation - if not known, set it to approximately 15% of the mean" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
72 <conditional name="nanopore_input">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
73 <param name="np_input" type="select" label="Use Nanopore long reads" help="Optional Nanopore reads must be in a single fasta or fastq file">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
74 <option value="No" selected="true">No</option>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
75 <option value="Yes">Yes</option>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
76 </param>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
77 <when value="No"/>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
78 <when value="Yes">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
79 <param type="data" name="nano" format="fastqsanger,fastqsanger.gz,fasta,fasta.gz" label="nanopore reads" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
80 </when>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
81 </conditional>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
82 <conditional name="pacbio_input">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
83 <param name="pb_input" type="select" label="Use Pacbio long reads" help="Optional Pacbio reads must be in a single fasta or fastq file">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
84 <option value="No" selected="true">No</option>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
85 <option value="Yes">Yes</option>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
86 </param>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
87 <when value="No"/>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
88 <when value="Yes">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
89 <param type="data" name="pacbio" format="fastqsanger,fastqsanger.gz,fasta,fasta.gz" label="pacbio reads" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
90 </when>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
91 </conditional>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
92 <conditional name="reference_input">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
93 <param name="ref_input" type="select" label="Synteny-assisted assembly" help="Concatenate all reference genomes into one reference.fa; works for Illumina-only data">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
94 <option value="No" selected="true">No</option>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
95 <option value="Yes">Yes</option>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
96 </param>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
97 <when value="No"/>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
98 <when value="Yes">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
99 <param type="data" name="ref" format="fasta,fasta.gz" label="Reference" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
100 </when>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
101 </conditional>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
102 <param type="integer" name="jfsize" value="20000000" label="Jellyfish hash size" help="Set this to about 10x the genome size" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
103 <param type="boolean" name="flye" truevalue="1" falsevalue="0" label="Set this to use Flye assembler for final assembly of corrected mega-reads"
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
104 help="If you are doing Hybrid Illumina paired end + Nanopore/PacBio assembly ONLY (no Illumina mate pairs or OTHER frg files). DO NOT use if you have less than 15x coverage by long read" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
105 <param type="boolean" name="lnkmts" truevalue="1" falsevalue="0" label="Include Linking Mates"
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
106 help="Most of the paired end reads end up in the same super read and thus are not passed to the assembler. Those that do not end up in the same super read are called “linking mates”. The best assembly results are achieved by setting this parameter to 1 for Illumina-only assemblies. If you have more than 2x coverage by long reads, set this to 0." />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
107 </inputs>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
108 <outputs>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
109 <data name="superReads" format="fasta" from_work_dir="superReadSequences.named.fasta" label="${tool.name} on ${on_string}: named_superReads" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
110 <data name="scaffold_prm" format="fasta" from_work_dir="CA.mr.*/primary.genome.scf.fasta" label="${tool.name} on ${on_string}: primary_genome">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
111 <filter>flye == False</filter>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
112 </data>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
113 <data name="scaffold_alt" format="fasta" from_work_dir="CA.mr.*/alternative.genome.scf.fasta" label="${tool.name} on ${on_string}: alternative_genome">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
114 <filter>flye == False</filter>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
115 </data>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
116 <data name="flye_assembly" format="fasta" from_work_dir="flye.mr.*/assembly.fasta" label="${tool.name} on ${on_string}: flye_assembly">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
117 <filter>flye == True</filter>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
118 </data>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
119 </outputs>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
120 <tests>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
121 <test>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
122 <conditional name="illumina_input">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
123 <param name="input_type" value="paired" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
124 <param name="fastq_input1" value="illumina_reads_1.fastq"/>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
125 <param name="fastq_input2" value="illumina_reads_2.fastq"/>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
126 </conditional>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
127 <conditional name="nanopore_input">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
128 <param name="np_input" value="Yes" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
129 <param name="nano" value="nanopore_reads.fastq" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
130 </conditional>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
131 <conditional name="pacbio_input">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
132 <param name="pb_input" value="No" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
133 </conditional>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
134 <conditional name="reference_input">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
135 <param name="ref_input" value="Yes" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
136 <param name="ref" value="reference_genome.fasta" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
137 </conditional>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
138 <param name="mean" value="500" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
139 <param name="stddev" value="50" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
140 <param name="jfsize" value="80349460" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
141 <param name="flye" value="1" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
142 <param name="lnkmts" value="0" />
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
143 <output name="superReads" ftype="fasta">
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
144 <assert_contents>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
145 <has_line_matching expression="^GAAAGCCGTGGCTTGGAACGGTGCTGATTGATCCGGC.*"/>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
146 </assert_contents>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
147 </output>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
148 </test>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
149 </tests>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
150 <help><![CDATA[
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
151
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
152 This implementation of MaSuRCA uses a config file for more complicated
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
153 assemblies and to change default settings. Illumina reads (mandatory)
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
154 and long reads from PacBio or Oxford Nanopore or both can be included.
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
155
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
156 ]]></help>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
157 <citations>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
158 <citation type="doi">10.1093/bioinformatics/btt476</citation>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
159 </citations>
3f13e9565679 Uploaded
dnbenso
parents:
diff changeset
160 </tool>