diff align_families.xml @ 4:5fbeaa41b223 draft

Update to Du Novo 2.0.6.
author nick
date Wed, 25 Oct 2017 19:26:43 -0400
parents 00dde366870a
children 000969829a5d
line wrap: on
line diff
--- a/align_families.xml	Mon Sep 11 16:59:44 2017 -0400
+++ b/align_families.xml	Wed Oct 25 19:26:43 2017 -0400
@@ -1,16 +1,20 @@
 <?xml version="1.0"?>
-<tool id="align_families" name="Du Novo: Align families" version="0.8.1">
+<tool id="align_families" name="Du Novo: Align families" version="2.0.6">
   <description>of duplex sequencing reads</description>
   <requirements>
     <requirement type="package" version="7.221">mafft</requirement>
-    <requirement type="package" version="0.8.1">dunovo</requirement>
+    <requirement type="package" version="2.0.6">dunovo</requirement>
     <!-- TODO: require Python 2.7 -->
   </requirements>
-  <command detect_errors="exit_code">align_families.py --galaxy $phone --processes \${GALAXY_SLOTS:-1} '$input' &gt; '$output'
+  <command detect_errors="exit_code">align_families.py --aligner $aligner --galaxy $phone --processes \${GALAXY_SLOTS:-1} '$input' &gt; '$output'
   </command>
   <inputs>
     <param name="input" type="data" format="tabular" label="Input reads" help="with barcodes, grouped by family"/>
-    <param name="phone" type="boolean" truevalue="--phone-home" falsevalue="" checked="False" label="Send anonymous usage data" help="Report helpful usage data to the developer, to better understand the use cases and performance of the tool. The only data which will be recorded is the name and version of the tool, the size of the input data, the time taken to process it, and the IP address of the machine running it. No parameters or filenames are sent."/>
+    <param name="aligner" type="select" label="Multiple sequence aligner" help="MAFFT is the original aligner Du Novo was published with in 2016. Kalign is much faster and has similar accuracy.">
+      <option value="kalign">Kalign2</option>
+      <option value="mafft" selected="true">MAFFT</option> <!-- default choice: a select param takes its default from selected="true" on an option, not from a value attribute on param -->
+    </param>
+    <param name="phone" type="boolean" truevalue="--phone-home" falsevalue="" checked="False" label="Send usage data" help="Report helpful usage data to the developer, to better understand the use cases and performance of the tool. The only data which will be recorded is the name and version of the tool, the size of the input data, the number of processes used, the time and memory taken to process it, the alignment algorithm selected, and the IP address of the machine running it. Also, if the tool fails, it will report the name of the exception thrown and the line of code it occurred in. The names of the input and output datasets are not sent. All the reporting and recording code is available at https://github.com/NickSto/ET."/>
   </inputs>
   <outputs>
     <data name="output" format="tabular"/>
@@ -21,26 +25,10 @@
       <output name="output" file="smoke.families.aligned.tsv"/>
     </test>
     <test>
-      <param name="input" value="families.in.tsv"/>
-      <output name="output" file="families.sort.tsv"/>
+      <param name="input" value="families.sort.tsv"/>
+      <output name="output" file="families.msa.tsv"/>
     </test>
   </tests>
-  <citations>
-    <citation type="bibtex">@article{Stoler2016,
-      author = {Stoler, Nicholas and Arbeithuber, Barbara and Guiblet, Wilfried and Makova, Kateryna D and Nekrutenko, Anton},
-      doi = {10.1186/s13059-016-1039-4},
-      issn = {1474-760X},
-      journal = {Genome biology},
-      number = {1},
-      pages = {180},
-      pmid = {27566673},
-      publisher = {Genome Biology},
-      title = {{Streamlined analysis of duplex sequencing data with Du Novo.}},
-      url = {http://www.ncbi.nlm.nih.gov/pubmed/27566673},
-      volume = {17},
-      year = {2016}
-    }</citation>
-  </citations>
   <help>
 
 **What it does**
@@ -77,5 +65,21 @@
 
   $ mafft --nuc --quiet family.fa &gt; family.aligned.fa
 
-    </help>
+  </help>
+  <citations>
+    <citation type="bibtex">@article{Stoler2016,
+      author = {Stoler, Nicholas and Arbeithuber, Barbara and Guiblet, Wilfried and Makova, Kateryna D and Nekrutenko, Anton},
+      doi = {10.1186/s13059-016-1039-4},
+      issn = {1474-760X},
+      journal = {Genome biology},
+      number = {1},
+      pages = {180},
+      pmid = {27566673},
+      publisher = {Genome Biology},
+      title = {{Streamlined analysis of duplex sequencing data with Du Novo.}},
+      url = {http://www.ncbi.nlm.nih.gov/pubmed/27566673},
+      volume = {17},
+      year = {2016}
+    }</citation>
+  </citations>
 </tool>