comparison read2mut.xml @ 43:d21960b45a6b draft

planemo upload for repository https://github.com/Single-Molecule-Genetics/VariantAnalyzerGalaxy/tree/master/tools/variant_analyzer commit ee4a8e6cf290e6c8a4d55f9cd2839d60ab3b11c8
author mheinzl
date Tue, 02 Mar 2021 15:32:41 +0000
parents da224c392a54
children 8fbe6aba07e5
comparison
equal deleted inserted replaced
42:da224c392a54 43:d21960b45a6b
1 <?xml version="1.0" encoding="UTF-8"?> 1 <?xml version="1.0" encoding="UTF-8"?>
2 <tool id="read2mut" name="Call specific mutations in reads:" version="2.0.4" profile="17.01"> 2 <tool id="read2mut" name="Call specific mutations in reads:" version="2.1.0" profile="19.01">
3 <description>Looks for reads with mutation at known positions and calculates frequencies and stats.</description> 3 <description>Looks for reads with mutation at known positions and calculates frequencies and stats.</description>
4 <macros> 4 <macros>
5 <import>va_macros.xml</import> 5 <import>va_macros.xml</import>
6 </macros> 6 </macros>
7 <expand macro="requirements"> 7 <requirements>
8 <requirement type="package" version="2.7">python</requirement>
9 <requirement type="package" version="1.4.0">matplotlib</requirement>
10 <requirement type="package" version="0.15">pysam</requirement>
8 <requirement type="package" version="1.1.0">xlsxwriter</requirement> 11 <requirement type="package" version="1.1.0">xlsxwriter</requirement>
9 </expand> 12 <requirement type="package" version="0.11.6">cyvcf2</requirement>
13 </requirements>
10 <command><![CDATA[ 14 <command><![CDATA[
11 ln -s '$file2' bam_input.bam && 15 ln -s '$file2' bam_input.bam &&
12 ln -s '${file2.metadata.bam_index}' bam_input.bam.bai && 16 ln -s '${file2.metadata.bam_index}' bam_input.bam.bai &&
13 python '$__tool_directory__/read2mut.py' 17 python '$__tool_directory__/read2mut.py'
14 --mutFile '$file1' 18 --mutFile '$file1'
15 --bamFile bam_input.bam 19 --bamFile bam_input.bam
16 --inputJson '$file3' 20 --inputJson '$file3'
17 --sscsJson '$file4' 21 --sscsJson '$file4'
18 --thresh '$thresh' 22 --thresh '$thresh'
19 --phred '$phred' 23 --phred '$phred'
20 --trim5 '$trim5' 24 --trim '$trim'
21 --trim3 '$trim3'
22 $chimera_correction 25 $chimera_correction
26 --softclipping_dist '$softclipping_dist'
27 --reads_threshold '$reads_threshold'
23 --outputFile '$output_xlsx' 28 --outputFile '$output_xlsx'
24 --outputFile_csv '$outputFile_csv'
25 --outputFile2 '$output_xlsx2' 29 --outputFile2 '$output_xlsx2'
26 --outputFile3 '$output_xlsx3' 30 --outputFile3 '$output_xlsx3'
27 ]]> 31 ]]>
28 </command> 32 </command>
29 <inputs> 33 <inputs>
31 <param name="file2" type="data" format="bam" label="BAM File of raw reads" optional="false" help="BAM file with aligned raw reads of selected tags."/> 35 <param name="file2" type="data" format="bam" label="BAM File of raw reads" optional="false" help="BAM file with aligned raw reads of selected tags."/>
32 <param name="file3" type="data" format="json" label="JSON File with DCS tag stats" optional="false" help="JSON file generated by DCS mutations to tags/reads"/> 36 <param name="file3" type="data" format="json" label="JSON File with DCS tag stats" optional="false" help="JSON file generated by DCS mutations to tags/reads"/>
33 <param name="file4" type="data" format="json" label="JSON File with SSCS tag stats" optional="false" help="JSON file generated by DCS mutations to SSCS stats."/> 37 <param name="file4" type="data" format="json" label="JSON File with SSCS tag stats" optional="false" help="JSON file generated by DCS mutations to SSCS stats."/>
34 <param name="thresh" type="integer" label="Tag count threshold" value="0" help="Integer threshold for displaying mutations. Only mutations occuring in DCS of less than thresh tags are displayed. Default of 0 displays all."/> 38 <param name="thresh" type="integer" label="Tag count threshold" value="0" help="Integer threshold for displaying mutations. Only mutations occuring in DCS of less than thresh tags are displayed. Default of 0 displays all."/>
35 <param name="phred" type="integer" label="Phred quality score threshold" min="0" max="41" value="20" help="Integer threshold for Phred quality score. Only reads higher than this threshold are considered. Default = 20."/> 39 <param name="phred" type="integer" label="Phred quality score threshold" min="0" max="41" value="20" help="Integer threshold for Phred quality score. Only reads higher than this threshold are considered. Default = 20."/>
36 <param name="trim5" type="integer" label="Trimming threshold at 5' end of reads" value="10" help="Integer threshold for assigning mutations at the beginning of reads to a lower tier. Default 10."/> 40 <param name="trim" type="integer" label="Trimming threshold" value="10" help="Integer threshold for assigning mutations at start and end of reads to lower tier. Default 10."/>
37 <param name="trim3" type="integer" label="Trimming threshold at 3' end of reads" value="10" help="Integer threshold for assigning mutations at the end of reads to a lower tier. Default 10."/>
38 <param name="chimera_correction" type="boolean" label="Apply chimera correction?" truevalue="--chimera_correction" falsevalue="" checked="False" help="Count chimeric variants and correct the variant frequencies."/> 41 <param name="chimera_correction" type="boolean" label="Apply chimera correction?" truevalue="--chimera_correction" falsevalue="" checked="False" help="Count chimeric variants and correct the variant frequencies."/>
42 <param name="softclipping_dist" type="integer" label="Distance between artifact and softclipping of the reads" min="1" value="15" help="Count mutation as an artifact if mutation lies within this parameter away from the softclipping part of the reads. Default = 20"/>
43 <param name="reads_threshold" type="float" label="Minimum percentage of softclipped reads in a family" min="0.0" max="1.0" value="1.0" help="Float number which specifies the minimum percentage of softclipped reads in a family to be considered in the softclipping tiers. Default: 1.0, means all reads of a family have to be softclipped."/>
39 </inputs> 44 </inputs>
40 <outputs> 45 <outputs>
41 <data name="output_xlsx" format="xlsx" label="${tool.name} on ${on_string}: XLSX summary"/> 46 <data name="output_xlsx" format="xlsx" label="${tool.name} on ${on_string}: XLSX summary"/>
42 <data name="outputFile_csv" format="csv" label="${tool.name} on ${on_string}: CSV summary"/>
43 <data name="output_xlsx2" format="xlsx" label="${tool.name} on ${on_string}: XLSX allele frequencies"/> 47 <data name="output_xlsx2" format="xlsx" label="${tool.name} on ${on_string}: XLSX allele frequencies"/>
44 <data name="output_xlsx3" format="xlsx" label="${tool.name} on ${on_string}: XLSX tiers"/> 48 <data name="output_xlsx3" format="xlsx" label="${tool.name} on ${on_string}: XLSX tiers"/>
45 </outputs> 49 </outputs>
46 <tests> 50 <tests>
47 <test> 51 <test>
49 <param name="file2" value="Interesting_Reads_test.trim.bam"/> 53 <param name="file2" value="Interesting_Reads_test.trim.bam"/>
50 <param name="file3" value="tag_count_dict_test.json"/> 54 <param name="file3" value="tag_count_dict_test.json"/>
51 <param name="file4" value="SSCS_counts_test.json"/> 55 <param name="file4" value="SSCS_counts_test.json"/>
52 <param name="thresh" value="0"/> 56 <param name="thresh" value="0"/>
53 <param name="phred" value="20"/> 57 <param name="phred" value="20"/>
54 <param name="trim5" value="10"/> 58 <param name="trim" value="10"/>
55 <param name="trim3" value="10"/> 59 <param name="chimera_correction"/>
60 <param name="softclipping_dist" value="15"/>
61 <param name="reads_threshold" value="1.0"/>
56 <output name="output_xlsx" file="Variant_Analyzer_summary_test.xlsx" decompress="true" lines_diff="10"/> 62 <output name="output_xlsx" file="Variant_Analyzer_summary_test.xlsx" decompress="true" lines_diff="10"/>
57 <output name="outputFile_csv" file="Variant_Analyzer_summary_test.csv" decompress="true" lines_diff="10"/>
58 <output name="output_xlsx2" file="Variant_Analyzer_allele_frequencies_test.xlsx" decompress="true" lines_diff="10"/> 63 <output name="output_xlsx2" file="Variant_Analyzer_allele_frequencies_test.xlsx" decompress="true" lines_diff="10"/>
59 <output name="output_xlsx3" file="Variant_Analyzer_tiers_test.xlsx" decompress="true" lines_diff="10"/> 64 <output name="output_xlsx3" file="Variant_Analyzer_tiers_test.xlsx" decompress="true" lines_diff="10"/>
60 </test> 65 </test>
61 </tests> 66 </tests>
62 <help> <![CDATA[ 67 <help> <![CDATA[
68 from the raw reads. 73 from the raw reads.
69 74
70 **Input** 75 **Input**
71 76
72 **Dataset 1:** VCF file with duplex consesus sequence (DCS) mutations. E.g. 77 **Dataset 1:** VCF file with duplex consesus sequence (DCS) mutations. E.g.
73 generated by the `FreeBayes <https://arxiv.org/abs/1207.3907>`_ or `LoFreq <https://academic.oup.com/nar/article/40/22/11189/1152727>`_ variant caller. 78 generated by the `FreeBayes variant caller <https://arxiv.org/abs/1207.3907>`_.
74 79
75 **Dataset 2:** BAM file of aligned raw reads. This file can be obtained by the 80 **Dataset 2:** BAM file of aligned raw reads. This file can be obtained by the
76 tool `Map with BWA-MEM <https://arxiv.org/abs/1303.3997>`_. 81 tool `Map with BWA-MEM <https://arxiv.org/abs/1303.3997>`_.
77 82
78 **Dataset 3:** JSON file generated by the **DCS mutations to tags/reads** tool 83 **Dataset 3:** JSON file generated by the **DCS mutations to tags/reads** tool
84 is called in the DCS. 89 is called in the DCS.
85 90
86 **Output** 91 **Output**
87 92
88 The output are three XLSX files containing frequencies stats for DCS mutations based 93 The output are three XLSX files containing frequencies stats for DCS mutations based
89 on information from the raw reads and a CSV file containing the summary information without color-coding. In addition to that a tier based 94 on information from the raw reads. In addition to that a tier based
90 classification is provided based on the amout of support for a true variant call. 95 classification is provided based on the amout of support for a true variant call.
91 96
92 ]]> 97 ]]>
93 </help> 98 </help>
94 <expand macro="citation" /> 99 <expand macro="citation" />