Mercurial > repos > mheinzl > variant_analyzer2
comparison read2mut.xml @ 43:d21960b45a6b draft
planemo upload for repository https://github.com/Single-Molecule-Genetics/VariantAnalyzerGalaxy/tree/master/tools/variant_analyzer commit ee4a8e6cf290e6c8a4d55f9cd2839d60ab3b11c8
author | mheinzl |
---|---|
date | Tue, 02 Mar 2021 15:32:41 +0000 |
parents | da224c392a54 |
children | 8fbe6aba07e5 |
comparison
equal
deleted
inserted
replaced
42:da224c392a54 | 43:d21960b45a6b |
---|---|
1 <?xml version="1.0" encoding="UTF-8"?> | 1 <?xml version="1.0" encoding="UTF-8"?> |
2 <tool id="read2mut" name="Call specific mutations in reads:" version="2.0.4" profile="17.01"> | 2 <tool id="read2mut" name="Call specific mutations in reads:" version="2.1.0" profile="19.01"> |
3 <description>Looks for reads with mutation at known positions and calculates frequencies and stats.</description> | 3 <description>Looks for reads with mutation at known positions and calculates frequencies and stats.</description> |
4 <macros> | 4 <macros> |
5 <import>va_macros.xml</import> | 5 <import>va_macros.xml</import> |
6 </macros> | 6 </macros> |
7 <expand macro="requirements"> | 7 <requirements> |
8 <requirement type="package" version="2.7">python</requirement> | |
9 <requirement type="package" version="1.4.0">matplotlib</requirement> | |
10 <requirement type="package" version="0.15">pysam</requirement> | |
8 <requirement type="package" version="1.1.0">xlsxwriter</requirement> | 11 <requirement type="package" version="1.1.0">xlsxwriter</requirement> |
9 </expand> | 12 <requirement type="package" version="0.11.6">cyvcf2</requirement> |
13 </requirements> | |
10 <command><![CDATA[ | 14 <command><![CDATA[ |
11 ln -s '$file2' bam_input.bam && | 15 ln -s '$file2' bam_input.bam && |
12 ln -s '${file2.metadata.bam_index}' bam_input.bam.bai && | 16 ln -s '${file2.metadata.bam_index}' bam_input.bam.bai && |
13 python '$__tool_directory__/read2mut.py' | 17 python '$__tool_directory__/read2mut.py' |
14 --mutFile '$file1' | 18 --mutFile '$file1' |
15 --bamFile bam_input.bam | 19 --bamFile bam_input.bam |
16 --inputJson '$file3' | 20 --inputJson '$file3' |
17 --sscsJson '$file4' | 21 --sscsJson '$file4' |
18 --thresh '$thresh' | 22 --thresh '$thresh' |
19 --phred '$phred' | 23 --phred '$phred' |
20 --trim5 '$trim5' | 24 --trim '$trim' |
21 --trim3 '$trim3' | |
22 $chimera_correction | 25 $chimera_correction |
26 --softclipping_dist '$softclipping_dist' | |
27 --reads_threshold '$reads_threshold' | |
23 --outputFile '$output_xlsx' | 28 --outputFile '$output_xlsx' |
24 --outputFile_csv '$outputFile_csv' | |
25 --outputFile2 '$output_xlsx2' | 29 --outputFile2 '$output_xlsx2' |
26 --outputFile3 '$output_xlsx3' | 30 --outputFile3 '$output_xlsx3' |
27 ]]> | 31 ]]> |
28 </command> | 32 </command> |
29 <inputs> | 33 <inputs> |
31 <param name="file2" type="data" format="bam" label="BAM File of raw reads" optional="false" help="BAM file with aligned raw reads of selected tags."/> | 35 <param name="file2" type="data" format="bam" label="BAM File of raw reads" optional="false" help="BAM file with aligned raw reads of selected tags."/> |
32 <param name="file3" type="data" format="json" label="JSON File with DCS tag stats" optional="false" help="JSON file generated by DCS mutations to tags/reads"/> | 36 <param name="file3" type="data" format="json" label="JSON File with DCS tag stats" optional="false" help="JSON file generated by DCS mutations to tags/reads"/> |
33 <param name="file4" type="data" format="json" label="JSON File with SSCS tag stats" optional="false" help="JSON file generated by DCS mutations to SSCS stats."/> | 37 <param name="file4" type="data" format="json" label="JSON File with SSCS tag stats" optional="false" help="JSON file generated by DCS mutations to SSCS stats."/> |
34 <param name="thresh" type="integer" label="Tag count threshold" value="0" help="Integer threshold for displaying mutations. Only mutations occuring in DCS of less than thresh tags are displayed. Default of 0 displays all."/> | 38 <param name="thresh" type="integer" label="Tag count threshold" value="0" help="Integer threshold for displaying mutations. Only mutations occuring in DCS of less than thresh tags are displayed. Default of 0 displays all."/> |
35 <param name="phred" type="integer" label="Phred quality score threshold" min="0" max="41" value="20" help="Integer threshold for Phred quality score. Only reads higher than this threshold are considered. Default = 20."/> | 39 <param name="phred" type="integer" label="Phred quality score threshold" min="0" max="41" value="20" help="Integer threshold for Phred quality score. Only reads higher than this threshold are considered. Default = 20."/> |
36 <param name="trim5" type="integer" label="Trimming threshold at 5' end of reads" value="10" help="Integer threshold for assigning mutations at the beginning of reads to a lower tier. Default 10."/> | 40 <param name="trim" type="integer" label="Trimming threshold" value="10" help="Integer threshold for assigning mutations at start and end of reads to lower tier. Default 10."/> |
37 <param name="trim3" type="integer" label="Trimming threshold at 3' end of reads" value="10" help="Integer threshold for assigning mutations at the end of reads to a lower tier. Default 10."/> | |
38 <param name="chimera_correction" type="boolean" label="Apply chimera correction?" truevalue="--chimera_correction" falsevalue="" checked="False" help="Count chimeric variants and correct the variant frequencies."/> | 41 <param name="chimera_correction" type="boolean" label="Apply chimera correction?" truevalue="--chimera_correction" falsevalue="" checked="False" help="Count chimeric variants and correct the variant frequencies."/> |
42 <param name="softclipping_dist" type="integer" label="Distance between artifact and softclipping of the reads" min="1" value="15" help="Count mutation as an artifact if mutation lies within this parameter away from the softclipping part of the reads. Default = 20"/> | |
43 <param name="reads_threshold" type="float" label="Minimum percentage of softclipped reads in a family" min="0.0" max="1.0" value="1.0" help="Float number which specifies the minimum percentage of softclipped reads in a family to be considered in the softclipping tiers. Default: 1.0, means all reads of a family have to be softclipped."/> | |
39 </inputs> | 44 </inputs> |
40 <outputs> | 45 <outputs> |
41 <data name="output_xlsx" format="xlsx" label="${tool.name} on ${on_string}: XLSX summary"/> | 46 <data name="output_xlsx" format="xlsx" label="${tool.name} on ${on_string}: XLSX summary"/> |
42 <data name="outputFile_csv" format="csv" label="${tool.name} on ${on_string}: CSV summary"/> | |
43 <data name="output_xlsx2" format="xlsx" label="${tool.name} on ${on_string}: XLSX allele frequencies"/> | 47 <data name="output_xlsx2" format="xlsx" label="${tool.name} on ${on_string}: XLSX allele frequencies"/> |
44 <data name="output_xlsx3" format="xlsx" label="${tool.name} on ${on_string}: XLSX tiers"/> | 48 <data name="output_xlsx3" format="xlsx" label="${tool.name} on ${on_string}: XLSX tiers"/> |
45 </outputs> | 49 </outputs> |
46 <tests> | 50 <tests> |
47 <test> | 51 <test> |
49 <param name="file2" value="Interesting_Reads_test.trim.bam"/> | 53 <param name="file2" value="Interesting_Reads_test.trim.bam"/> |
50 <param name="file3" value="tag_count_dict_test.json"/> | 54 <param name="file3" value="tag_count_dict_test.json"/> |
51 <param name="file4" value="SSCS_counts_test.json"/> | 55 <param name="file4" value="SSCS_counts_test.json"/> |
52 <param name="thresh" value="0"/> | 56 <param name="thresh" value="0"/> |
53 <param name="phred" value="20"/> | 57 <param name="phred" value="20"/> |
54 <param name="trim5" value="10"/> | 58 <param name="trim" value="10"/> |
55 <param name="trim3" value="10"/> | 59 <param name="chimera_correction"/> |
60 <param name="softclipping_dist" value="15"/> | |
61 <param name="reads_threshold" value="1.0"/> | |
56 <output name="output_xlsx" file="Variant_Analyzer_summary_test.xlsx" decompress="true" lines_diff="10"/> | 62 <output name="output_xlsx" file="Variant_Analyzer_summary_test.xlsx" decompress="true" lines_diff="10"/> |
57 <output name="outputFile_csv" file="Variant_Analyzer_summary_test.csv" decompress="true" lines_diff="10"/> | |
58 <output name="output_xlsx2" file="Variant_Analyzer_allele_frequencies_test.xlsx" decompress="true" lines_diff="10"/> | 63 <output name="output_xlsx2" file="Variant_Analyzer_allele_frequencies_test.xlsx" decompress="true" lines_diff="10"/> |
59 <output name="output_xlsx3" file="Variant_Analyzer_tiers_test.xlsx" decompress="true" lines_diff="10"/> | 64 <output name="output_xlsx3" file="Variant_Analyzer_tiers_test.xlsx" decompress="true" lines_diff="10"/> |
60 </test> | 65 </test> |
61 </tests> | 66 </tests> |
62 <help> <![CDATA[ | 67 <help> <![CDATA[ |
68 from the raw reads. | 73 from the raw reads. |
69 | 74 |
70 **Input** | 75 **Input** |
71 | 76 |
72 **Dataset 1:** VCF file with duplex consesus sequence (DCS) mutations. E.g. | 77 **Dataset 1:** VCF file with duplex consesus sequence (DCS) mutations. E.g. |
73 generated by the `FreeBayes <https://arxiv.org/abs/1207.3907>`_ or `LoFreq <https://academic.oup.com/nar/article/40/22/11189/1152727>`_ variant caller. | 78 generated by the `FreeBayes variant caller <https://arxiv.org/abs/1207.3907>`_. |
74 | 79 |
75 **Dataset 2:** BAM file of aligned raw reads. This file can be obtained by the | 80 **Dataset 2:** BAM file of aligned raw reads. This file can be obtained by the |
76 tool `Map with BWA-MEM <https://arxiv.org/abs/1303.3997>`_. | 81 tool `Map with BWA-MEM <https://arxiv.org/abs/1303.3997>`_. |
77 | 82 |
78 **Dataset 3:** JSON file generated by the **DCS mutations to tags/reads** tool | 83 **Dataset 3:** JSON file generated by the **DCS mutations to tags/reads** tool |
84 is called in the DCS. | 89 is called in the DCS. |
85 | 90 |
86 **Output** | 91 **Output** |
87 | 92 |
88 The output are three XLSX files containing frequencies stats for DCS mutations based | 93 The output are three XLSX files containing frequencies stats for DCS mutations based |
89 on information from the raw reads and a CSV file containing the summary information without color-coding. In addition to that a tier based | 94 on information from the raw reads. In addition to that a tier based |
90 classification is provided based on the amout of support for a true variant call. | 95 classification is provided based on the amout of support for a true variant call. |
91 | 96 |
92 ]]> | 97 ]]> |
93 </help> | 98 </help> |
94 <expand macro="citation" /> | 99 <expand macro="citation" /> |