Mercurial > repos > greg > vsnp_statistics
annotate vsnp_statistics.xml @ 27:c9208cc0f5dd draft
"planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_statistics commit 7f5ebaad2e650c53a8980e8567fe9943f9ccabb6"
author | greg |
---|---|
date | Mon, 15 Nov 2021 23:15:14 +0000 |
parents | b908bb18008a |
children | e219f5c06dc0 |
rev | line source |
---|---|
16 | 1 <tool id="vsnp_statistics" name="vSNP: statistics" version="@WRAPPER_VERSION@.2+galaxy0" profile="@PROFILE@"> |
0 | 2 <description></description> |
4 | 3 <macros> |
4 <import>macros.xml</import> | |
5 </macros> | |
0 | 6 <requirements> |
8 | 7 <expand macro="biopython_requirement"/> |
8 <expand macro="numpy_requirement"/> | |
9 <expand macro="openpyxl_requirement"/> | |
10 <expand macro="pandas_requirement"/> | |
11 <expand macro="xlrd_requirement"/> | |
0 | 12 </requirements> |
13 <command detect_errors="exit_code"><![CDATA[ | |
14 #import re | |
4 | 15 |
8 | 16 #if $input_type_cond.input_type in ["single", "pair"]: |
17 #set read1 = $input_type_cond.read1 | |
0 | 18 #set read1_identifier = re.sub('[^\s\w\-]', '_', str($read1.element_identifier)) |
4 | 19 ln -s '${read1}' '${read1_identifier}' && |
8 | 20 #if $input_type_cond.input_type == "pair": |
21 #set read2 = $input_type_cond.read2 | |
4 | 22 #set read2_identifier = re.sub('[^\s\w\-]', '_', str($read2.element_identifier)) |
23 ln -s '${read2}' '${read2_identifier}' && | |
0 | 24 #end if |
25 #else: | |
18 | 26 #set identifier = re.sub('[^\s\w\-]', '_', str($input_type_cond.reads_collection.element_identifier)) |
16 | 27 #set read1 = $input_type_cond.reads_collection.forward |
18 | 28 #set read1_identifier = $identifier + '_R1' |
8 | 29 ln -s '${read1}' '${read1_identifier}' && |
16 | 30 #set read2 = $input_type_cond.reads_collection.reverse |
18 | 31 #set read2_identifier = $identifier + '_R2' |
8 | 32 ln -s '${read2}' '${read2_identifier}' && |
0 | 33 #end if |
4 | 34 |
0 | 35 python '$__tool_directory__/vsnp_statistics.py' |
8 | 36 --read1 '${read1_identifier}' |
16 | 37 #if $input_type_cond.input_type in ["pair", "paired"]: |
8 | 38 --read2 '${read2_identifier}' |
0 | 39 #end if |
8 | 40 #if $read1.is_of_type('fastqsanger.gz'): |
41 --gzipped | |
42 #end if | |
43 --dbkey '$samtools_idxstats.metadata.dbkey' | |
44 --samtools_idxstats '$samtools_idxstats' | |
45 --vsnp_azc_metrics '$vsnp_azc_metrics' | |
1 | 46 --output '$output' |
0 | 47 ]]></command> |
48 <inputs> | |
49 <conditional name="input_type_cond"> | |
50 <param name="input_type" type="select" label="Choose the category of the files to be analyzed"> | |
8 | 51 <option value="single" selected="true">Single files</option> |
52 <option value="paired">Paired reads</option> | |
53 <option value="pair">Paired reads in separate data sets</option> | |
0 | 54 </param> |
8 | 55 <when value="single"> |
56 <param name="read1" type="data" format="fastqsanger.gz,fastqsanger" label="Read1 fastq file"/> | |
4 | 57 </when> |
8 | 58 <when value="paired"> |
59 <param name="reads_collection" type="data_collection" format="fastqsanger,fastqsanger.gz" collection_type="paired" label="Collection of fastqsanger paired read files"/> | |
60 </when> | |
61 <when value="pair"> | |
62 <param name="read1" type="data" format="fastqsanger.gz,fastqsanger" label="Read1 fastq file"/> | |
63 <param name="read2" type="data" format="fastqsanger.gz,fastqsanger" label="Read2 fastq file"/> | |
0 | 64 </when> |
65 </conditional> | |
8 | 66 <param name="samtools_idxstats" type="data" format="tabular" label="Samtools idxstats file"/> |
67 <param name="vsnp_azc_metrics" type="data" format="tabular" label="vSNP: add zero coverage metrics file"/> | |
0 | 68 </inputs> |
69 <outputs> | |
5
d0fbdeaaa488
"planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_statistics commit 770e89322a15829580ed9577a853660f63233f32"
greg
parents:
4
diff
changeset
|
70 <data name="output" format="tabular"/> |
0 | 71 </outputs> |
72 <tests> | |
4 | 73 <!-- A single fastq file --> |
74 <test expect_num_outputs="1"> | |
8 | 75 <param name="input_type" value="single"/> |
4 | 76 <param name="read1" value="Mcap_Deer_DE_SRR650221.fastq.gz" ftype="fastqsanger.gz" dbkey="89"/> |
77 <param name="samtools_idxstats" value="samtools_idxstats1.tabular" ftype="tabular" dbkey="89"/> | |
8 | 78 <param name="vsnp_azc_metrics" value="add_zc_metrics1.tabular" ftype="tabular" dbkey="89"/> |
25 | 79 <output name="output" file="vsnp_statistics1.tabular" ftype="tabular" compare="contains"/> |
4 | 80 </test> |
81 <!-- A set of paired fastq files --> | |
82 <test expect_num_outputs="1"> | |
8 | 83 <param name="input_type" value="pair"/> |
0 | 84 <param name="read1" value="13-1941-6_S4_L001_R1_600000.fastq.gz" ftype="fastqsanger.gz" dbkey="89"/> |
85 <param name="read2" value="13-1941-6_S4_L001_R2_600000.fastq.gz" ftype="fastqsanger.gz" dbkey="89"/> | |
4 | 86 <param name="samtools_idxstats" value="samtools_idxstats2.tabular" ftype="tabular" dbkey="89"/> |
8 | 87 <param name="vsnp_azc_metrics" value="add_zc_metrics2.tabular" ftype="tabular" dbkey="89"/> |
25 | 88 <output name="output" file="vsnp_statistics2.tabular" ftype="tabular" compare="contains"/> |
4 | 89 </test> |
8 | 90 <!-- A collection of paired fastq files --> |
4 | 91 <test expect_num_outputs="1"> |
8 | 92 <param name="input_type" value="paired"/> |
4 | 93 <param name="reads_collection"> |
94 <collection type="paired"> | |
95 <element name="forward" value="13-1941-6_S4_L001_R1_600000.fastq.gz" ftype="fastqsanger.gz"/> | |
96 <element name="reverse" value="13-1941-6_S4_L001_R2_600000.fastq.gz" ftype="fastqsanger.gz"/> | |
97 </collection> | |
98 </param> | |
8 | 99 <param name="samtools_idxstats" value="samtools_idxstats5.tabular" ftype="tabular" dbkey="89"/> |
100 <param name="vsnp_azc_metrics" value="add_zc_metrics5.tabular" ftype="tabular" dbkey="89"/> | |
25 | 101 <output name="output" file="vsnp_statistics4.tabular" ftype="tabular" compare="contains"/> |
0 | 102 </test> |
103 </tests> | |
104 <help> | |
105 **What it does** | |
106 | |
4 | 107 Accepts associated fastq files, SAMtools idxstats files and **vSNP: add zero coverage** metrics files and extracts information from them |
20
d4ef7003c539
"planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_statistics commit a08a9977ae1ac36c46b9fb7898bd4b5c4c302c11"
greg
parents:
18
diff
changeset
|
108 to produce a tabular file containing statistics for each sample. The samples can be a single read, a single set of paired reads in |
d4ef7003c539
"planemo upload for repository https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/sequence_analysis/vsnp/vsnp_statistics commit a08a9977ae1ac36c46b9fb7898bd4b5c4c302c11"
greg
parents:
18
diff
changeset
|
109 separate datasets or a collection of paired reads. The output statistics include reference, file size, mean read length, mean read quality, |
4 | 110 reads passing Q30, total reads, all mapped reads, unmapped reads, unmapped reads percentage of total, reference with coverage, average depth |
111 of coverage and good SNP count. | |
0 | 112 </help> |
4 | 113 <expand macro="citations"/> |
0 | 114 </tool> |
115 |