Mercurial > repos > lparsons > sam_stats
comparison sam-stats.xml @ 1:a51942c74761 draft
planemo upload for repository https://github.com/lparsons/galaxy_tools/tree/master/tools/sam_stats commit 394834f8f34909961cfbf6252fefbdc63342d78d
author | lparsons |
---|---|
date | Mon, 13 Jul 2015 11:45:51 -0400 |
parents | b9e7569a4438 |
children | da985dad64c0 |
comparison
equal
deleted
inserted
replaced
0:b9e7569a4438 | 1:a51942c74761 |
---|---|
1 <tool id="sam_stats" name="sam-stats" version="1.32"> | 1 <tool id="sam_stats" name="sam-stats" version="0.1"> |
2 <description> - Compute statistics from SAM or BAM files</description> | 2 <description> - Compute statistics from SAM or BAM files</description> |
3 | |
3 <requirements> | 4 <requirements> |
4 <requirement type="package" version="1.1.2-484">ea-utils</requirement> | 5 <requirement type="package" version="1.1.2-484">ea-utils</requirement> |
5 </requirements> | 6 </requirements> |
6 <command> | 7 |
8 <stdio> | |
9 <exit_code range="1:" level="fatal" description="Unknown error occurred" /> | |
10 </stdio> | |
11 | |
12 <command><![CDATA[ | |
7 sam-stats | 13 sam-stats |
8 $trackMultAlign | 14 $trackMultAlign |
9 $reportAllChr | 15 $reportAllChr |
10 #if $rnaSeqStats: | 16 #if $rnaSeqStats: |
11 -R $rnaSeqStatsFile | 17 -R $rnaSeqStatsFile |
13 #if $input.extension == "bam": | 19 #if $input.extension == "bam": |
14 -B | 20 -B |
15 #end if | 21 #end if |
16 -S $histBinSize | 22 -S $histBinSize |
17 $input | 23 $input |
18 > $samStats | 24 > $samStats |
25 ]]> | |
19 </command> | 26 </command> |
27 | |
20 <inputs> | 28 <inputs> |
21 <param format="sam,bam" name="input" type="data" label="SAM/BAM File" /> | 29 <param format="sam, bam" name="input" type="data" label="SAM/BAM File" /> |
22 <param name="trackMultAlign" type="boolean" value="False" truevalue="-D" falsevalue="" label="Keep track of multiple alignments (slower!)" /> | 30 <param name="trackMultAlign" type="boolean" value="False" truevalue="-D" falsevalue="" label="Keep track of multiple alignments (slower!)" /> |
23 <param name="reportAllChr" type="boolean" value="False" truevalue="-A" falsevalue="" label="Report all chr sigs, even if there are more than 1000" /> | 31 <param name="reportAllChr" type="boolean" value="False" truevalue="-A" falsevalue="" label="Report all chr sigs, even if there are more than 1000" /> |
24 <!-- <param name="numReadsSubsample" type="integer" value="1000000" min="1" max="1000000" label="Number of reads to sample for per-base statistics (max 1,000,000)" /> --> | 32 <!-- <param name="numReadsSubsample" type="integer" value="1000000" min="1" max="1000000" label="Number of reads to sample for per-base statistics (max 1,000,000)" /> --> |
25 <param name="histBinSize" type="integer" value="30" min="1" label="Number of bins per chromosome for reads by chromosome "histogram"" /> | 33 <param name="histBinSize" type="integer" value="30" min="1" label="Number of bins per chromosome for reads by chromosome "histogram"" /> |
26 <param name="rnaSeqStats" type="boolean" value="False" label="Output RNA-Seq statistics (coverage, 3 prime bias, etc.)" /> | 34 <param name="rnaSeqStats" type="boolean" value="False" label="Output RNA-Seq statistics (coverage, 3 prime bias, etc.)" /> |
30 <data format="tabular" name="samStats" label="${tool.name} on ${on_string}"/> | 38 <data format="tabular" name="samStats" label="${tool.name} on ${on_string}"/> |
31 <data format="tabular" name="rnaSeqStatsFile" label="${tool.name} on ${on_string} (RNA-Seq Stats)"> <filter>rnaSeqStats</filter> | 39 <data format="tabular" name="rnaSeqStatsFile" label="${tool.name} on ${on_string} (RNA-Seq Stats)"> <filter>rnaSeqStats</filter> |
32 </data> | 40 </data> |
33 </outputs> | 41 </outputs> |
34 | 42 |
35 <stdio> | |
36 <exit_code range="1:" level="fatal" description="Unknown error occurred" /> | |
37 </stdio> | |
38 | |
39 <tests> | 43 <tests> |
40 <test> | 44 <test> |
41 <param name="input" value="test.sam" /> | 45 <param name="input" value="test.sam" /> |
42 <output name="samStats" file="testout.txt" /> | 46 <output name="samStats" file="testout.txt" /> |
43 </test> | 47 </test> |
44 </tests> | 48 </tests> |
45 | 49 |
46 <help> | 50 <help><![CDATA[ |
47 Overview | 51 Overview |
48 -------- | 52 -------- |
49 sam-stats computes varius statics on SAM/BAM alignment files. | 53 sam-stats computes varius statics on SAM/BAM alignment files. |
50 | 54 |
51 Complete Stats:: | 55 Complete Stats:: |
52 | 56 |
53 <STATS> : mean, max, stdev, median, Q1 (25 percentile), Q3 | 57 <STATS> : mean, max, stdev, median, Q1 (25 percentile), Q3 |
54 reads : # of entries in the sam file, might not be # reads | 58 reads : # of entries in the sam file, might not be # reads |
55 phred : phred scale used | 59 phred : phred scale used |
56 bsize : # reads used for qual stats | 60 bsize : # reads used for qual stats |
57 mapped reads : number of aligned reads (unique probe id sequences) | 61 mapped reads : number of aligned reads (unique probe id sequences) |
58 mapped bases : total of the lengths of the aligned reads | 62 mapped bases : total of the lengths of the aligned reads |
60 reverse : number of reverse-aligned reads | 64 reverse : number of reverse-aligned reads |
61 snp rate : mismatched bases / total bases | 65 snp rate : mismatched bases / total bases |
62 ins rate : insert bases / total bases | 66 ins rate : insert bases / total bases |
63 del rate : deleted bases / total bases | 67 del rate : deleted bases / total bases |
64 pct mismatch : percent of reads that have mismatches | 68 pct mismatch : percent of reads that have mismatches |
65 len <STATS> : read length stats, ignored if fixed-length | 69 len <STATS> : read length stats, ignored if fixed-length |
66 mapq <STATS> : stats for mapping qualities | 70 mapq <STATS> : stats for mapping qualities |
67 insert <STATS> : stats for insert sizes | 71 insert <STATS> : stats for insert sizes |
68 <CHR> : percentage of mapped bases per chr, followed by a signature | 72 <CHR> : percentage of mapped bases per chr, followed by a signature |
69 | 73 |
70 Subsampled stats (1M reads max):: | 74 Subsampled stats (1M reads max):: |
71 | 75 |
72 base qual <STATS> : stats for base qualities | 76 base qual <STATS> : stats for base qualities |
73 A,T,C,G : base percentages | 77 A,T,C,G : base percentages |
74 | 78 |
75 Meaning of the per-chromosome signature: | 79 Meaning of the per-chromosome signature: |
76 | 80 |
77 A ascii-histogram of mapped reads by chromosome position. It is only output if the original SAM/BAM has a header. The values are the log2 of the # of mapped reads at each position + ascii '0'. | 81 A ascii-histogram of mapped reads by chromosome position. It is only output if the original SAM/BAM has a header. The values are the log2 of the # of mapped reads at each position + ascii '0'. |
78 | 82 |
79 See http://code.google.com/p/ea-utils/wiki/SamStatsDetails for more information on each stat, how it's calculated and what it means. | 83 See http://code.google.com/p/ea-utils/wiki/SamStatsDetails for more information on each stat, how it's calculated and what it means. |
80 | 84 |
81 This tool uses the sam-stats program that is part of the ea-utils suite. See http://code.google.com/p/ea-utils/wiki/SamStats for details. | 85 This tool uses the sam-stats program that is part of the ea-utils suite. See http://code.google.com/p/ea-utils/wiki/SamStats for details. |
86 ]]> | |
82 </help> | 87 </help> |
88 | |
89 <citations> | |
90 <citation type="bibtex"> | |
91 @article{aronesty_comparison_2013, | |
92 title = {Comparison of {Sequencing} {Utility} {Programs}}, | |
93 volume = {7}, | |
94 issn = {18750362}, | |
95 url = {http://benthamopen.com/ABSTRACT/TOBIOIJ-7-1}, | |
96 doi = {10.2174/1875036201307010001}, | |
97 language = {en}, | |
98 number = {1}, | |
99 urldate = {2015-07-10}, | |
100 journal = {The Open Bioinformatics Journal}, | |
101 author = {Aronesty, Erik}, | |
102 month = jan, | |
103 year = {2013}, | |
104 pages = {1--8} | |
105 } | |
106 </citation> | |
107 </citations> | |
108 | |
83 </tool> | 109 </tool> |