0
|
1 <?xml version="1.0"?>
|
|
2
|
|
3 <tool id="microarray_reports_1" name="Compute NGS/microarray concordance">
|
|
4 <description>over targeted regions in a genome</description>
|
|
5 <version_string>microarray_reports -v</version_string>
|
|
6 <command interpreter="perl">microarray_reports $__tool_data_path__ -q $out_discordant_bed $out_summary_table $input_ngs_calls $input_micro_calls $input_bam $target_gtf $ref_genome.fa $coverage_cutoff $target_bed</command>
|
|
7 <inputs>
|
|
8 <param format="achri_snp_table" name="input_ngs_calls" type="data" label="HGVS annotated NGS variant calls"/>
|
|
9 <param format="tabular" name="input_micro_calls" type="data" label="Microarray genotype calls. See help info below this form for required input format."/>
|
|
10 <param format="bam" name="input_bam" type="data" label="Mapped reads file (BAM) that was used to generate the NGS variant calls"/>
|
|
11 <param type="integer" name="coverage_cutoff" value="9" min="0" max="40" label="Report only positions with read depth greater than..."/>
|
|
12 <param name="ref_genome" type="genomebuild" label="Reference genome" help="against which the NGS variants were called"/>
|
|
13 <param format="gtf" name="target_gtf" type="data" label="Target regions" help="This must be the same (GTF) file used to define the coding regions for the HGVS annotation of the NGS variant calls"/>
|
|
14 <param format="bed" name="target_bed" type="data" label="Target sequencing regions" help="e.g. a BED file from the Shared Data 'Exome target regions' folder, corresponding the
|
|
15 to the capture kit used for sequencing the sample"/>
|
|
16 </inputs>
|
|
17 <outputs>
|
|
18 <data name="out_summary_table" format="tabular" label="Concordance summary (false positive rate, etc.)"/>
|
|
19 <data name="out_discordant_bed" format="bed" label="Discordant call locations"/>
|
|
20 </outputs>
|
|
21
|
|
22 <tests>
|
|
23 </tests>
|
|
24
|
|
25 <help>
|
|
26 **What it does**
|
|
27
|
|
28 This tool reports several statistics comparing the genotypes derived from a next-gen sequencing run to a microarray genotyping result
|
|
29 for the same individual. When coverage is good (10x for colorspace, 20x for base space), false positive and false negative rates should
|
|
30 be below 2%, assuming 99% accuracy of both the microarray and the NGS genotyping.
|
|
31
|
|
32 ------
|
|
33
|
|
34 ** Example**
|
|
35
|
|
36 The microarray file should have five columns (ProbeID, forward strand genotypes, dbSNP ID, chr, pos), e.g.::
|
|
37
|
|
38 #Comment lines...
|
|
39 Probe set header line
|
|
40 SNP_A-1780520 GG rs16994928 20 48440771
|
|
41 SNP_A-1780985 AG rs3859360 18 34178190
|
|
42 </help>
|
|
43
|
|
44 </tool>
|