annotate tools/human_genome_variation/snpFreq.xml @ 2:c2a356708570

Uploaded
author xuebing
date Fri, 09 Mar 2012 19:45:42 -0500
parents 9071e359b9a3
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
1 <tool id="hgv_snpFreq" name="snpFreq" version="1.0.0">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
2 <description>significant SNPs in case-control data</description>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
3
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
4 <command interpreter="perl">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
5 snpFreq2.pl $input $group1_1 $group1_2 $group1_3 $group2_1 $group2_2 $group2_3 0.05 $output
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
6 </command>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
7
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
8 <inputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
9 <param format="tabular" name="input" type="data" label="Dataset" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
10 <param name="group1_1" label="Column with genotype 1 count for group 1" type="data_column" data_ref="input" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
11 <param name="group1_2" label="Column with genotype 2 count for group 1" type="data_column" data_ref="input" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
12 <param name="group1_3" label="Column with genotype 3 count for group 1" type="data_column" data_ref="input" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
13 <param name="group2_1" label="Column with genotype 1 count for group 2" type="data_column" data_ref="input" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
14 <param name="group2_2" label="Column with genotype 2 count for group 2" type="data_column" data_ref="input" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
15 <param name="group2_3" label="Column with genotype 3 count for group 2" type="data_column" data_ref="input" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
16 </inputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
17
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
18 <outputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
19 <data format="tabular" name="output" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
20 </outputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
21
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
22 <requirements>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
23 <requirement type="binary">R</requirement>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
24 </requirements>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
25
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
26 <tests>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
27 <test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
28 <param name="input" ftype="tabular" value="snpFreqInput.txt" dbkey="hg18" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
29 <param name="group1_1" value="4" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
30 <param name="group1_2" value="5" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
31 <param name="group1_3" value="6" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
32 <param name="group2_1" value="7" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
33 <param name="group2_2" value="8" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
34 <param name="group2_3" value="9" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
35 <output name="output" file="snpFreqTestOut.txt" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
36 </test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
37 </tests>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
38
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
39 <help>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
40
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
41 **Dataset formats**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
42
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
43 The input is tabular_, with six columns of genotype counts (three per group). The output is also tabular,
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
44 and includes all of the input data plus the additional columns described below.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
45 (`Dataset missing?`_)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
46
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
47 .. _tabular: ./static/formatHelp.html#tab
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
48 .. _Dataset missing?: ./static/formatHelp.html
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
49
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
50 -----
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
51
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
52 **What it does**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
53
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
54 This tool performs a basic analysis of bi-allelic SNPs in case-control
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
55 data, using the R statistical environment and Fisher's exact test to
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
56 identify SNPs with a significant difference in the allele frequencies
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
57 between the two groups. R's "qvalue" package is used to correct for
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
58 multiple testing.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
59
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
60 The input file includes counts for each genotype (AA, aa, Aa)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
61 for each group at each SNP position. The assignment of codes (1 2 3)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
62 to these genotypes is arbitrary, as long as it is consistent for both
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
63 groups. Any other input columns are ignored in the computation, but
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
64 are copied to the output. The output appends eight additional columns,
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
65 namely the minimum expected counts of the three genotypes for each
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
66 group, the p-value, and the q-value.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
67
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
68 -----
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
69
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
70 **Example**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
71
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
72 - input file::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
73
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
74 chr1 210 211 38 4 15 56 0 1 x
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
75 chr1 228 229 55 0 2 56 0 1 x
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
76 chr1 230 231 46 0 11 55 0 2 x
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
77 chr1 234 235 43 0 14 55 0 2 x
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
78 chr1 236 237 55 0 2 13 10 34 x
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
79 chr1 437 438 55 0 2 46 0 11 x
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
80 chr1 439 440 56 0 1 55 0 2 x
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
81 chr1 449 450 56 0 1 13 20 24 x
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
82 chr1 518 519 56 0 1 38 4 15 x
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
83
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
84 Here the group 1 genotype counts are in columns 4 - 6, while those
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
85 for group 2 are in columns 7 - 9.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
86
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
87 Note that the "x" column has no meaning. It was added to this example
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
88 to show that extra columns can be included, and to make it easier
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
89 to see where the new columns are appended in the output.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
90
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
91 - output file::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
92
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
93 chr1 210 211 38 4 15 56 0 1 x 47 2 8 47 2 8 1.50219088598917e-05 6.32501425679652e-06
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
94 chr1 228 229 55 0 2 56 0 1 x 55.5 0 1.5 55.5 0 1.5 1 0.210526315789474
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
95 chr1 230 231 46 0 11 55 0 2 x 50.5 0 6.5 50.5 0 6.5 0.0155644201009862 0.00409590002657532
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
96 chr1 234 235 43 0 14 55 0 2 x 49 0 8 49 0 8 0.00210854461554067 0.000739840215979182
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
97 chr1 236 237 55 0 2 13 10 34 x 34 5 18 34 5 18 6.14613878554783e-17 4.31307984950725e-17
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
98 chr1 437 438 55 0 2 46 0 11 x 50.5 0 6.5 50.5 0 6.5 0.0155644201009862 0.00409590002657532
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
99 chr1 439 440 56 0 1 55 0 2 x 55.5 0 1.5 55.5 0 1.5 1 0.210526315789474
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
100 chr1 449 450 56 0 1 13 20 24 x 34.5 10 12.5 34.5 10 12.5 2.25757007974134e-18 2.37638955762246e-18
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
101 chr1 518 519 56 0 1 38 4 15 x 47 2 8 47 2 8 1.50219088598917e-05 6.32501425679652e-06
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
102
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
103 </help>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
104 </tool>