Mercurial > repos > iuc > mageck_mle
comparison mageck_mle.xml @ 2:9cd937788131 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/mageck commit 49e456dda49db1f52fc876f406a10273a408b1a2
author | iuc |
---|---|
date | Wed, 04 Apr 2018 11:03:44 -0400 |
parents | 93f268840b0c |
children | b34c9d6373e0 |
comparison
equal
deleted
inserted
replaced
1:93f268840b0c | 2:9cd937788131 |
---|---|
28 | 28 |
29 #if $adv.cnv_norm: | 29 #if $adv.cnv_norm: |
30 --cnv-norm $adv.cnv_norm | 30 --cnv-norm $adv.cnv_norm |
31 #end if | 31 #end if |
32 | 32 |
33 --norm-method $adv.norm_method | 33 #if $adv.norm_method: |
34 --genes-varmodeling $adv.genes_var | 34 --norm-method $adv.norm_method |
35 --permutation-round $adv.permutation | 35 #end if |
36 --adjust-method $adv.adjust_method | 36 |
37 #if $adv.genes_var: | |
38 --genes-varmodeling $adv.genes_var | |
39 #end if | |
40 | |
41 #if $adv.permutation: | |
42 --permutation-round $adv.permutation | |
43 #end if | |
44 | |
45 #if $adv.adjust_method: | |
46 --adjust-method $adv.adjust_method | |
47 #end if | |
37 | 48 |
38 #if $adv.sgrnaeff_file: | 49 #if $adv.sgrnaeff_file: |
39 --sgrna-efficiency $adv.sgrnaeff_file | 50 --sgrna-efficiency $adv.sgrnaeff_file |
40 --sgrna-eff-name-column $adv.sgrnaid_col | 51 --sgrna-eff-name-column $adv.sgrnaid_col |
41 --sgrna-eff-score-column $adv.sgrnaeff_col | 52 --sgrna-eff-score-column $adv.sgrnaeff_col |
56 </param> | 67 </param> |
57 <when value="dmatrix"> | 68 <when value="dmatrix"> |
58 <param name="design_matrix" argument="--design-matrix" type="data" format="tabular" label="Design Matrix file" help="Provide a design matrix, either a file name or a quoted string of the design matrix. For example, 1,1;1,0. The row of the design matrix must match the order of the samples in the count table (if --include-samples is not specified), or the order of the samples by the --include-samples option" /> | 69 <param name="design_matrix" argument="--design-matrix" type="data" format="tabular" label="Design Matrix file" help="Provide a design matrix, either a file name or a quoted string of the design matrix. For example, 1,1;1,0. The row of the design matrix must match the order of the samples in the count table (if --include-samples is not specified), or the order of the samples by the --include-samples option" /> |
59 </when> | 70 </when> |
60 <when value="labels"> | 71 <when value="labels"> |
61 <param name="include_samples" argument="--include-samples" type="text" label="Sample labels" help="Specify the sample labels if the design matrix is not given by file in the --design-matrix option. Sample labels are separated by comma (,) and must match the labels in the count table" /> | 72 <param name="include_samples" argument="--include-samples" type="text" label="Sample labels" help="Specify the sample labels if the design matrix is not given by file in the --design-matrix option. Sample labels are separated by comma (,) and must match the labels in the count table"> |
62 <param name="day0_label" argument="--day0-label" type="text" format="tabular" optional="true" value="" label="Control sample" help="Specify the control sample label (usually day 0 or plasmid). For every other sample label, the MLE module will treat it as a single condition and generate an corresponding design matrix" /> | 73 <validator type="regex" message="Please only use letters, numbers or underscores in sample labels, and separate labels by commas">^[\w,]+$</validator> |
63 <param name="beta_labels" argument="--beta-labels" type="text" label="Variables" help="Specify the labels of the variables (i.e., beta), if the design matrix is not given by file in the --design-matrix option. Should be separated by commas (,), and the number of labels must equal to the number of columns of design matrix), including baseline labels. Default: bata_0,beta_1,beta_2,...." /> | 74 </param> |
75 <param name="day0_label" argument="--day0-label" type="text" format="tabular" optional="true" value="" label="Control sample" help="Specify the control sample label (usually day 0 or plasmid). For every other sample label, the MLE module will treat it as a single condition and generate an corresponding design matrix"> | |
76 <validator type="regex" message="Please only use letters, numbers or underscores in sample label">^[\w]+$</validator> | |
77 </param> | |
78 <param name="beta_labels" argument="--beta-labels" type="text" label="Variables" help="Specify the labels of the variables (i.e., beta), if the design matrix is not given by file in the --design-matrix option. Should be separated by commas (,), and the number of labels must equal to the number of columns of design matrix), including baseline labels. Default: bata_0,beta_1,beta_2,...."> | |
79 <validator type="regex" message="Please only use letters, numbers or underscores in labels, and separate labels by commas">^[\w,]+$</validator> | |
80 </param> | |
64 </when> | 81 </when> |
65 </conditional> | 82 </conditional> |
66 | 83 |
67 <section name="adv" title="Advanced Options"> | 84 <section name="adv" title="Advanced Options"> |
68 <param name="control_sgrna" argument="--control-sgrna" type="data" format="tabular" optional="true" label="Control sgRNAs file" help="A list of control sgRNAs for normalization and for generating the null distribution of RRA" /> | 85 <param name="control_sgrna" argument="--control-sgrna" type="data" format="tabular" optional="true" label="Control sgRNAs file" help="A list of control sgRNAs for normalization and for generating the null distribution of RRA" /> |
69 <param name="cnv_norm" argument="--cnv-norm" type="data" format="tabular" optional="true" label="CNV profile file" help="A matrix of copy number variation data across cell lines to normalize CNV-biased BetaScores" /> | 86 <param name="cnv_norm" argument="--cnv-norm" type="data" format="tabular" optional="true" label="CNV profile file" help="A matrix of copy number variation data across cell lines to normalize CNV-biased BetaScores" /> |
70 <param name="norm_method" argument="--norm-method" type="select" label="Method for normalization" help="If control is specified, the size factor will be estimated using control sgRNAs specified in --control-sgrna option. Default: Median" > | 87 <param name="norm_method" argument="--norm-method" type="select" optional="true" label="Method for normalization" help="If control is specified, the size factor will be estimated using control sgRNAs specified in --control-sgrna option. Default: Median" > |
88 <option value="median" selected="True">Median</option> | |
71 <option value="none">None</option> | 89 <option value="none">None</option> |
72 <option value="median" selected="True">Median</option> | |
73 <option value="total">Total</option> | 90 <option value="total">Total</option> |
74 <option value="control">Control</option> | 91 <option value="control">Control</option> |
75 </param> | 92 </param> |
76 <param name="genes_var" argument="--genes-varmodeling" type="integer" value="1000" label="Number of genes for mean-variance modeling" help="Default: 1000" /> | 93 <param name="genes_var" argument="--genes-varmodeling" type="integer" optional="true" label="Number of genes for mean-variance modeling" help="Default: 1000" /> |
77 <param name="permutation" argument="--permutation-round" type="integer" value="2" label="Number of permutations" help="The rounds for permutation. The permutation time is (# genes) * x for x rounds of permutation. Default: 2" /> | 94 <param name="permutation" argument="--permutation-round" type="integer" optional="true" label="Number of permutations" help="The rounds for permutation. The permutation time is (# genes) * x for x rounds of permutation. Default: 2" /> |
78 <param name="remove_outliers" argument="--remove-outliers" type="boolean" truevalue="--remove-outliers" falsevalue="" checked="false" optional="true" label="Try to remove outliers" help="Turning this option on will slow the algorithm" /> | 95 <param name="remove_outliers" argument="--remove-outliers" type="boolean" truevalue="--remove-outliers" falsevalue="" checked="false" optional="true" label="Try to remove outliers" help="Turning this option on will slow the algorithm" /> |
79 <param name="adjust_method" argument="--adjust-method" type="select" label="P-Value Adjustment Method" help="Method for sgRNA-level p-value adjustment, including False Discovery Rate (FDR), Holm's method (Holm), or Pounds's method (Pounds). Default: FDR"> | 96 <param name="adjust_method" argument="--adjust-method" type="select" optional="true" label="P-Value Adjustment Method" help="Method for sgRNA-level p-value adjustment, including False Discovery Rate (FDR), Holm's method (Holm), or Pounds's method (Pounds). Default: FDR"> |
80 <option value="fdr" selected="True">FDR</option> | 97 <option value="fdr">FDR</option> |
81 <option value="holm">Holm</option> | 98 <option value="holm">Holm</option> |
82 <option value="pounds">Pounds</option> | 99 <option value="pounds">Pounds</option> |
83 </param> | 100 </param> |
84 <param name="sgrnaeff_file" argument="--sgrna-efficiency" type="data" format="tabular" optional="true" label="sgRNA efficiency file" help="An optional file of sgRNA efficiency prediction. The efficiency prediction will be used as an initial guess of the probability an sgRNA is efficient. Must contain at least two columns, one containing sgRNA ID, the other containing sgRNA efficiency prediction" /> | 101 <param name="sgrnaeff_file" argument="--sgrna-efficiency" type="data" format="tabular" optional="true" label="sgRNA efficiency file" help="An optional file of sgRNA efficiency prediction. The efficiency prediction will be used as an initial guess of the probability an sgRNA is efficient. Must contain at least two columns, one containing sgRNA ID, the other containing sgRNA efficiency prediction" /> |
85 <param name="sgrnaeff_name_col" argument="--sgrna-eff-score-column" type="data_column" data_ref="sgrnaeff_file" value="1" optional="true" label="sgRNA score column" help="The sgRNA efficiency prediction column in sgRNA efficiency prediction file (specified by the --sgrna-efficiency option). Default is 1 (the second column)." /> | 102 <param name="sgrnaeff_name_col" argument="--sgrna-eff-score-column" type="data_column" data_ref="sgrnaeff_file" value="1" optional="true" label="sgRNA score column" help="The sgRNA efficiency prediction column in sgRNA efficiency prediction file (specified by the --sgrna-efficiency option). Default is 1 (the second column)." /> |
166 | 183 |
167 The optional Control sgRNAs file is used to generate null distribution when calculating the p values. If this option is not specified, MAGeCK generates the null distribution of RRA scores by assuming all of the genes in the library are non-essential, see **More Information** below. This approach is sometimes over-conservative, and you can improve this if you know some genes are not essential. By providing the corresponding sgRNA IDs in this option, MAGeCK will have a better estimation of p values. To use this option, you need to prepare a text file specifying the IDs of control sgRNAs, one line for one sgRNA ID. | 184 The optional Control sgRNAs file is used to generate null distribution when calculating the p values. If this option is not specified, MAGeCK generates the null distribution of RRA scores by assuming all of the genes in the library are non-essential, see **More Information** below. This approach is sometimes over-conservative, and you can improve this if you know some genes are not essential. By providing the corresponding sgRNA IDs in this option, MAGeCK will have a better estimation of p values. To use this option, you need to prepare a text file specifying the IDs of control sgRNAs, one line for one sgRNA ID. |
168 | 185 |
169 **Outputs** | 186 **Outputs** |
170 | 187 |
171 If successful, MAGeCK mle will generate two files, the gene_summary file (including gene beta scores), and the sgrna_summary file (including sgRNA efficiency probability predictions). | 188 This tool outputs |
172 | 189 |
173 **Gene summary file (including beta scores)** | 190 * a ranked sgRNA Summary file |
191 * a ranked Gene Summary file | |
192 | |
193 Optionally, under **Output Options** you can choose to output | |
194 | |
195 * a Log file of the analysis | |
196 | |
197 If successful, MAGeCK mle will generate two files, the Gene Summary file (including gene beta scores), and the sgRNA Summary file (including sgRNA efficiency probability predictions). | |
198 | |
199 **Gene Summary file (including beta scores)** | |
174 | 200 |
175 An example of the gene summary output file is below. This file includes the beta scores in two conditions specified in the design matrix (HL60|beta and KBM7|beta), and the associated statistics. For more information, check the output format specification of the **mageck test** *Gene Summary* file. | 201 An example of the gene summary output file is below. This file includes the beta scores in two conditions specified in the design matrix (HL60|beta and KBM7|beta), and the associated statistics. For more information, check the output format specification of the **mageck test** *Gene Summary* file. |
176 | 202 |
177 ======== ========= ============= ========== ================ ============ ===================== ================= ============= =========== ================ ============ ===================== ================= | 203 ======== ========= ============= ========== ================ ============ ===================== ================= ============= =========== ================ ============ ===================== ================= |
178 **Gene** **sgRNA** **HL60|beta** **HL60|z** **HL60|p-value** **HL60|fdr** **HL60|wald-p-value** **HL60|wald-fdr** **KBM7|beta** **KBM7|ze** **KBM7|p-value** **KBM7|fdr** **KBM7|wald-p-value** **KBM7|wald-fdr** | 204 **Gene** **sgRNA** **HL60|beta** **HL60|z** **HL60|p-value** **HL60|fdr** **HL60|wald-p-value** **HL60|wald-fdr** **KBM7|beta** **KBM7|ze** **KBM7|p-value** **KBM7|fdr** **KBM7|wald-p-value** **KBM7|wald-fdr** |
181 RNF10 10 0.10159 0.29373 0.92087 0.98235 0.76896 0.9999 0.11341 0.32794 0.90145 0.97365 0.74296 0.98421 | 207 RNF10 10 0.10159 0.29373 0.92087 0.98235 0.76896 0.9999 0.11341 0.32794 0.90145 0.97365 0.74296 0.98421 |
182 RNF11 10 3.6354 10.513 0.00028 0.021739 7.5197e-26 1.3376e-22 2.5928 7.4925 0.0014898 0.032024 6.7577e-14 1.33e-11 | 208 RNF11 10 3.6354 10.513 0.00028 0.021739 7.5197e-26 1.3376e-22 2.5928 7.4925 0.0014898 0.032024 6.7577e-14 1.33e-11 |
183 ======== ========= ============= ========== ================ ============ ===================== ================= ============= =========== ================ ============ ===================== ================= | 209 ======== ========= ============= ========== ================ ============ ===================== ================= ============= =========== ================ ============ ===================== ================= |
184 | 210 |
185 | 211 |
186 **sgRNA summary file (including sgRNA efficiency probability predictions)** | 212 **sgRNA Summary file (including sgRNA efficiency probability predictions)** |
187 | 213 |
188 An example of the sgRNA ranking output is as follows: | 214 An example of the sgRNA ranking output is as follows: |
189 | 215 |
190 ================ ======== ================= =================== ================ ============== ======= =============== =========== ========= ========= =========== ============== =========== ===================== | 216 ================ ======== ================= =================== ================ ============== ======= =============== =========== ========= ========= =========== ============== =========== ===================== |
191 **sgrna** **Gene** **control_count** **treatment_count** **control_mean** **treat_mean** **LFC** **control_var** **adj_var** **score** **p.low** **p.high** **p.twosided** **FDR** **high_in_treatment** | 217 **sgrna** **Gene** **control_count** **treatment_count** **control_mean** **treat_mean** **LFC** **control_var** **adj_var** **score** **p.low** **p.high** **p.twosided** **FDR** **high_in_treatment** |