Mercurial > repos > grau > dimont_deprecated
comparison DimontWeb.xml @ 0:5130880b8e0a draft
Uploaded
| author | grau |
|---|---|
| date | Tue, 12 Nov 2013 12:55:52 -0500 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| -1:000000000000 | 0:5130880b8e0a |
|---|---|
| 1 <tool id="Dimont" name="Dimont" version="0.1" force_history_refresh="true"> | |
| 2 <description>- a universal tool for de-novo motif discovery.</description> | |
| 3 <command>java -Xms256M -Xmx2G -jar \$JAR_PATH/DimontWeb.jar --run $script_file $summary $summary.id $__new_file_path__ $summary.extra_files_path</command> | |
| 4 <inputs> | |
| 5 <param type="text" size="40" name="Dimont_jobname" label="Job name" value="" optional="true" help="Please enter a name for your job that should be used in the history (optional)"> | |
| 6 </param> | |
| 7 <param type="data" format="fasta" name="Dimont_ps_Input_sequences" label="<hr />Input sequences" help="The input sequences for de-novo motif discovery (can be uploaded using "GetData" -> "Upload File"), annotated FastA format. The required format is described in the help section." value="" optional="false"> | |
| 8 </param> | |
| 9 | |
| 10 <param type="text" size="40" name="Dimont_ps_Position_tag" label="Position tag" help="The tag for the position information in the FastA-annotation of the input file" value="" optional="false"> | |
| 11 </param> | |
| 12 | |
| 13 <param type="text" size="40" name="Dimont_ps_Value_tag" label="Value tag" help="The tag for the value information in the FastA-annotation of the input file" value="" optional="false"> | |
| 14 </param> | |
| 15 | |
| 16 <param type="float" name="Dimont_ps_Standard_deviation" label="Standard deviation" help="The standard deviation of the position distribution centered at the position specified by the position tag" value="75.0" optional="false"> | |
| 17 <validator type="in_range" min="1.0" max="10000.0" message="Value is not in the specified range [1.0, 10000.0]."/></param> | |
| 18 | |
| 19 <param type="text" size="40" name="Dimont_ps_Weighting_factor" label="Weighting factor" help="The value for weighting the data; either a value between 0 and 1, or a description relative to the standard deviation (e.g. +4sd)" value="0.2" optional="false"> | |
| 20 </param> | |
| 21 | |
| 22 <param type="integer" name="Dimont_ps_Starts" label="<hr />Starts" help="The number of pre-optimization runs." value="20" optional="false"> | |
| 23 <validator type="in_range" min="1" max="100" message="Value is not in the specified range [1, 100]."/></param> | |
| 24 | |
| 25 <param type="integer" name="Dimont_ps_Initial_motif_width" label="<hr />Initial motif width" help="The motif width that is used initially, may be adjusted during optimization." value="15" optional="false"> | |
| 26 <validator type="in_range" min="1" max="50" message="Value is not in the specified range [1, 50]."/></param> | |
| 27 | |
| 28 <param type="integer" name="Dimont_ps_Markov_order_of_motif_model" label="Markov order of motif model" help="The Markov order of the model for the motif." value="0" optional="false"> | |
| 29 <validator type="in_range" min="0" max="3" message="Value is not in the specified range [0, 3]."/></param> | |
| 30 | |
| 31 <param type="integer" name="Dimont_ps_Markov_order_of_background_model" label="Markov order of background model" help="The Markov order of the model for the background sequence and the background sequence, -1 defines uniform distribution." value="-1" optional="false"> | |
| 32 <validator type="in_range" min="-1" max="5" message="Value is not in the specified range [-1, 5]."/></param> | |
| 33 | |
| 34 <param type="float" name="Dimont_ps_Equivalent_sample_size" label="<hr />Equivalent sample size" help="Reflects the strength of the prior on the model parameters." value="4.0" optional="false"> | |
| 35 <validator type="in_range" min="0.0" max="Infinity" message="Value is not in the specified range [0.0, Infinity]."/></param> | |
| 36 | |
| 37 <param type="boolean" name="Dimont_ps_Delete_BSs_from_profile" label="Delete BSs from profile" help="A switch for deleting binding site positions of discovered motifs from the profile before searching for futher motifs." checked="True" optional="false"> | |
| 38 </param> | |
| 39 | |
| 40 </inputs> | |
| 41 <requirements> | |
| 42 <requirement type="set_environment">JAR_PATH</requirement> | |
| 43 <requirement type="binary" version=">=1.6">java</requirement> | |
| 44 </requirements> | |
| 45 <configfiles> | |
| 46 <configfile name="script_file"> | |
| 47 <Dimont_ps_Input_sequences> | |
| 48 <value> | |
| 49 ${Dimont_ps_Input_sequences}</value> | |
| 50 <extension> | |
| 51 ${Dimont_ps_Input_sequences.ext}</extension> | |
| 52 </Dimont_ps_Input_sequences> | |
| 53 | |
| 54 <Dimont_ps_Position_tag> | |
| 55 ${Dimont_ps_Position_tag}</Dimont_ps_Position_tag> | |
| 56 | |
| 57 <Dimont_ps_Value_tag> | |
| 58 ${Dimont_ps_Value_tag}</Dimont_ps_Value_tag> | |
| 59 | |
| 60 <Dimont_ps_Standard_deviation> | |
| 61 ${Dimont_ps_Standard_deviation}</Dimont_ps_Standard_deviation> | |
| 62 | |
| 63 <Dimont_ps_Weighting_factor> | |
| 64 ${Dimont_ps_Weighting_factor}</Dimont_ps_Weighting_factor> | |
| 65 | |
| 66 <Dimont_ps_Starts> | |
| 67 ${Dimont_ps_Starts}</Dimont_ps_Starts> | |
| 68 | |
| 69 <Dimont_ps_Initial_motif_width> | |
| 70 ${Dimont_ps_Initial_motif_width}</Dimont_ps_Initial_motif_width> | |
| 71 | |
| 72 <Dimont_ps_Markov_order_of_motif_model> | |
| 73 ${Dimont_ps_Markov_order_of_motif_model}</Dimont_ps_Markov_order_of_motif_model> | |
| 74 | |
| 75 <Dimont_ps_Markov_order_of_background_model> | |
| 76 ${Dimont_ps_Markov_order_of_background_model}</Dimont_ps_Markov_order_of_background_model> | |
| 77 | |
| 78 <Dimont_ps_Equivalent_sample_size> | |
| 79 ${Dimont_ps_Equivalent_sample_size}</Dimont_ps_Equivalent_sample_size> | |
| 80 | |
| 81 <Dimont_ps_Delete_BSs_from_profile> | |
| 82 ${Dimont_ps_Delete_BSs_from_profile}</Dimont_ps_Delete_BSs_from_profile> | |
| 83 | |
| 84 </configfile> | |
| 85 </configfiles> | |
| 86 <outputs> | |
| 87 <data format="html" name="summary" label="#if str($Dimont_jobname) == '' then $tool.name + ' on ' + $on_string else $Dimont_jobname#"> | |
| 88 </data> | |
| 89 </outputs> | |
| 90 <tests> | |
| 91 <test> | |
| 92 <param name="Dimont_jobname" value="Test" /> | |
| 93 <param name="Dimont_ps_Input_sequences" value="dimont_test.fasta" /> | |
| 94 <param name="Dimont_ps_Position_tag" value="peakSummit" /> | |
| 95 <param name="Dimont_ps_Value_tag" value="maxT" /> | |
| 96 <param name="Dimont_ps_Standard_deviation" value="75.0" /> | |
| 97 <param name="Dimont_ps_Weighting_factor" value="0.2" /> | |
| 98 <param name="Dimont_ps_Starts" value="20" /> | |
| 99 <param name="Dimont_ps_Initial_motif_width" value="15" /> | |
| 100 <param name="Dimont_ps_Markov_order_of_motif_model" value="0" /> | |
| 101 <param name="Dimont_ps_Markov_order_of_background_model" value="-1" /> | |
| 102 <param name="Dimont_ps_Equivalent_sample_size" value="4.0" /> | |
| 103 <param name="Dimont_ps_Delete_BSs_from_profile" value="True" /> | |
| 104 <output name="summary" file="Test/Test_html.html" /> | |
| 105 </test> | |
| 106 </tests> | |
| 107 <help> | |
| 108 **Dimont** is a universal tool for de-novo motif discovery. Dimont has successfully been applied to ChIP-seq, ChIP-exo and protein-binding microarray (PBM) data. | |
| 109 | |
| 110 Input sequences must be supplied in an annotated FastA format as a file uploaded by the "Upload File" task in section "Get Data" of Galaxy or generated using the "Dimont Data Extractor" tool. | |
| 111 In the annotation of each sequence, you need to provide a value that reflects the confidence that this sequence is bound by the factor of interest. | |
| 112 Such confidences may be peak statistics (e.g., number of fragments under a peak) for ChIP data or signal intensities for PBM data. In addition, you need to provide an anchor position within the sequence. | |
| 113 In case of ChIP data, this anchor position could for instance be the peak summit. | |
| 114 For instance, an annotated FastA file for ChIP-exo data comprising sequences of length 100 centered around the peak summit could look like:: | |
| 115 | |
| 116 > peak: 50; signal: 515 | |
| 117 ggccatgtgtatttttttaaatttccac... | |
| 118 > peak: 50; signal: 199 | |
| 119 GGTCCCCTGGGAGGATGGGGACGTGCTG... | |
| 120 ... | |
| 121 | |
| 122 where the anchor point is given as 50 for the first two sequences, and the confidence amounts to 515 and 199, respectively. | |
| 123 The FastA comment may contain additional annotations of the format ``key1 : value1; key2: value2;...``. | |
| 124 We also provide an example_ input file and a Perl script_ for preparing data in the format required by Dimont. | |
| 125 | |
| 126 Accordingly, you would need to set the parameter "Position tag" to ``peak`` and the parameter "Value tag" to ``signal`` for the input file. | |
| 127 | |
| 128 For the standard deviation of the position prior, the initial motif length and the number of pre-optimization runs, we provide default values that worked well in our studies on ChIP and PBM data. | |
| 129 However, you may want adjust these parameters to meet your prior information. | |
| 130 | |
| 131 The parameter "Markov order of the motif model" sets the order of the inhomogeneous Markov model used for modeling the motif. If this parameter is set to ``0``, you obtain a position weight matrix (PWM) model. | |
| 132 If it is set to ``1``, you obtain a weight array matrix (WAM) model. You can set the order of the motif model to at most ``3``. | |
| 133 | |
| 134 The parameter "Markov order of the background model" sets the order of the homogeneous Markov model used for modeling positions not covered by a motif. | |
| 135 If this parameter is set to ``-1``, you obtain a uniform distribution, which worked well for ChIP data. For PBM data, orders of up to ``4`` resulted in an increased prediction performance in our case studies. The maximum allowed value is ``5``. | |
| 136 | |
| 137 The parameter "Weighting factor" defines the proportion of sequences that you expect to be bound by the targeted factor with high confidence. For ChIP data, the default value of ``0.2`` typically works well. | |
| 138 For PBM data, containing a large number of unspecific probes, this parameter should be set to a lower value, e.g. ``0.01``. | |
| 139 | |
| 140 The "Equivalent sample size" reflects the strength of the influence of the prior on the model parameters, where higher values smooth out the parameters to a greater extent. | |
| 141 | |
| 142 The parameter "Delete BSs from profile" defines if BSs of already discovered motifs should be deleted, i.e., "blanked out", from the sequence before searching for futher motifs. | |
| 143 | |
| 144 You can also install this web-application within your local Galaxy server. Instructions can be found at the Dimont_ page of Jstacs. | |
| 145 There you can also download a command line version of Dimont. | |
| 146 | |
| 147 If you experience problems using Dimont, please contact_ us. | |
| 148 | |
| 149 .. _example: http://www.jstacs.de/downloads/dimont-example.fa | |
| 150 .. _script: http://www.jstacs.de/index.php/Dimont#Data_preparation | |
| 151 .. _Dimont: http://jstacs.de/index.php/Dimont | |
| 152 .. _contact: mailto:grau@informatik.uni-halle.de | |
| 153 </help> | |
| 154 </tool> | |
| 155 |
