Mercurial > repos > galaxy-australia > alphafold2
comparison alphafold.xml @ 20:6ab1a261520a draft
planemo upload for repository https://github.com/usegalaxy-au/tools-au commit c3a90eb12ada44d477541baa4dd6182be29cd554-dirty
author | galaxy-australia |
---|---|
date | Sun, 28 Jul 2024 20:09:55 +0000 |
parents | 2f7702fd0a4c |
children | e7f1b552a695 |
comparison
equal
deleted
inserted
replaced
19:2f7702fd0a4c | 20:6ab1a261520a |
---|---|
1 <tool id="alphafold" name="Alphafold 2" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="20.01"> | 1 <tool id="alphafold" name="Alphafold 2" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="22.05"> |
2 <description> - AI-guided 3D structural prediction of proteins</description> | 2 <description> - AI-guided 3D structural prediction of proteins</description> |
3 <macros> | 3 <macros> |
4 <token name="@TOOL_VERSION@">2.3.1</token> | 4 <token name="@TOOL_VERSION@">2.3.2</token> |
5 <token name="@TOOL_MINOR_VERSION@">2.3</token> | 5 <token name="@TOOL_MINOR_VERSION@">2.3</token> |
6 <token name="@VERSION_SUFFIX@">5</token> | 6 <token name="@VERSION_SUFFIX@">0</token> |
7 <import>macro_output.xml</import> | 7 <import>macro_output.xml</import> |
8 <import>macro_test_output.xml</import> | 8 <import>macro_test_output.xml</import> |
9 </macros> | 9 </macros> |
10 <edam_topics> | 10 <edam_topics> |
11 <edam_topic>topic_0082</edam_topic> | 11 <edam_topic>topic_0082</edam_topic> |
15 </edam_operations> | 15 </edam_operations> |
16 <xrefs> | 16 <xrefs> |
17 <xref type="bio.tools">alphafold_2</xref> | 17 <xref type="bio.tools">alphafold_2</xref> |
18 </xrefs> | 18 </xrefs> |
19 <requirements> | 19 <requirements> |
20 <container type="docker">neoformit/alphafold:v2.3.1_2</container> | 20 <container type="docker">neoformit/alphafold:v2.3.2_0</container> |
21 </requirements> | 21 </requirements> |
22 <required_files> | 22 <required_files> |
23 <include path="scripts/outputs.py" /> | 23 <include path="scripts/outputs.py" /> |
24 <include path="scripts/validate_fasta.py" /> | 24 <include path="scripts/validate_fasta.py" /> |
25 <include path="alphafold.html" /> | 25 <include path="scripts/alphafold.html" /> |
26 </required_files> | 26 </required_files> |
27 <command detect_errors="exit_code"><![CDATA[ | 27 <command detect_errors="exit_code"><![CDATA[ |
28 | 28 |
29 ## Developers: to test with mock alphafold run, set `export PLANEMO_TESTING=1` | 29 ## Developers: to test with mock alphafold run, set `export PLANEMO_TESTING=1` |
30 ## in planemo's gx_venv_n/bin/activate script. AlphaFold outputs will be copied | 30 ## in planemo's gx_venv_n/bin/activate script. AlphaFold outputs will be copied |
44 #end if | 44 #end if |
45 | 45 |
46 && python3 '$__tool_directory__/scripts/validate_fasta.py' input.fasta | 46 && python3 '$__tool_directory__/scripts/validate_fasta.py' input.fasta |
47 --min_length \${ALPHAFOLD_AA_LENGTH_MIN:-0} | 47 --min_length \${ALPHAFOLD_AA_LENGTH_MIN:-0} |
48 --max_length \${ALPHAFOLD_AA_LENGTH_MAX:-0} | 48 --max_length \${ALPHAFOLD_AA_LENGTH_MAX:-0} |
49 #if $model_preset == 'multimer': | 49 #if $model_preset.selection == 'multimer': |
50 --multimer | 50 --multimer |
51 --max-sequences \${ALPHAFOLD_MAX_SEQUENCES:-10} | 51 --max-sequences \${ALPHAFOLD_MAX_SEQUENCES:-10} |
52 #end if | 52 #end if |
53 > alphafold.fasta | 53 > alphafold.fasta |
54 | 54 |
58 && export TODAY=`date +"%Y-%m-%d"` | 58 && export TODAY=`date +"%Y-%m-%d"` |
59 | 59 |
60 ## Run AlphaFold ------------------------------------------------------------- | 60 ## Run AlphaFold ------------------------------------------------------------- |
61 #if os.environ.get('PLANEMO_TESTING'): | 61 #if os.environ.get('PLANEMO_TESTING'): |
62 ## Run in testing mode (mocks a successful AlphaFold run by copying outputs) | 62 ## Run in testing mode (mocks a successful AlphaFold run by copying outputs) |
63 && echo "Creating dummy outputs for model_preset=$model_preset..." | 63 && echo "Creating dummy outputs for model_preset=$model_preset.selection..." |
64 && bash '$__tool_directory__/scripts/mock_alphafold.sh' $model_preset | 64 && bash '$__tool_directory__/scripts/mock_alphafold.sh' $model_preset |
65 #else: | 65 #else: |
66 ## Run AlphaFold | 66 ## Run AlphaFold |
67 && python /app/alphafold/run_alphafold.py | 67 && python /app/alphafold/run_alphafold.py |
68 --fasta_paths alphafold.fasta | 68 --fasta_paths alphafold.fasta |
69 --output_dir output | 69 --output_dir output |
70 --data_dir \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/ | 70 --data_dir \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/ |
71 --model_preset=$model_preset | 71 --model_preset=$model_preset.selection |
72 | 72 |
73 ## Set reference database paths | 73 ## Set reference database paths |
74 --uniref90_database_path \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/uniref90/uniref90.fasta | 74 --uniref90_database_path \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/uniref90/uniref90.fasta |
75 --mgnify_database_path \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/mgnify/mgy_clusters_2022_05.fa | 75 --mgnify_database_path \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/mgnify/mgy_clusters_2022_05.fa |
76 --template_mmcif_dir \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/pdb_mmcif/mmcif_files | 76 --template_mmcif_dir \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/pdb_mmcif/mmcif_files |
81 #else | 81 #else |
82 --db_preset=reduced_dbs | 82 --db_preset=reduced_dbs |
83 --small_bfd_database_path \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/small_bfd/bfd-first_non_consensus_sequences.fasta | 83 --small_bfd_database_path \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/small_bfd/bfd-first_non_consensus_sequences.fasta |
84 #end if | 84 #end if |
85 | 85 |
86 #if $max_template_date: | 86 #if $advanced.max_template_date: |
87 --max_template_date=$max_template_date | 87 --max_template_date=$advanced.max_template_date |
88 #else | 88 #else |
89 --max_template_date=\$TODAY | 89 --max_template_date=\$TODAY |
90 #end if | 90 #end if |
91 | 91 |
92 --use_gpu_relax=\${ALPHAFOLD_USE_GPU:-True} ## introduced in v2.1.2 | 92 --use_gpu_relax=\${ALPHAFOLD_USE_GPU:-True} |
93 | 93 |
94 #if $model_preset == 'multimer': | 94 #if $model_preset.selection == 'multimer': |
95 --pdb_seqres_database_path=\${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/pdb_seqres/pdb_seqres.txt | 95 --pdb_seqres_database_path=\${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/pdb_seqres/pdb_seqres.txt |
96 --uniprot_database_path=\${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/uniprot/uniprot.fasta | 96 --uniprot_database_path=\${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/uniprot/uniprot.fasta |
97 --num_multimer_predictions_per_model=1 ## introduced in v2.2.0 | 97 --num_multimer_predictions_per_model=$model_preset.num_multimer_predictions_per_model |
98 #else | 98 #else |
99 --pdb70_database_path \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/pdb70/pdb70 | 99 --pdb70_database_path \${ALPHAFOLD_DB:-/data}/@TOOL_MINOR_VERSION@/pdb70/pdb70 |
100 #end if | 100 #end if |
101 | |
102 ## Galaxy-specific options -------------------------------------------- | |
103 ## See https://github.com/neoformit/alphafold/tree/release_2.3.2_galaxy | |
104 #if $advanced.disable_amber_relax: | |
105 --disable_amber_relax | |
106 #end if | |
107 | |
108 #if $advanced.limit_model_outputs: | |
109 --output_models=$limit_model_outputs | |
110 #end if | |
111 ## End Galaxy-specific options ---------------------------------------- | |
112 | |
101 #end if | 113 #end if |
102 | 114 |
103 ## Generate additional outputs ------------------------------------------------ | 115 ## Generate additional outputs ------------------------------------------------ |
104 && python3 '$__tool_directory__/scripts/outputs.py' output/alphafold | 116 && python3 '$__tool_directory__/scripts/outputs.py' output/alphafold |
105 $outputs.plddts | 117 $outputs.plddts |
106 $outputs.model_pkls | 118 $outputs.model_pkls |
107 $outputs.pae_csv | 119 $outputs.pae_csv |
108 $outputs.plots | 120 $outputs.plots |
109 #if $model_preset == 'multimer': | 121 #if $model_preset.selection == 'multimer': |
110 --multimer | 122 --multimer |
111 #end if | 123 #end if |
112 | 124 |
113 ## HTML output | 125 ## HTML output |
114 && mkdir -p '${ html.files_path }' | 126 && mkdir -p '${ html.files_path }' |
115 && cp '$__tool_directory__/alphafold.html' '${html}' | 127 && cp output/alphafold/extra/alphafold.html '${html}' |
116 && cp output/alphafold/ranked_*.pdb '${html.files_path}' | 128 && cp output/alphafold/ranked_*.pdb '${html.files_path}' |
117 | 129 |
118 ## This is a (hacky) fix for a bug that has appeared in multiple Pulsar servers. | 130 ## This is a (hacky) fix for a bug that has appeared in multiple Pulsar servers. |
119 ## The working directory ends up two levels deep and the visualization html page | 131 ## The working directory ends up two levels deep and the visualization html page |
120 ## fails to load the PDB files as static assets. | 132 ## fails to load the PDB files as static assets. |
134 <param name="fasta_text" type="text" area="true" value="" label="Paste sequence" help="Paste single protein sequence into the textbox. If you wish to fold multiple proteins, submit individual jobs for each protein. If you wish to run AlphaFold multimer, please supply multiple sequences in FASTA format." /> | 146 <param name="fasta_text" type="text" area="true" value="" label="Paste sequence" help="Paste single protein sequence into the textbox. If you wish to fold multiple proteins, submit individual jobs for each protein. If you wish to run AlphaFold multimer, please supply multiple sequences in FASTA format." /> |
135 </when> | 147 </when> |
136 </conditional> | 148 </conditional> |
137 | 149 |
138 <param | 150 <param |
139 name="max_template_date" | |
140 type="text" | |
141 label="Max template date (yyyy-mm-dd) (optional)" | |
142 help="The model will reference PDB structures deposited before this date only. Defaults to today's date." | |
143 optional="true" | |
144 > | |
145 <sanitizer> | |
146 <valid initial="string.digits"> | |
147 <add value="-" /> | |
148 </valid> | |
149 </sanitizer> | |
150 <validator type="regex">[0-9]{4}-[0-9]{2}-[0-9]{2}</validator> | |
151 </param> | |
152 | |
153 <param | |
154 name="dbs" | 151 name="dbs" |
155 type="select" | 152 type="select" |
156 display="radio" | 153 display="radio" |
157 label="Select database" | 154 label="Select database" |
158 help="The reduced database allows significantly faster run time in | 155 help="The reduced database allows significantly faster run time in |
160 > | 157 > |
161 <option value="reduced" selected="true">Reduced database</option> | 158 <option value="reduced" selected="true">Reduced database</option> |
162 <option value="full">Full database</option> | 159 <option value="full">Full database</option> |
163 </param> | 160 </param> |
164 | 161 |
162 <conditional name="model_preset"> | |
165 <param | 163 <param |
166 name="model_preset" | 164 name="selection" |
167 type="select" | 165 type="select" |
168 label="Model preset" | 166 label="Model preset" |
169 help="Select which prediction model to run. The monomer model is the most accurate for single protein prediction. The multimer model allows prediction of protein complexes." | 167 help="Select which prediction model to run. The monomer model is the most accurate for single protein prediction. The multimer model allows prediction of protein complexes." |
170 > | 168 > |
171 <option value="monomer" selected="true">monomer - default prediction model</option> | 169 <option value="monomer" selected="true">monomer - default prediction model</option> |
174 </option> | 172 </option> |
175 <option value="multimer"> | 173 <option value="multimer"> |
176 multimer - model a protein complex (requires multi-sequence FASTA input) | 174 multimer - model a protein complex (requires multi-sequence FASTA input) |
177 </option> | 175 </option> |
178 </param> | 176 </param> |
177 <when value="monomer"></when> | |
178 <when value="monomer_ptm"></when> | |
179 <when value="multimer"> | |
180 <param | |
181 name="num_multimer_predictions_per_model" | |
182 type="integer" | |
183 value="5" | |
184 label="Multimer predictions per model" | |
185 help="How many predictions (each with a different random seed) will be generated per model. E.g. if this is 2 and there are 5 models then there will be 10 predictions per input. For a small drop in accuracy you may wish to run a single seed per model (default 5, max 10)." | |
186 min="1" | |
187 max="10" | |
188 /> | |
189 </when> | |
190 </conditional> | |
191 | |
192 <section name="advanced" title="Advanced options" expanded="false"> | |
193 <param | |
194 name="max_template_date" | |
195 type="text" | |
196 label="Max template date (yyyy-mm-dd) (optional)" | |
197 help="The model will reference PDB structures deposited before this date only. Defaults to today's date." | |
198 optional="true" | |
199 > | |
200 <sanitizer> | |
201 <valid initial="string.digits"> | |
202 <add value="-" /> | |
203 </valid> | |
204 </sanitizer> | |
205 <validator type="regex">[0-9]{4}-[0-9]{2}-[0-9]{2}</validator> | |
206 </param> | |
207 | |
208 <param | |
209 name="disable_amber_relax" | |
210 type="boolean" | |
211 label="Disable Amber relaxation" | |
212 value="false" | |
213 optional="true" | |
214 help="Amber relaxation can be disabled to speed up processing time. Amber relaxation is used to refine predicted structures by removing stereochemical violations, resulting in more accurate prediction of side-chain geometry. Disabling this option with large proteins may lead to artefacts in the predicted structure. Disabling amber relax will result in the unrelaxed models being collected as PDB outputs." | |
215 /> | |
216 | |
217 <param | |
218 name="limit_model_outputs" | |
219 type="integer" | |
220 label="Limit model outputs" | |
221 value="5" | |
222 help="Limit the number of models to output. The top N models will be output, where N is the value entered here (default 5). Please note that the top-ranking model is not always the correct one, and it is usually recommended to inspect multiple models. Reducing the number of models will result in a slight reduction in run time." | |
223 min="1" | |
224 max="5" | |
225 /> | |
226 </section> | |
179 | 227 |
180 <section name="outputs" title="Optional outputs" expanded="false"> | 228 <section name="outputs" title="Optional outputs" expanded="false"> |
181 <param | 229 <param |
182 name="plots" | 230 name="plots" |
183 type="boolean" | 231 type="boolean" |
225 name="relax_json" | 273 name="relax_json" |
226 type="boolean" | 274 type="boolean" |
227 checked="false" | 275 checked="false" |
228 label="relax_metrics.json" | 276 label="relax_metrics.json" |
229 help="A JSON-formatted text file containing relax metrics (mostly remaining violations)." | 277 help="A JSON-formatted text file containing relax metrics (mostly remaining violations)." |
278 /> | |
279 <param | |
280 name="timings_json" | |
281 type="boolean" | |
282 checked="false" | |
283 label="timings.json" | |
284 help="A JSON file with timings reported for each phase of the AlphaFold run." | |
230 /> | 285 /> |
231 </section> | 286 </section> |
232 </inputs> | 287 </inputs> |
233 | 288 |
234 <outputs> | 289 <outputs> |
239 <expand macro="output_confidence_scores" /> | 294 <expand macro="output_confidence_scores" /> |
240 <expand macro="output_pickles" /> | 295 <expand macro="output_pickles" /> |
241 <expand macro="output_pae_csv" /> | 296 <expand macro="output_pae_csv" /> |
242 <expand macro="output_plots" /> | 297 <expand macro="output_plots" /> |
243 <expand macro="output_relax_json" /> | 298 <expand macro="output_relax_json" /> |
299 <expand macro="output_timings_json" /> | |
244 </outputs> | 300 </outputs> |
245 | 301 |
246 <tests> | 302 <tests> |
247 <!-- Test monomer with default outputs --> | 303 <!-- Test monomer with default outputs --> |
248 <test expect_num_outputs="6"> | 304 <test expect_num_outputs="6"> |
249 <conditional name="fasta_or_text"> | 305 <conditional name="fasta_or_text"> |
250 <param name="input_mode" value="history"/> | 306 <param name="input_mode" value="history"/> |
251 <param name="fasta_file" value="test1.fasta"/> | 307 <param name="fasta_file" value="test1.fasta"/> |
252 </conditional> | 308 </conditional> |
253 <param name="model_preset" value="monomer"/> | 309 <param name="model_preset|selection" value="monomer"/> |
254 <expand macro="test_output_pdb_models" /> | 310 <expand macro="test_output_pdb_models" /> |
255 </test> | 311 </test> |
256 | 312 |
257 <!-- Test monomer with all outputs --> | 313 <!-- Test monomer with all outputs --> |
258 <test expect_num_outputs="19"> | 314 <test expect_num_outputs="19"> |
259 <conditional name="fasta_or_text"> | 315 <conditional name="fasta_or_text"> |
260 <param name="input_mode" value="history"/> | 316 <param name="input_mode" value="history"/> |
261 <param name="fasta_file" value="test1.fasta"/> | 317 <param name="fasta_file" value="test1.fasta"/> |
262 </conditional> | 318 </conditional> |
263 <param name="model_preset" value="monomer"/> | 319 <param name="model_preset|selection" value="monomer"/> |
264 <param name="outputs|plots" value="true"/> | 320 <param name="outputs|plots" value="true"/> |
265 <param name="outputs|confidence_scores" value="true"/> | 321 <param name="outputs|confidence_scores" value="true"/> |
266 <param name="outputs|plddts" value="true"/> | 322 <param name="outputs|plddts" value="true"/> |
267 <param name="outputs|pae_csv" value="true"/> | 323 <param name="outputs|pae_csv" value="true"/> |
268 <param name="outputs|model_pkls" value="true"/> | 324 <param name="outputs|model_pkls" value="true"/> |
279 <test expect_num_outputs="24"> | 335 <test expect_num_outputs="24"> |
280 <conditional name="fasta_or_text"> | 336 <conditional name="fasta_or_text"> |
281 <param name="input_mode" value="history"/> | 337 <param name="input_mode" value="history"/> |
282 <param name="fasta_file" value="test1.fasta"/> | 338 <param name="fasta_file" value="test1.fasta"/> |
283 </conditional> | 339 </conditional> |
284 <param name="model_preset" value="monomer_ptm"/> | 340 <param name="model_preset|selection" value="monomer_ptm"/> |
285 <param name="outputs|plots" value="true"/> | 341 <param name="outputs|plots" value="true"/> |
286 <param name="outputs|confidence_scores" value="true"/> | 342 <param name="outputs|confidence_scores" value="true"/> |
287 <param name="outputs|plddts" value="true"/> | 343 <param name="outputs|plddts" value="true"/> |
288 <param name="outputs|pae_csv" value="true"/> | 344 <param name="outputs|pae_csv" value="true"/> |
289 <param name="outputs|model_pkls" value="true"/> | 345 <param name="outputs|model_pkls" value="true"/> |
301 <test expect_num_outputs="24"> | 357 <test expect_num_outputs="24"> |
302 <conditional name="fasta_or_text"> | 358 <conditional name="fasta_or_text"> |
303 <param name="input_mode" value="history"/> | 359 <param name="input_mode" value="history"/> |
304 <param name="fasta_file" value="multimer.fasta"/> | 360 <param name="fasta_file" value="multimer.fasta"/> |
305 </conditional> | 361 </conditional> |
306 <param name="model_preset" value="multimer"/> | 362 <param name="model_preset|selection" value="multimer"/> |
307 <param name="outputs|plots" value="true"/> | 363 <param name="outputs|plots" value="true"/> |
308 <param name="outputs|confidence_scores" value="true"/> | 364 <param name="outputs|confidence_scores" value="true"/> |
309 <param name="outputs|plddts" value="true"/> | 365 <param name="outputs|plddts" value="true"/> |
310 <param name="outputs|pae_csv" value="true"/> | 366 <param name="outputs|pae_csv" value="true"/> |
311 <param name="outputs|model_pkls" value="true"/> | 367 <param name="outputs|model_pkls" value="true"/> |
312 <param name="outputs|relax_json" value="true"/> | 368 <param name="outputs|relax_json" value="true"/> |
369 <param name="outputs|timings_json" value="true"/> | |
313 <expand macro="test_output_plots_3" /> | 370 <expand macro="test_output_plots_3" /> |
314 <expand macro="test_output_confidence_scores" /> | 371 <expand macro="test_output_confidence_scores" /> |
315 <expand macro="test_output_plddts" /> | 372 <expand macro="test_output_plddts" /> |
316 <expand macro="test_output_pdb_models" /> | 373 <expand macro="test_output_pdb_models" /> |
317 <expand macro="test_output_pickles" /> | 374 <expand macro="test_output_pickles" /> |
318 <expand macro="test_output_relax_json" /> | 375 <expand macro="test_output_relax_json" /> |
376 <expand macro="test_output_timings_json" /> | |
319 <expand macro="test_output_pae_csv" /> | 377 <expand macro="test_output_pae_csv" /> |
320 </test> | 378 </test> |
321 </tests> | 379 </tests> |
322 <help><![CDATA[ | 380 <help><![CDATA[ |
323 | 381 |
324 .. class:: infomark | 382 .. class:: infomark |
325 | 383 |
326 | AlphaFold v2: AI-guided 3D structural prediction of proteins | 384 | AlphaFold v2: AI-guided 3D structural prediction of proteins |
327 | | 385 | |
328 | **NOTE: this tool packages AlphaFold v2.3.1.** | 386 | **NOTE: this tool packages** `a modified branch of AlphaFold v2.3.2. <https://github.com/neoformit/alphafold/tree/release_2.3.2_galaxy>`_ |
329 | | 387 | |
330 | This means that the neural network has been trained on PDBs with a release | 388 | This means that the neural network has been trained on PDBs with a release |
331 | date before 2021-09-30 (the training cutoff was 2018-04-30 until ``v2.3.0``). | 389 | date before 2021-09-30 (the training cutoff was 2018-04-30 until ``v2.3.0``). |
332 | | 390 | |
333 | Find out more in the technical and release notes: | 391 | Find out more in the technical and release notes: |
334 | | 392 | |
335 | 393 |
336 - `Release notes for v2.3.1 <https://github.com/deepmind/alphafold/releases/tag/v2.3.1>`_ | 394 - `Release notes for v2.3.2 <https://github.com/deepmind/alphafold/releases/tag/v2.3.2>`_ |
337 - `Technical notes for v2.3 <https://github.com/deepmind/alphafold/blob/main/docs/technical_note_v2.3.0.md>`_ | 395 - `Technical notes for v2.3 <https://github.com/deepmind/alphafold/blob/main/docs/technical_note_v2.3.0.md>`_ |
338 | |
339 | If you want to use AlphaFold trained against an older cutoff date, switch to Galaxy version ``2.1.2`` (which was trained to data up to 2018-04-30). | |
340 | | |
341 | 396 |
342 **What it does** | 397 **What it does** |
343 | 398 |
344 *What is AlphaFold?* | 399 *What is AlphaFold?* |
345 | 400 |
360 | 415 |
361 | AlphaFold monomer (default) accepts a **single amino acid sequence** in FASTA format. | 416 | AlphaFold monomer (default) accepts a **single amino acid sequence** in FASTA format. |
362 | You can choose to input either a file from your Galaxy history or paste a sequence into a text box. | 417 | You can choose to input either a file from your Galaxy history or paste a sequence into a text box. |
363 | If you choose the ``multimer`` option, you can supply a FASTA file containing **multiple sequences** to be folded concurrently into a multimer. | 418 | If you choose the ``multimer`` option, you can supply a FASTA file containing **multiple sequences** to be folded concurrently into a multimer. |
364 | | 419 | |
420 | For pairwise screening of target-candidate with multimer, you can submit a list of paired protein sequences in batch mode (i.e. two protein sequences in each FASTA file). | |
365 | | 421 | |
366 | 422 |
367 **Outputs** | 423 **Outputs** |
368 | 424 |
369 *Visualization* | 425 *Visualization* |
378 | 434 |
379 | | 435 | |
380 | 436 |
381 *PDB files* | 437 *PDB files* |
382 | 438 |
383 | Five PDB (Protein Data Bank) files are be created, ordered by rank, as predicted by AlphaFold. | 439 | PDB (Protein Data Bank) files (5 by default) are be created, ordered by rank, as predicted by AlphaFold. The tool produces 5 models by default, but this can be reduced with the "Limit model outputs" for a reduced run time. |
384 | These files describe the molecular structures and can be used for downstream analysis. e.g. *in silico* molecular docking. | 440 | These files describe the molecular structures and can be used for downstream analysis. e.g. *in silico* molecular docking. |
385 | **PLEASE NOTE** that all outputs have been renamed to their respective rank order, including model and model.pkl files. | 441 | **PLEASE NOTE** that all outputs have been renamed to their respective rank order, including model and model.pkl files. |
386 | | 442 | |
387 | 443 |
388 *Model confidence scores (optional)* | 444 *Model confidence scores (optional)* |
416 | | 472 | |
417 | 473 |
418 *relax_metrics.json (optional)* | 474 *relax_metrics.json (optional)* |
419 | 475 |
420 | A JSON-formatted text file containing relax metrics (primarily remaining violations). | 476 | A JSON-formatted text file containing relax metrics (primarily remaining violations). |
477 | | |
478 | | |
479 | |
480 *timings.json (optional)* | |
481 | |
482 | A JSON-formatted text file containing the timings for each phase of the prediction. | |
421 | | 483 | |
422 | | 484 | |
423 | 485 |
424 **AlphaFold configuration** | 486 **AlphaFold configuration** |
425 | 487 |