comparison optdoe.xml @ 0:4f1acbf17618 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/optdoe commit ef03bd3baa194ea25b29a8e87d0cb0faab56f913
author iuc
date Thu, 27 Oct 2022 21:27:31 +0000
parents
children 9a2fb8d83eb0
comparison
equal deleted inserted replaced
-1:000000000000 0:4f1acbf17618
1 <tool id="optdoe" name="Optimal Design of Experiment" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="21.09">
2 <description>Combine selected genetic parts and enzyme variants for the desired pathways</description>
3 <macros>
4 <token name="@VERSION_SUFFIX@">0</token>
5 <token name="@TOOL_VERSION@">2.0.2</token>
6 </macros>
7 <requirements>
8 <requirement type="package" version="@TOOL_VERSION@">doebase</requirement>
9 </requirements>
10 <command detect_errors="exit_code"><![CDATA[
11 python -m doebase
12 --func doeGetSBOL
13 #if $adv.genes_sbol_file
14 --sbol_file '$adv.genes_sbol_file'
15 #end if
16 #if $adv.ref_parts_file
17 --ref_parts_file '$adv.ref_parts_file'
18 #end if
19 --libsize '$adv.libsize'
20 $adv.get_sequences
21 $adv.backtranslate
22 --codon_table '$adv.codon_table'
23 '$genes_file'
24 '$constructs'
25 ]]></command>
26 <inputs>
27 <param name="genes_file" type="data" format="csv" label="Genes" help="CSV file with header: Name,Type,Part,Step. Provided by the tool Selenzyme"/>
28 <section name="adv" title="Advanced Options" expanded="false">
29 <param name="genes_sbol_file" type="data" format="xml" optional="true" label="Optimised Genes" help="SBOL file with genes associated with different RBS. Provided by the tool PartsGenie"/>
30 <param argument="--ref_parts_file" type="data" format="csv" value="None" optional="true" label="Ref Parts (default: E. coli compliant)" help="Provide fixed parts"/>
31 <param argument="--libsize" type="integer" value="32" min="32" label="Maximal library size" help="Maximal number of contructs in the output"/>
32 <param argument="--get_sequences" type="boolean" truevalue="--get_sequences true" falsevalue="--get_sequences false" checked="true" label="Get sequences" help="Grab the sequence for each part of the SBOL output"/>
33 <param argument="--backtranslate" type="boolean" truevalue="--backtranslate true" falsevalue="--backtranslate false" checked="true" label="Back translate" help="Translate the protein sequence given by its Uniprot ID to a DNA sequence"/>
34 <param argument="--codon_table" type="select" label="Codon Table">
35 <option value="Eecoli.cut">Escherichia coli K12</option>
36 <option value="Ehuman.cut">Homo sapiens</option>
37 <option value="Eacica.cut">Acinetobacter calcoaceticus</option>
38 <option value="Eagrtu.cut">Agrobacterium tumefaciens str C58</option>
39 <option value="Eanasp.cut">Anabaena sp</option>
40 <option value="Earath.cut">Arabidopsis thaliana</option>
41 <option value="Eazovi.cut">Azotobacter vinelandii</option>
42 <option value="Ebacme.cut">Bacillus megaterium</option>
43 <option value="Ebacst.cut">Geobacillus stearothermophilus</option>
44 <option value="Ebacsu.cut">Bacillus subtilis</option>
45 <option value="Ebacsu_high.cut">Bacillus subtilis (high)</option>
46 <option value="Ebommo.cut">Bombyx mori (silkmoth)</option>
47 <option value="Ebovin.cut">Bos taurus</option>
48 <option value="Ebpphx.cut">Bacteriophage phi-X174</option>
49 <option value="Ebraja.cut">Bradyrhizobium japonicum USDA 110</option>
50 <option value="Ebrana.cut">Brassica napus (rape)</option>
51 <option value="Ebrare.cut">Brachydanio rerio (zebrafish)</option>
52 <option value="Ecaeel.cut">Caenorhabditis elegans (nematode)</option>
53 <option value="Ecanal.cut">Candida albicans</option>
54 <option value="Ecanfa.cut">Canis familiaris (dog)</option>
55 <option value="Ecaucr.cut">Caulobacter crescentus CB15</option>
56 <option value="Echick.cut">Gallus gallus (chicken)</option>
57 <option value="Echlre.cut">Chlamydomonas reinhardtii</option>
58 <option value="Echltr.cut">Chlamydia trachomatis D UW-3 CX</option>
59 <option value="Ecloab.cut">Clostridium acetobutylicum ATCC 824</option>
60 <option value="Ecrigr.cut">Cricetulus greseus (hamster)</option>
61 <option value="Ecyapa.cut">Cyanophora paradoxa</option>
62 <option value="Edicdi.cut">Dictyostelium discoideum</option>
63 <option value="Edicdi_high.cut">Dictyostelium discoideum (high)</option>
64 <option value="Edrome.cut">Drosophila melanogaster</option>
65 <option value="Edrome_high.cut">Drosophila melanogaster (high)</option>
66 <option value="Eecoli_high.cut">Escherichia coli K12 (high)</option>
67 <option value="Eemeni.cut">Emericella nidulans</option>
68 <option value="Eemeni_mit.cut">Emericella nidulans mitochondrion</option>
69 <option value="Eemeni_high.cut">Emericella nidulans highly expressed</option>
70 <option value="Eerwct.cut">Erwinia carotovora subsp atroseptica SCRI1043</option>
71 <option value="Ehaein.cut">Haemophilus influenzae Rd KW20</option>
72 <option value="Ehalma.cut">Haloarcula marismortui ATCC 43049 (Halobacterium marismortui)</option>
73 <option value="Ehalsa.cut">Halobacterium salinarum NRC-1 (Halobacterium halobium)</option>
74 <option value="Ehorvu.cut">Hordeum vulgare subsp vulgare (Barley)</option>
75 <option value="Eklepn.cut">Klebsiella pneumoniae</option>
76 <option value="Eklula.cut">Kluyveromyces lactis NRRL Y-1140</option>
77 <option value="Elacdl.cut">Lactococcus lactis subsp lactis Il1403 L. delbrueckii subsp lactis</option>
78 <option value="Elyces.cut">Lycopersicon esculentum (tomato)</option>
79 <option value="Emacfa.cut">Macaca fascicularis</option>
80 <option value="Emaize.cut">Zea mays</option>
81 <option value="Emaize_chl.cut">Zea mays chloroplast</option>
82 <option value="Emammal_high.cut">Mammalian species (high)</option>
83 <option value="Emanse.cut">Manduca sexta</option>
84 <option value="Emarpo_chl.cut">Marchantia polymorpha chloroplast (liverwort)</option>
85 <option value="Emedsa.cut">Medicago sativa</option>
86 <option value="Emetth.cut">Methanothermobacter thermautotrophicus str Delta H</option>
87 <option value="Emouse.cut">Mus musculus</option>
88 <option value="Emyctu.cut">Mycobacterium tuberculosis H37Rv</option>
89 <option value="Eneigo.cut">Neisseria gonorrhoeae</option>
90 <option value="Eneucr.cut">Neurospora crassa</option>
91 <option value="Eoncmy.cut">Oncorhynchus mykiss (rainbow trout)</option>
92 <option value="Eorysa.cut">Oryza sativa (rice)</option>
93 <option value="Eorysa_chl.cut">Oryza sativa chloroplast (rice)</option>
94 <option value="Epea.cut">Pisum sativum (pea)</option>
95 <option value="Epethy.cut">Petunia x hybrida</option>
96 <option value="Ephavu.cut">Phaseolus vulgaris</option>
97 <option value="Epig.cut">Sus scrofa (pig)</option>
98 <option value="Eplafa.cut">Plasmodium falciparum 3D7</option>
99 <option value="Eprovu.cut">Proteus vulgaris</option>
100 <option value="Epseae.cut">Pseudomonas aeruginosa PAO1</option>
101 <option value="Epsepu.cut">Pseudomonas putida KT2440</option>
102 <option value="Epsesm.cut">Pseudomonas syringae pv tomato str DC3000</option>
103 <option value="Erabit.cut">Oryctolagus cuniculus (rabbit)</option>
104 <option value="Erat.cut">Rattus norvegicus</option>
105 <option value="Erhile.cut">Rhizobium leguminosarum</option>
106 <option value="Erhime.cut">Sinorhizobium meliloti 1021</option>
107 <option value="Erhoca.cut">Rhodobacter capsulatus</option>
108 <option value="Erhosh.cut">Rhodobacter sphaeroides</option>
109 <option value="Esalsa.cut">Salmo salar (Atlantic salmon)</option>
110 <option value="Esalty.cut">Salmonella typhimurium LT2</option>
111 <option value="Eschma.cut">Schistosoma mansoni</option>
112 <option value="Eschpo.cut">Schizosaccharomyces pombe</option>
113 <option value="Eschpo_cai.cut">Schizosaccharomyces pombe (CAI equivalent)</option>
114 <option value="Eschpo_high.cut">Schizosaccharomyces pombe (high)</option>
115 <option value="Eserma.cut">Serratia marcescens</option>
116 <option value="Esheep.cut">Ovis aries (sheep)</option>
117 <option value="Esoltu.cut">Solanum tuberosum (potato)</option>
118 <option value="Esoybn.cut">Glycine max (soybean)</option>
119 <option value="Espiol.cut">Spinacia oleracea (spinach)</option>
120 <option value="Estaau.cut">Staphylococcus aureus</option>
121 <option value="Estrco.cut">Streptomyces coelicolor A3 2</option>
122 <option value="Estrmu.cut">Streptococcus mutans UA159</option>
123 <option value="Estrpn.cut">Streptococcus pneumoniae R6</option>
124 <option value="Estrpu.cut">Strongylocentrotus purpuratus (sea urchin)</option>
125 <option value="Esv40.cut">Simian Virus 40</option>
126 <option value="Esynco.cut">Synechococcus sp WH 8102</option>
127 <option value="Esyncy.cut">Synechocystis sp PCC 6803</option>
128 <option value="Etetth.cut">Tetrahymena thermophila</option>
129 <option value="Etheth.cut">Thermus thermophilus HB8</option>
130 <option value="Etobac.cut">Nicotiana tabacum (tobacco)</option>
131 <option value="Etobac_chl.cut">Nicotiana tabacum chloroplast (tobacco)</option>
132 <option value="Etrybr.cut">Trypanosoma brucei</option>
133 <option value="Etrycr.cut">Trypanosoma cruzi</option>
134 <option value="Evibch.cut">Vibrio cholerae O1 biovar eltor str N16961</option>
135 <option value="Ewheat.cut">Triticum aestivum (wheat)</option>
136 <option value="Exenla.cut">Xenopus laevis</option>
137 <option value="Eyeast.cut">Saccharomyces cerevisiae</option>
138 <option value="Eyeast_cai.cut">Saccharomyces cerevisiae original CAI set</option>
139 <option value="Eyeast_high.cut">Saccharomyces cerevisiae (high)</option>
140 <option value="Eyeast_mit.cut">Saccharomyces cerevisiae mitochondrion</option>
141 <option value="Eyeren.cut">Yersinia enterocolitica</option>
142 </param>
143 </section>
144 </inputs>
145 <outputs>
146 <data name="constructs" format="xml" label="Constructs" />
147 </outputs>
148 <tests>
149 <test>
150 <!-- test 1: check if identical outputs are produced with default parameters -->
151 <param name="genes_file" value="genes_lycopene.csv" />
152 <output name="constructs" >
153 <assert_contents>
154 <is_valid_xml />
155 <has_text text='rdf:RDF xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:xsd="http://www.w3.org/2001/XMLSchema#" xmlns:dcterms="http://purl.org/dc/terms/" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:sbol="http://sbols.org/v2#" xmlns:xsd1="http://www.w3.org/2001/XMLSchema#dateTime/" xmlns:om="http://www.ontology-of-units-of-measure.org/resource/om-2/" xmlns:synbiohub="http://synbiohub.org#" xmlns:sbh="http://wiki.synbiohub.org/wiki/Terms/synbiohub#" xmlns:sybio="http://www.sybio.ncl.ac.uk#" xmlns:ncbi="http://www.ncbi.nlm.nih.gov#" xmlns:igem="http://wiki.synbiohub.org/wiki/Terms/igem#" xmlns:genbank="http://www.ncbi.nlm.nih.gov/genbank#" xmlns:gbconv="http://sbols.org/genBankConversion#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:obo="http://purl.obolibrary.org/obo/"'/>
156 </assert_contents>
157 </output>
158 </test>
159 </tests>
160 <help><![CDATA[
161 OptDoE
162 ===========
163
164 An optimal design of experiments is performed by using OptBioDes based on logistic regression analysis with an assumed linear model for the response. The design is evaluated by its D-efficiency, defined as:
165
166 .. math:: D_{eff} = \frac{1}{n}\abs{X^{T}X}^{\frac{1}{p}}
167
168 |
169
170 Where n is the number of experimental runs or library size, p is the number of independent variables, and X is the model matrix, i.e., a row for each experimental run and a column for each term in the model. The library size n can be selected and should be above a minimal threshold depending on the number of combinatorial complexity of the library.
171 The experimental design can be evaluated through the provided diagnostics for D-efficiency, power analysis, and relative prediction variance, allowing the optimal selection of library size.
172 The resulting design is provided as an SBOL collection containing the definition of each DNA component and the combinatorial library of constructs.
173
174 .. image:: https://raw.githubusercontent.com/brsynth/synbiocad-galaxy-wrappers/master/OptDoE/img/image3.png
175 :width: 80 %
176 :align: center
177
178
179 .. image:: https://raw.githubusercontent.com/brsynth/synbiocad-galaxy-wrappers/master/OptDoE/img/image46.png
180 :width: 80 %
181 :align: center
182
183 |
184
185 Above are examples of two constructs generated through optimal combinatorial design and represented using SBOL Visual in SynBioHub.
186 Note: if advanced parameter "input_parts" is left empty, the following parts are used:
187
188
189 +---------+------------+--------------------------------------------------+
190 | Name | Type | SynBioHub |
191 +=========+============+==================================================+
192 | PlacUV5 | Promoter | https://synbiohub.org/public/igem/BBa_K1847014/1 |
193 +---------+------------+--------------------------------------------------+
194 | Ptrc | Promoter | https://synbiohub.org/public/igem/BBa_J56012/1 |
195 +---------+------------+--------------------------------------------------+
196 | BBR1 | Origin | https://synbiohub.org/public/igem/BBa_I50041/1 |
197 +---------+------------+--------------------------------------------------+
198 | p15A | Origin | https://synbiohub.org/public/igem/BBa_I50032/1 |
199 +---------+------------+--------------------------------------------------+
200 | ColE1 | Origin | https://synbiohub.org/public/igem/BBa_J64101/1 |
201 +---------+------------+--------------------------------------------------+
202 | res1 | Resistance | https://synbiohub.org/public/igem/BBa_I13800/1 |
203 +---------+------------+--------------------------------------------------+
204 | Ter | Terminator | https://synbiohub.org/public/igem/BBa_B1006/1 |
205 +---------+------------+--------------------------------------------------+
206
207 The source of this file can be found here as a model: https://raw.githubusercontent.com/pablocarb/doebase/master/doebase/data/ref_parts.csv
208
209 Input
210 -----
211
212 Required:
213
214 * **Genes**\ : Output of Selenzyme. The CSV file contains four columnds: Name,Type,Part,Step. The column "Name" contains the Uniprot ID found by Selenzyme. The column "Type" represents the type of the "Part", a *gene*. The column "Part" has the same information as the column "Name". The column "Step" contains the order of the position in the pathway of the gene.
215
216 Advanced options:
217
218 * **Optimised Genes**\ : SBOL file containing optimized versions of the genes associated with different RBS. Output of the PartsGenie tool.
219 * **Ref Parts**\ : CSV with the genetic parts. Default (if left empty) is the above table. To generate a new compatible CSV file, please use the "OptDoE Parts Reference Generator" tool
220 * **Maximal library size**\ : (integer, default: 32) Maximal number of constructs in the SBOL output.
221 * **Get sequences**\ : (boolean, default: True) Grab the sequence for each part of the SBOL output.
222 * **Back translate**\ : (boolean, default: True) Translate the protein sequence given by its Uniprot ID to a DNA sequence.
223 * **Codon Table**\ : (text, default: Eecoli.cut) Codon Usage Table. See `codon_table <https://www.ebi.ac.uk/seqdb/confluence/display/JDSAT/EMBOSS+backtranseq+Help+and+Documentation#EMBOSSbacktranseqHelpandDocumentation-WebServices>`_ for more codons.
224
225 Output
226 ------
227
228 * **Constructs**\ : Output SBOL file. It contains some combinations of constructs according to the algorithm described above.
229
230 Project Link
231 ------------
232
233 * `Original Project <https://github.com/pablocarb/doebase>`_
234
235 License
236 -------
237
238 `MIT <https://raw.githubusercontent.com/pablocarb/appoptdes/master/LICENSE>`_
239
240 Acknowledgments
241 ---------------
242
243 * Joan Hérisson
244 * Thomas Duigou
245 ]]></help>
246 <creator>
247 <person givenName="Pablo" familyName="Carbonell" email="pablo.carbonell@upv.es" identifier="https://orcid.org/0000-0002-0993-5625" />
248 </creator>
249 </tool>