comparison optdoe.xml @ 3:34e11d0590fa draft default tip

planemo upload for repository ['https://github.com/brsynth/icfree-ml', 'https://github.com/pablocarb/doebase'] commit 2e8aa2e7c0581c7eed2074d15f7e4317ecde2ad6
author tduigou
date Mon, 01 May 2023 01:29:51 +0000
parents 593e0f787172
children
comparison
equal deleted inserted replaced
2:593e0f787172 3:34e11d0590fa
1 <tool id="optdoe" name="Design of Experiment" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="21.09">
2 <description>An optimal design of experiments (DoE) base package for synthetic biology</description>
3 <macros>
<!-- Version tokens. The tool version attribute is built as @TOOL_VERSION@+galaxy@VERSION_SUFFIX@, and @TOOL_VERSION@ is also used as the version of the doebase requirement. -->
4 <token name="@VERSION_SUFFIX@">0</token>
5 <token name="@TOOL_VERSION@">2.0.2</token>
6 </macros>
7 <requirements>
<!-- The doebase package is pinned to @TOOL_VERSION@, so the dependency version and the tool version share one token. -->
8 <requirement type="package" version="@TOOL_VERSION@">doebase</requirement>
9 </requirements>
10 <command detect_errors="exit_code"><![CDATA[
11 python -m doebase
12 --func doeGetSBOL
13 #if $adv.genes_sbol_file
14 --sbol_file '$adv.genes_sbol_file'
15 #end if
16 #if $adv.ref_parts_file
17 --ref_parts_file '$adv.ref_parts_file'
18 #end if
19 --libsize '$adv.libsize'
20 $adv.get_sequences
21 $adv.backtranslate
22 --codon_table '$adv.codon_table'
23 '$genes_file'
24 '$constructs'
25 ]]></command>
<!-- Command summary: runs "python -m doebase" with func doeGetSBOL. The sbol_file and ref_parts_file flags are emitted only when the matching optional dataset is set. The get_sequences and backtranslate parameters expand to the full flag text held in their truevalue/falsevalue attributes. The two trailing positional arguments are the genes CSV input followed by the constructs output. -->
26 <inputs>
27 <param name="genes_file" type="data" format="csv" label="Genes" help="CSV file with header: Name,Type,Part,Step. Provided by the tool Selenzyme"/>
<!-- genes_file is the only input outside the advanced section; the command passes it as the first of its two trailing positional arguments. -->
28 <section name="adv" title="Advanced Options" expanded="false">
29 <param name="genes_sbol_file" type="data" format="xml" optional="true" label="Optimised Genes" help="SBOL file with genes associated with different RBS. Provided by the tool PartsGenie"/>
<!-- genes_sbol_file: optional dataset. Note the name differs from the flag it feeds: the command passes it as sbol_file, and only when a dataset is selected. -->
30 <param argument="--ref_parts_file" type="data" format="csv" optional="true" label="Ref Parts (default: E. coli compliant)" help="Provide fixed parts"/>
<!-- ref_parts_file: optional CSV dataset. No value attribute is set because a dataset parameter has no literal default; when nothing is selected the command omits the flag entirely. -->
31 <param argument="--libsize" type="integer" value="32" min="32" label="Maximal library size" help="Maximal number of constructs in the output"/>
<!-- libsize: integer, default 32, minimum 32; always passed to the command. -->
32 <param argument="--get_sequences" type="boolean" truevalue="--get_sequences true" falsevalue="--get_sequences false" checked="true" label="Get sequences" help="Grab the sequence for each part of the SBOL output"/>
33 <param argument="--backtranslate" type="boolean" truevalue="--backtranslate true" falsevalue="--backtranslate false" checked="true" label="Back translate" help="Translate the protein sequence given by its Uniprot ID to a DNA sequence"/>
<!-- Both booleans are checked by default. Their truevalue/falsevalue attributes hold the complete flag text (flag name plus "true" or "false"), which the command inserts verbatim, so the flag is always present on the command line. -->
34 <param argument="--codon_table" type="select" label="Codon Table">
<!-- Codon usage tables; the selected option value is passed to the codon_table flag of the command. Each table is listed exactly once: option values in a select must be unique. -->
35 <option value="Eecoli.cut">Escherichia coli K12</option>
36 <option value="Ehuman.cut">Homo sapiens</option>
37 <option value="Eacica.cut">Acinetobacter calcoaceticus</option>
38 <option value="Eagrtu.cut">Agrobacterium tumefaciens str C58</option>
39 <option value="Eanasp.cut">Anabaena sp</option>
40 <option value="Earath.cut">Arabidopsis thaliana</option>
41 <option value="Eazovi.cut">Azotobacter vinelandii</option>
42 <option value="Ebacme.cut">Bacillus megaterium</option>
43 <option value="Ebacst.cut">Geobacillus stearothermophilus</option>
44 <option value="Ebacsu.cut">Bacillus subtilis</option>
45 <option value="Ebacsu_high.cut">Bacillus subtilis (high)</option>
46 <option value="Ebommo.cut">Bombyx mori (silkmoth)</option>
47 <option value="Ebovin.cut">Bos taurus</option>
48 <option value="Ebpphx.cut">Bacteriophage phi-X174</option>
49 <option value="Ebraja.cut">Bradyrhizobium japonicum USDA 110</option>
50 <option value="Ebrana.cut">Brassica napus (rape)</option>
51 <option value="Ebrare.cut">Brachydanio rerio (zebrafish)</option>
52 <option value="Ecaeel.cut">Caenorhabditis elegans (nematode)</option>
53 <option value="Ecanal.cut">Candida albicans</option>
54 <option value="Ecanfa.cut">Canis familiaris (dog)</option>
55 <option value="Ecaucr.cut">Caulobacter crescentus CB15</option>
56 <option value="Echick.cut">Gallus gallus (chicken)</option>
57 <option value="Echlre.cut">Chlamydomonas reinhardtii</option>
58 <option value="Echltr.cut">Chlamydia trachomatis D UW-3 CX</option>
59 <option value="Ecloab.cut">Clostridium acetobutylicum ATCC 824</option>
60 <option value="Ecrigr.cut">Cricetulus greseus (hamster)</option>
61 <option value="Ecyapa.cut">Cyanophora paradoxa</option>
75 <option value="Edicdi.cut">Dictyostelium discoideum</option>
76 <option value="Edicdi_high.cut">Dictyostelium discoideum (high)</option>
77 <option value="Edrome.cut">Drosophila melanogaster</option>
78 <option value="Edrome_high.cut">Drosophila melanogaster (high)</option>
79 <option value="Eecoli_high.cut">Escherichia coli K12 (high)</option>
80 <option value="Eemeni.cut">Emericella nidulans</option>
81 <option value="Eemeni_mit.cut">Emericella nidulans mitochondrion</option>
82 <option value="Eemeni_high.cut">Emericella nidulans highly expressed</option>
83 <option value="Eerwct.cut">Erwinia carotovora subsp atroseptica SCRI1043</option>
84 <option value="Ehaein.cut">Haemophilus influenzae Rd KW20</option>
85 <option value="Ehalma.cut">Haloarcula marismortui ATCC 43049 (Halobacterium marismortui)</option>
86 <option value="Ehalsa.cut">Halobacterium salinarum NRC-1 (Halobacterium halobium)</option>
87 <option value="Ehorvu.cut">Hordeum vulgare subsp vulgare (Barley)</option>
88 <option value="Eklepn.cut">Klebsiella pneumoniae</option>
89 <option value="Eklula.cut">Kluyveromyces lactis NRRL Y-1140</option>
90 <option value="Elacdl.cut">Lactococcus lactis subsp lactis Il1403 L. delbrueckii subsp lactis</option>
91 <option value="Elyces.cut">Lycopersicon esculentum (tomato)</option>
92 <option value="Emacfa.cut">Macaca fascicularis</option>
93 <option value="Emaize.cut">Zea mays</option>
94 <option value="Emaize_chl.cut">Zea mays chloroplast</option>
95 <option value="Emammal_high.cut">Mammalian species (high)</option>
96 <option value="Emanse.cut">Manduca sexta</option>
97 <option value="Emarpo_chl.cut">Marchantia polymorpha chloroplast (liverwort)</option>
98 <option value="Emedsa.cut">Medicago sativa</option>
99 <option value="Emetth.cut">Methanothermobacter thermautotrophicus str Delta H</option>
100 <option value="Emouse.cut">Mus musculus</option>
101 <option value="Emyctu.cut">Mycobacterium tuberculosis H37Rv</option>
102 <option value="Eneigo.cut">Neisseria gonorrhoeae</option>
103 <option value="Eneucr.cut">Neurospora crassa</option>
104 <option value="Eoncmy.cut">Oncorhynchus mykiss (rainbow trout)</option>
105 <option value="Eorysa.cut">Oryza sativa (rice)</option>
106 <option value="Eorysa_chl.cut">Oryza sativa chloroplast (rice)</option>
107 <option value="Epea.cut">Pisum sativum (pea)</option>
108 <option value="Epethy.cut">Petunia x hybrida</option>
109 <option value="Ephavu.cut">Phaseolus vulgaris</option>
110 <option value="Epig.cut">Sus scrofa (pig)</option>
111 <option value="Eplafa.cut">Plasmodium falciparum 3D7</option>
112 <option value="Eprovu.cut">Proteus vulgaris</option>
113 <option value="Epseae.cut">Pseudomonas aeruginosa PAO1</option>
114 <option value="Epsepu.cut">Pseudomonas putida KT2440</option>
115 <option value="Epsesm.cut">Pseudomonas syringae pv tomato str DC3000</option>
116 <option value="Erabit.cut">Oryctolagus cuniculus (rabbit)</option>
117 <option value="Erat.cut">Rattus norvegicus</option>
118 <option value="Erhile.cut">Rhizobium leguminosarum</option>
119 <option value="Erhime.cut">Sinorhizobium meliloti 1021</option>
120 <option value="Erhoca.cut">Rhodobacter capsulatus</option>
121 <option value="Erhosh.cut">Rhodobacter sphaeroides</option>
122 <option value="Esalsa.cut">Salmo salar (Atlantic salmon)</option>
123 <option value="Esalty.cut">Salmonella typhimurium LT2</option>
124 <option value="Eschma.cut">Schistosoma mansoni</option>
125 <option value="Eschpo.cut">Schizosaccharomyces pombe</option>
126 <option value="Eschpo_cai.cut">Schizosaccharomyces pombe (CAI equivalent)</option>
127 <option value="Eschpo_high.cut">Schizosaccharomyces pombe (high)</option>
128 <option value="Eserma.cut">Serratia marcescens</option>
129 <option value="Esheep.cut">Ovis aries (sheep)</option>
130 <option value="Esoltu.cut">Solanum tuberosum (potato)</option>
131 <option value="Esoybn.cut">Glycine max (soybean)</option>
132 <option value="Espiol.cut">Spinacia oleracea (spinach)</option>
133 <option value="Estaau.cut">Staphylococcus aureus</option>
134 <option value="Estrco.cut">Streptomyces coelicolor A3 2</option>
135 <option value="Estrmu.cut">Streptococcus mutans UA159</option>
136 <option value="Estrpn.cut">Streptococcus pneumoniae R6</option>
137 <option value="Estrpu.cut">Strongylocentrotus purpuratus (sea urchin)</option>
138 <option value="Esv40.cut">Simian Virus 40</option>
139 <option value="Esynco.cut">Synechococcus sp WH 8102</option>
140 <option value="Esyncy.cut">Synechocystis sp PCC 6803</option>
141 <option value="Etetth.cut">Tetrahymena thermophila</option>
142 <option value="Etheth.cut">Thermus thermophilus HB8</option>
143 <option value="Etobac.cut">Nicotiana tabacum (tobacco)</option>
144 <option value="Etobac_chl.cut">Nicotiana tabacum chloroplast (tobacco)</option>
145 <option value="Etrybr.cut">Trypanosoma brucei</option>
146 <option value="Etrycr.cut">Trypanosoma cruzi</option>
147 <option value="Evibch.cut">Vibrio cholerae O1 biovar eltor str N16961</option>
148 <option value="Ewheat.cut">Triticum aestivum (wheat)</option>
149 <option value="Exenla.cut">Xenopus laevis</option>
150 <option value="Eyeast.cut">Saccharomyces cerevisiae</option>
151 <option value="Eyeast_cai.cut">Saccharomyces cerevisiae original CAI set</option>
152 <option value="Eyeast_high.cut">Saccharomyces cerevisiae (high)</option>
153 <option value="Eyeast_mit.cut">Saccharomyces cerevisiae mitochondrion</option>
154 <option value="Eyeren.cut">Yersinia enterocolitica</option>
155 </param>
156 </section>
157 </inputs>
158 <outputs>
<!-- Single output dataset; its path is the last positional argument ('$constructs') of the command. -->
159 <data name="constructs" format="xml" label="Constructs" />
160 </outputs>
161 <tests>
162 <test>
163 <!-- test 1: default parameters; the output is only required to be well-formed XML and to contain the expected rdf:RDF namespace declarations (it is not compared against a reference file) -->
164 <param name="genes_file" value="genes_lycopene.csv" />
165 <output name="constructs" >
166 <assert_contents>
167 <is_valid_xml />
168 <has_text text='rdf:RDF xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:xsd="http://www.w3.org/2001/XMLSchema#" xmlns:dcterms="http://purl.org/dc/terms/" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:sbol="http://sbols.org/v2#" xmlns:xsd1="http://www.w3.org/2001/XMLSchema#dateTime/" xmlns:om="http://www.ontology-of-units-of-measure.org/resource/om-2/" xmlns:synbiohub="http://synbiohub.org#" xmlns:sbh="http://wiki.synbiohub.org/wiki/Terms/synbiohub#" xmlns:sybio="http://www.sybio.ncl.ac.uk#" xmlns:ncbi="http://www.ncbi.nlm.nih.gov#" xmlns:igem="http://wiki.synbiohub.org/wiki/Terms/igem#" xmlns:genbank="http://www.ncbi.nlm.nih.gov/genbank#" xmlns:gbconv="http://sbols.org/genBankConversion#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:obo="http://purl.obolibrary.org/obo/"'/>
169 </assert_contents>
170 </output>
171 </test>
172 </tests>
173 <help><![CDATA[
174 OptDoE
175 ===========
176
177 An optimal design of experiments is performed by using OptBioDes based on logistic regression analysis with an assumed linear model for the response. The design is evaluated by its D-efficiency, defined as:
178
179 .. math:: D_{eff} = \frac{1}{n}\left| X^{T}X \right|^{\frac{1}{p}}
180
181 |
182
183 Where n is the number of experimental runs or library size, p is the number of independent variables, and X is the model matrix, i.e., a row for each experimental run and a column for each term in the model. The library size n can be selected and should be above a minimal threshold depending on the combinatorial complexity of the library.
184 The experimental design can be evaluated through the provided diagnostics for D-efficiency, power analysis, and relative prediction variance, allowing the optimal selection of library size.
185 The resulting design is provided as an SBOL collection containing the definition of each DNA component and the combinatorial library of constructs.
186
187 .. image:: https://raw.githubusercontent.com/brsynth/synbiocad-galaxy-wrappers/master/OptDoE/img/image3.png
188 :width: 80 %
189 :align: center
190
191
192 .. image:: https://raw.githubusercontent.com/brsynth/synbiocad-galaxy-wrappers/master/OptDoE/img/image46.png
193 :width: 80 %
194 :align: center
195
196 |
197
198 Above are examples of two constructs generated through optimal combinatorial design and represented using SBOL Visual in SynBioHub.
199 Note: if the advanced parameter "Ref Parts" is left empty, the following parts are used:
200
201
202 +---------+------------+--------------------------------------------------+
203 | Name | Type | SynBioHub |
204 +=========+============+==================================================+
205 | PlacUV5 | Promoter | https://synbiohub.org/public/igem/BBa_K1847014/1 |
206 +---------+------------+--------------------------------------------------+
207 | Ptrc | Promoter | https://synbiohub.org/public/igem/BBa_J56012/1 |
208 +---------+------------+--------------------------------------------------+
209 | BBR1 | Origin | https://synbiohub.org/public/igem/BBa_I50041/1 |
210 +---------+------------+--------------------------------------------------+
211 | p15A | Origin | https://synbiohub.org/public/igem/BBa_I50032/1 |
212 +---------+------------+--------------------------------------------------+
213 | ColE1 | Origin | https://synbiohub.org/public/igem/BBa_J64101/1 |
214 +---------+------------+--------------------------------------------------+
215 | res1 | Resistance | https://synbiohub.org/public/igem/BBa_I13800/1 |
216 +---------+------------+--------------------------------------------------+
217 | Ter | Terminator | https://synbiohub.org/public/igem/BBa_B1006/1 |
218 +---------+------------+--------------------------------------------------+
219
220 The source of this table, which can also be used as a template for a custom file, is available here: https://raw.githubusercontent.com/pablocarb/doebase/master/doebase/data/ref_parts.csv
221
222 Input
223 -----
224
225 Required:
226
227 * **Genes**\ : Output of Selenzyme. The CSV file contains four columns: Name,Type,Part,Step. The column "Name" contains the Uniprot ID found by Selenzyme. The column "Type" represents the type of the "Part", a *gene*. The column "Part" has the same information as the column "Name". The column "Step" contains the position of the gene in the pathway.
228
229 Advanced options:
230
231 * **Optimised Genes**\ : SBOL file containing optimized versions of the genes associated with different RBS. Output of the PartsGenie tool.
232 * **Ref Parts**\ : CSV with the genetic parts. Default (if left empty) is the above table. To generate a new compatible CSV file, please use the "OptDoE Parts Reference Generator" tool
233 * **Maximal library size**\ : (integer, default: 32) Maximal number of constructs in the SBOL output.
234 * **Get sequences**\ : (boolean, default: True) Grab the sequence for each part of the SBOL output.
235 * **Back translate**\ : (boolean, default: True) Translate the protein sequence given by its Uniprot ID to a DNA sequence.
236 * **Codon Table**\ : (text, default: Eecoli.cut) Codon Usage Table. See `codon_table <https://www.ebi.ac.uk/seqdb/confluence/display/JDSAT/EMBOSS+backtranseq+Help+and+Documentation#EMBOSSbacktranseqHelpandDocumentation-WebServices>`_ for more codons.
237
238 Output
239 ------
240
241 * **Constructs**\ : Output SBOL file. It contains some combinations of constructs according to the algorithm described above.
242
243 Project Link
244 ------------
245
246 * `Original Project <https://github.com/pablocarb/doebase>`_
247
248 License
249 -------
250
251 `MIT <https://raw.githubusercontent.com/pablocarb/appoptdes/master/LICENSE>`_
252
253 Acknowledgments
254 ---------------
255
256 * Joan Hérisson
257 * Thomas Duigou
258 ]]></help>
259 <creator>
<!-- Creator metadata: the person credited for this tool, identified by e-mail and ORCID. -->
260 <person givenName="Pablo" familyName="Carbonell" email="pablo.carbonell@upv.es" identifier="https://orcid.org/0000-0002-0993-5625" />
261 </creator>
262 </tool>