Mercurial > repos > tduigou > optdoe
comparison optdoe.xml @ 3:34e11d0590fa draft default tip
planemo upload for repository ['https://github.com/brsynth/icfree-ml', 'https://github.com/pablocarb/doebase'] commit 2e8aa2e7c0581c7eed2074d15f7e4317ecde2ad6
author | tduigou |
---|---|
date | Mon, 01 May 2023 01:29:51 +0000 |
parents | 593e0f787172 |
children |
comparison
equal
deleted
inserted
replaced
2:593e0f787172 | 3:34e11d0590fa |
---|---|
1 <tool id="optdoe" name="Design of Experiment" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="21.09"> | |
2 <description>An optimal design of experiments (DoE) base package for synthetic biology</description> | |
3 <macros> | |
4 <token name="@VERSION_SUFFIX@">0</token> | |
5 <token name="@TOOL_VERSION@">2.0.2</token> | |
6 </macros> | |
7 <requirements> | |
8 <requirement type="package" version="@TOOL_VERSION@">doebase</requirement> | |
9 </requirements> | |
 <!-- Invokes the doebase module with func doeGetSBOL. The sbol_file and ref_parts_file options are emitted only when the corresponding optional dataset is set; the two boolean params expand to their full "flag value" strings; the trailing positional arguments are the genes CSV input and the constructs output dataset. --> | |
10 <command detect_errors="exit_code"><![CDATA[ | |
11 python -m doebase | |
12 --func doeGetSBOL | |
13 #if $adv.genes_sbol_file | |
14 --sbol_file '$adv.genes_sbol_file' | |
15 #end if | |
16 #if $adv.ref_parts_file | |
17 --ref_parts_file '$adv.ref_parts_file' | |
18 #end if | |
19 --libsize '$adv.libsize' | |
20 $adv.get_sequences | |
21 $adv.backtranslate | |
22 --codon_table '$adv.codon_table' | |
23 '$genes_file' | |
24 '$constructs' | |
25 ]]></command> | |
26 <inputs> | |
27 <param name="genes_file" type="data" format="csv" label="Genes" help="CSV file with header: Name,Type,Part,Step. Provided by the tool Selenzyme"/> | |
28 <section name="adv" title="Advanced Options" expanded="false"> | |
29 <param name="genes_sbol_file" type="data" format="xml" optional="true" label="Optimised Genes" help="SBOL file with genes associated with different RBS. Provided by the tool PartsGenie"/> | |
30 <param argument="--ref_parts_file" type="data" format="csv" value="None" optional="true" label="Ref Parts (default: E. coli compliant)" help="Provide fixed parts"/> | |
31 <param argument="--libsize" type="integer" value="32" min="32" label="Maximal library size" help="Maximal number of constructs in the output"/> | |
32 <param argument="--get_sequences" type="boolean" truevalue="--get_sequences true" falsevalue="--get_sequences false" checked="true" label="Get sequences" help="Grab the sequence for each part of the SBOL output"/> | |
33 <param argument="--backtranslate" type="boolean" truevalue="--backtranslate true" falsevalue="--backtranslate false" checked="true" label="Back translate" help="Translate the protein sequence given by its Uniprot ID to a DNA sequence"/> | |
34 <param argument="--codon_table" type="select" label="Codon Table"> | |
 <!-- Codon usage tables selectable for the codon_table option. Each value must be listed once; the first option (Eecoli.cut) is the default because no option is marked selected. --> | |
35 <option value="Eecoli.cut">Escherichia coli K12</option> | |
36 <option value="Ehuman.cut">Homo sapiens</option> | |
37 <option value="Eacica.cut">Acinetobacter calcoaceticus</option> | |
38 <option value="Eagrtu.cut">Agrobacterium tumefaciens str C58</option> | |
39 <option value="Eanasp.cut">Anabaena sp</option> | |
40 <option value="Earath.cut">Arabidopsis thaliana</option> | |
41 <option value="Eazovi.cut">Azotobacter vinelandii</option> | |
42 <option value="Ebacme.cut">Bacillus megaterium</option> | |
43 <option value="Ebacst.cut">Geobacillus stearothermophilus</option> | |
44 <option value="Ebacsu.cut">Bacillus subtilis</option> | |
45 <option value="Ebacsu_high.cut">Bacillus subtilis (high)</option> | |
46 <option value="Ebommo.cut">Bombyx mori (silkmoth)</option> | |
47 <option value="Ebovin.cut">Bos taurus</option> | |
48 <option value="Ebpphx.cut">Bacteriophage phi-X174</option> | |
49 <option value="Ebraja.cut">Bradyrhizobium japonicum USDA 110</option> | |
50 <option value="Ebrana.cut">Brassica napus (rape)</option> | |
51 <option value="Ebrare.cut">Brachydanio rerio (zebrafish)</option> | |
52 <option value="Ecaeel.cut">Caenorhabditis elegans (nematode)</option> | |
53 <option value="Ecanal.cut">Candida albicans</option> | |
54 <option value="Ecanfa.cut">Canis familiaris (dog)</option> | |
55 <option value="Ecaucr.cut">Caulobacter crescentus CB15</option> | |
56 <option value="Echick.cut">Gallus gallus (chicken)</option> | |
57 <option value="Echlre.cut">Chlamydomonas reinhardtii</option> | |
58 <option value="Echltr.cut">Chlamydia trachomatis D UW-3 CX</option> | |
59 <option value="Ecloab.cut">Clostridium acetobutylicum ATCC 824</option> | |
60 <option value="Ecrigr.cut">Cricetulus griseus (hamster)</option> | |
61 <option value="Ecyapa.cut">Cyanophora paradoxa</option> | |
75 <option value="Edicdi.cut">Dictyostelium discoideum</option> | |
76 <option value="Edicdi_high.cut">Dictyostelium discoideum (high)</option> | |
77 <option value="Edrome.cut">Drosophila melanogaster</option> | |
78 <option value="Edrome_high.cut">Drosophila melanogaster (high)</option> | |
79 <option value="Eecoli_high.cut">Escherichia coli K12 (high)</option> | |
80 <option value="Eemeni.cut">Emericella nidulans</option> | |
81 <option value="Eemeni_mit.cut">Emericella nidulans mitochondrion</option> | |
82 <option value="Eemeni_high.cut">Emericella nidulans highly expressed</option> | |
83 <option value="Eerwct.cut">Erwinia carotovora subsp atroseptica SCRI1043</option> | |
84 <option value="Ehaein.cut">Haemophilus influenzae Rd KW20</option> | |
85 <option value="Ehalma.cut">Haloarcula marismortui ATCC 43049 (Halobacterium marismortui)</option> | |
86 <option value="Ehalsa.cut">Halobacterium salinarum NRC-1 (Halobacterium halobium)</option> | |
87 <option value="Ehorvu.cut">Hordeum vulgare subsp vulgare (Barley)</option> | |
88 <option value="Eklepn.cut">Klebsiella pneumoniae</option> | |
89 <option value="Eklula.cut">Kluyveromyces lactis NRRL Y-1140</option> | |
90 <option value="Elacdl.cut">Lactococcus lactis subsp lactis Il1403 L. delbrueckii subsp lactis</option> | |
91 <option value="Elyces.cut">Lycopersicon esculentum (tomato)</option> | |
92 <option value="Emacfa.cut">Macaca fascicularis</option> | |
93 <option value="Emaize.cut">Zea mays</option> | |
94 <option value="Emaize_chl.cut">Zea mays chloroplast</option> | |
95 <option value="Emammal_high.cut">Mammalian species (high)</option> | |
96 <option value="Emanse.cut">Manduca sexta</option> | |
97 <option value="Emarpo_chl.cut">Marchantia polymorpha chloroplast (liverwort)</option> | |
98 <option value="Emedsa.cut">Medicago sativa</option> | |
99 <option value="Emetth.cut">Methanothermobacter thermautotrophicus str Delta H</option> | |
100 <option value="Emouse.cut">Mus musculus</option> | |
101 <option value="Emyctu.cut">Mycobacterium tuberculosis H37Rv</option> | |
102 <option value="Eneigo.cut">Neisseria gonorrhoeae</option> | |
103 <option value="Eneucr.cut">Neurospora crassa</option> | |
104 <option value="Eoncmy.cut">Oncorhynchus mykiss (rainbow trout)</option> | |
105 <option value="Eorysa.cut">Oryza sativa (rice)</option> | |
106 <option value="Eorysa_chl.cut">Oryza sativa chloroplast (rice)</option> | |
107 <option value="Epea.cut">Pisum sativum (pea)</option> | |
108 <option value="Epethy.cut">Petunia x hybrida</option> | |
109 <option value="Ephavu.cut">Phaseolus vulgaris</option> | |
110 <option value="Epig.cut">Sus scrofa (pig)</option> | |
111 <option value="Eplafa.cut">Plasmodium falciparum 3D7</option> | |
112 <option value="Eprovu.cut">Proteus vulgaris</option> | |
113 <option value="Epseae.cut">Pseudomonas aeruginosa PAO1</option> | |
114 <option value="Epsepu.cut">Pseudomonas putida KT2440</option> | |
115 <option value="Epsesm.cut">Pseudomonas syringae pv tomato str DC3000</option> | |
116 <option value="Erabit.cut">Oryctolagus cuniculus (rabbit)</option> | |
117 <option value="Erat.cut">Rattus norvegicus</option> | |
118 <option value="Erhile.cut">Rhizobium leguminosarum</option> | |
119 <option value="Erhime.cut">Sinorhizobium meliloti 1021</option> | |
120 <option value="Erhoca.cut">Rhodobacter capsulatus</option> | |
121 <option value="Erhosh.cut">Rhodobacter sphaeroides</option> | |
122 <option value="Esalsa.cut">Salmo salar (Atlantic salmon)</option> | |
123 <option value="Esalty.cut">Salmonella typhimurium LT2</option> | |
124 <option value="Eschma.cut">Schistosoma mansoni</option> | |
125 <option value="Eschpo.cut">Schizosaccharomyces pombe</option> | |
126 <option value="Eschpo_cai.cut">Schizosaccharomyces pombe (CAI equivalent)</option> | |
127 <option value="Eschpo_high.cut">Schizosaccharomyces pombe (high)</option> | |
128 <option value="Eserma.cut">Serratia marcescens</option> | |
129 <option value="Esheep.cut">Ovis aries (sheep)</option> | |
130 <option value="Esoltu.cut">Solanum tuberosum (potato)</option> | |
131 <option value="Esoybn.cut">Glycine max (soybean)</option> | |
132 <option value="Espiol.cut">Spinacia oleracea (spinach)</option> | |
133 <option value="Estaau.cut">Staphylococcus aureus</option> | |
134 <option value="Estrco.cut">Streptomyces coelicolor A3 2</option> | |
135 <option value="Estrmu.cut">Streptococcus mutans UA159</option> | |
136 <option value="Estrpn.cut">Streptococcus pneumoniae R6</option> | |
137 <option value="Estrpu.cut">Strongylocentrotus purpuratus (sea urchin)</option> | |
138 <option value="Esv40.cut">Simian Virus 40</option> | |
139 <option value="Esynco.cut">Synechococcus sp WH 8102</option> | |
140 <option value="Esyncy.cut">Synechocystis sp PCC 6803</option> | |
141 <option value="Etetth.cut">Tetrahymena thermophila</option> | |
142 <option value="Etheth.cut">Thermus thermophilus HB8</option> | |
143 <option value="Etobac.cut">Nicotiana tabacum (tobacco)</option> | |
144 <option value="Etobac_chl.cut">Nicotiana tabacum chloroplast (tobacco)</option> | |
145 <option value="Etrybr.cut">Trypanosoma brucei</option> | |
146 <option value="Etrycr.cut">Trypanosoma cruzi</option> | |
147 <option value="Evibch.cut">Vibrio cholerae O1 biovar eltor str N16961</option> | |
148 <option value="Ewheat.cut">Triticum aestivum (wheat)</option> | |
149 <option value="Exenla.cut">Xenopus laevis</option> | |
150 <option value="Eyeast.cut">Saccharomyces cerevisiae</option> | |
151 <option value="Eyeast_cai.cut">Saccharomyces cerevisiae original CAI set</option> | |
152 <option value="Eyeast_high.cut">Saccharomyces cerevisiae (high)</option> | |
153 <option value="Eyeast_mit.cut">Saccharomyces cerevisiae mitochondrion</option> | |
154 <option value="Eyeren.cut">Yersinia enterocolitica</option> | |
155 </param> | |
156 </section> | |
157 </inputs> | |
158 <outputs> | |
159 <data name="constructs" format="xml" label="Constructs" /> | |
160 </outputs> | |
161 <tests> | |
162 <test> | |
163 <!-- test 1: run with default parameters on genes_lycopene.csv; asserts only that the output is valid XML and contains the expected rdf:RDF namespace declarations (not a byte-for-byte comparison) --> | |
164 <param name="genes_file" value="genes_lycopene.csv" /> | |
165 <output name="constructs" > | |
166 <assert_contents> | |
167 <is_valid_xml /> | |
168 <has_text text='rdf:RDF xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:xsd="http://www.w3.org/2001/XMLSchema#" xmlns:dcterms="http://purl.org/dc/terms/" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:sbol="http://sbols.org/v2#" xmlns:xsd1="http://www.w3.org/2001/XMLSchema#dateTime/" xmlns:om="http://www.ontology-of-units-of-measure.org/resource/om-2/" xmlns:synbiohub="http://synbiohub.org#" xmlns:sbh="http://wiki.synbiohub.org/wiki/Terms/synbiohub#" xmlns:sybio="http://www.sybio.ncl.ac.uk#" xmlns:ncbi="http://www.ncbi.nlm.nih.gov#" xmlns:igem="http://wiki.synbiohub.org/wiki/Terms/igem#" xmlns:genbank="http://www.ncbi.nlm.nih.gov/genbank#" xmlns:gbconv="http://sbols.org/genBankConversion#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:obo="http://purl.obolibrary.org/obo/"'/> | |
169 </assert_contents> | |
170 </output> | |
171 </test> | |
172 </tests> | |
173 <help><![CDATA[ | |
174 OptDoE | |
175 =========== | |
176 | |
177 An optimal design of experiments is performed by using OptBioDes based on logistic regression analysis with an assumed linear model for the response. The design is evaluated by its D-efficiency, defined as: | |
178 | |
179 .. math:: D_{eff} = \frac{1}{n}\left|X^{T}X\right|^{\frac{1}{p}} | |
180 | |
181 | | |
182 | |
183 Where n is the number of experimental runs or library size, p is the number of independent variables, and X is the model matrix, i.e., a row for each experimental run and a column for each term in the model. The library size n can be selected and should be above a minimal threshold that depends on the combinatorial complexity of the library. | |
184 The experimental design can be evaluated through the provided diagnostics for D-efficiency, power analysis, and relative prediction variance, allowing the optimal selection of library size. | |
185 The resulting design is provided as an SBOL collection containing the definition of each DNA component and the combinatorial library of constructs. | |
186 | |
187 .. image:: https://raw.githubusercontent.com/brsynth/synbiocad-galaxy-wrappers/master/OptDoE/img/image3.png | |
188 :width: 80 % | |
189 :align: center | |
190 | |
191 | |
192 .. image:: https://raw.githubusercontent.com/brsynth/synbiocad-galaxy-wrappers/master/OptDoE/img/image46.png | |
193 :width: 80 % | |
194 :align: center | |
195 | |
196 | | |
197 | |
198 Above are examples of two constructs generated through optimal combinatorial design and represented using SBOL Visual in SynBioHub. | |
199 Note: if the advanced parameter "Ref Parts" is left empty, the following parts are used: | |
200 | |
201 | |
202 +---------+------------+--------------------------------------------------+ | |
203 | Name | Type | SynBioHub | | |
204 +=========+============+==================================================+ | |
205 | PlacUV5 | Promoter | https://synbiohub.org/public/igem/BBa_K1847014/1 | | |
206 +---------+------------+--------------------------------------------------+ | |
207 | Ptrc | Promoter | https://synbiohub.org/public/igem/BBa_J56012/1 | | |
208 +---------+------------+--------------------------------------------------+ | |
209 | BBR1 | Origin | https://synbiohub.org/public/igem/BBa_I50041/1 | | |
210 +---------+------------+--------------------------------------------------+ | |
211 | p15A | Origin | https://synbiohub.org/public/igem/BBa_I50032/1 | | |
212 +---------+------------+--------------------------------------------------+ | |
213 | ColE1 | Origin | https://synbiohub.org/public/igem/BBa_J64101/1 | | |
214 +---------+------------+--------------------------------------------------+ | |
215 | res1 | Resistance | https://synbiohub.org/public/igem/BBa_I13800/1 | | |
216 +---------+------------+--------------------------------------------------+ | |
217 | Ter | Terminator | https://synbiohub.org/public/igem/BBa_B1006/1 | | |
218 +---------+------------+--------------------------------------------------+ | |
219 | |
220 The source of this file can be found here as a model: https://raw.githubusercontent.com/pablocarb/doebase/master/doebase/data/ref_parts.csv | |
221 | |
222 Input | |
223 ----- | |
224 | |
225 Required: | |
226 | |
227 * **Genes**\ : Output of Selenzyme. The CSV file contains four columns: Name,Type,Part,Step. The column "Name" contains the Uniprot ID found by Selenzyme. The column "Type" represents the type of the "Part", a *gene*. The column "Part" has the same information as the column "Name". The column "Step" contains the order of the position in the pathway of the gene. | |
228 | |
229 Advanced options: | |
230 | |
231 * **Optimised Genes**\ : SBOL file containing optimized versions of the genes associated with different RBS. Output of the PartsGenie tool. | |
232 * **Ref Parts**\ : CSV with the genetic parts. Default (if left empty) is the above table. To generate a new compatible CSV file, please use the "OptDoE Parts Reference Generator" tool | |
233 * **Maximal library size**\ : (integer, default: 32) Maximal number of constructs in the SBOL output. | |
234 * **Get sequences**\ : (boolean, default: True) Grab the sequence for each part of the SBOL output. | |
235 * **Back translate**\ : (boolean, default: True) Translate the protein sequence given by its Uniprot ID to a DNA sequence. | |
236 * **Codon Table**\ : (text, default: Eecoli.cut) Codon Usage Table. See `codon_table <https://www.ebi.ac.uk/seqdb/confluence/display/JDSAT/EMBOSS+backtranseq+Help+and+Documentation#EMBOSSbacktranseqHelpandDocumentation-WebServices>`_ for more codons. | |
237 | |
238 Output | |
239 ------ | |
240 | |
241 * **Constructs**\ : Output SBOL file. It contains some combinations of constructs according to the algorithm described above. | |
242 | |
243 Project Link | |
244 ------------ | |
245 | |
246 * `Original Project <https://github.com/pablocarb/doebase>`_ | |
247 | |
248 License | |
249 ------- | |
250 | |
251 `MIT <https://raw.githubusercontent.com/pablocarb/appoptdes/master/LICENSE>`_ | |
252 | |
253 Acknowledgments | |
254 --------------- | |
255 | |
256 * Joan Hérisson | |
257 * Thomas Duigou | |
258 ]]></help> | |
259 <creator> | |
260 <person givenName="Pablo" familyName="Carbonell" email="pablo.carbonell@upv.es" identifier="https://orcid.org/0000-0002-0993-5625" /> | |
261 </creator> | |
262 </tool> |