Mercurial > repos > bimib > cobraxy
diff COBRAxy/src/flux_simulation.xml @ 539:2fb97466e404 draft
Uploaded
| author | francesco_lapi |
|---|---|
| date | Sat, 25 Oct 2025 14:55:13 +0000 |
| parents | |
| children | 5a73d813b1db |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/COBRAxy/src/flux_simulation.xml Sat Oct 25 14:55:13 2025 +0000 @@ -0,0 +1,260 @@ +<tool id="fluxSimulation" name="Flux Simulation" version="2.0.0"> + + <macros> + <import>marea_macros.xml</import> + </macros> + + <requirements> + <requirement type="package" version="1.24.4">numpy</requirement> + <requirement type="package" version="2.0.3">pandas</requirement> + <requirement type="package" version="0.29.0">cobra</requirement> + <requirement type="package" version="5.2.2">lxml</requirement> + <requirement type="package" version="1.4.2">joblib</requirement> + <requirement type="package" version="1.11">scipy</requirement> + </requirements> + + <command detect_errors="exit_code"> + <![CDATA[ + python $__tool_directory__/flux_simulation.py + --tool_dir $__tool_directory__ + + --model_and_bounds $model_and_bounds.model_and_bounds + + #if $model_and_bounds.model_and_bounds == 'True': + --model_upload $model_and_bounds.model_upload + --input "${",".join(map(str, $model_and_bounds.inputs))}" + #set $names_list = [] + #for $input_temp in $model_and_bounds.inputs: + #silent $names_list.append(str($input_temp.element_identifier)) + #end for + --name "${",".join($names_list)}" + #else: + --input "${",".join(map(str, $model_and_bounds.model_files))}" + #set $names_list = [] + #for $input_temp in $model_and_bounds.model_files: + #silent $names_list.append(str($input_temp.element_identifier)) + #end for + --name "${",".join($names_list)}" + #end if + + --sampling_enabled $sampling_params.sampling_enabled + + #if $sampling_params.sampling_enabled == 'true': + --thinning 0 + #if $sampling_params.algorithm_param.algorithm == 'OPTGP': + --thinning $sampling_params.algorithm_param.thinning + #end if + --algorithm $sampling_params.algorithm_param.algorithm + --n_batches $sampling_params.n_batches + --n_samples $sampling_params.n_samples + --seed $sampling_params.seed + --output_type "${",".join(map(str, $sampling_params.output_types))}" + #else: + --thinning 0 + --algorithm 'CBS' + --n_batches 1 + --n_samples 1 + --seed 0 + --output_type 'mean' + #end if + + #if $output_types_analysis: + --output_type_analysis "${",".join(map(str, $output_types_analysis))}" + #end if + + #if 'FVA' in str($output_types_analysis): + --perc_opt $fva_params.optimality_fraction + #end if + + --out_log $log + + #if $sampling_params.sampling_enabled == 'true': + #if 'mean' in str($sampling_params.output_types): + --out_mean $mean_results + #end if + #if 'median' in str($sampling_params.output_types): + --out_median $median_results + #end if + #if 'quantiles' in str($sampling_params.output_types): + --out_quantiles $quantile_results + #end if + #end if + + #if 'FVA' in str($output_types_analysis): + --out_fva $fva_results + #end if + #if 'pFBA' in str($output_types_analysis): + --out_pfba $pFBA_results + #end if + #if 'sensitivity' in str($output_types_analysis): + --out_sensitivity $sensitivity_results + #end if + ]]> + </command> + + <inputs> + <conditional name="model_and_bounds"> + <param name="model_and_bounds" argument="--model_and_bounds" type="select" label="Input format:" help="Choose whether to upload the model and bounds in separate files or to upload multiple complete model files."> + <option value="True" selected="true">Model + bounds (separate files)</option> + <option value="False">Multiple complete models</option> + </param> + + <when value="True"> + <param name="model_upload" argument="--model_upload" type="data" format="csv,tsv,tabular" + label="Model tabular:" + help="Upload a CSV/TSV file that contains the model reaction rules generated by the Import Metabolic Model tool. Recommended columns: ReactionID, Reaction (formula), Rule (GPR). Optional columns: name, lower_bound, upper_bound, InMedium. If bounds are present here they may be overridden by separate bound files." /> + + <param name="inputs" argument="--inputs" multiple="true" type="data" format="tabular,csv,tsv" + label="Bound file(s):" + help="Upload one or more CSV/TSV files containing reaction bounds generated by the Ras2Bounds tool. Each file must include at least: ReactionID, lower_bound, upper_bound. Files are applied in the order provided; later files override earlier ones for the same ReactionID." /> + </when> + + <when value="False"> + <param name="model_files" argument="--model_files" multiple="true" type="data" format="csv,tsv,tabular" + label="Complete Model tabular:" + help="Upload one or more CSV/TSV files, each containing both model rules and reaction bounds for different contexts/cells. Required columns: ReactionID, Reaction, Rule, lower_bound, upper_bound." /> + </when> + </conditional> + + <conditional name="sampling_params"> + <param name="sampling_enabled" argument="--sampling_enabled" type="boolean" display="checkboxes" checked="false" label="Enable sampling" help="Enable flux sampling"/> + + <when value="true"> + <conditional name="algorithm_param"> + <param name="algorithm" argument="--algorithm" type="select" label="Choose sampling algorithm:"> + <option value="CBS" selected="true">CBS</option> + <option value="OPTGP">OPTGP</option> + </param> + <when value="OPTGP"> + <param name="thinning" argument="--thinning" type="integer" label="Thinning:" value="100" help="Number of iterations to wait before taking a sample."/> + </when> + </conditional> + + <param name="n_samples" argument="--n_samples" type="integer" label="Samples:" value="1000" min="1" max="1000"/> + <param name="n_batches" argument="--n_batches" type="integer" label="Batches:" value="1" help="This is useful for computational performances."/> + <param name="seed" argument="--seed" type="integer" label="Seed:" value="0" help="Random seed."/> + + <param type="select" argument="--output_types" multiple="true" name="output_types" label="Choose outputs from sampling"> + <option value="mean" selected="true">Mean</option> + <option value="median" selected="true">Median</option> + <option value="quantiles" selected="true">Quantiles</option> + <option value="fluxes" selected="false">All fluxes</option> + </param> + </when> + + <when value="false"> + <!-- Hidden parameters when sampling is disabled --> + <param name="algorithm" type="hidden" value="CBS"/> + <param name="n_samples" type="hidden" value="1000"/> + <param name="n_batches" type="hidden" value="1"/> + <param name="seed" type="hidden" value="0"/> + <param name="output_types" type="hidden" value="mean"/> + </when> + </conditional> + + <param type="select" argument="--output_types_analysis" multiple="true" name="output_types_analysis" label="Choose outputs from optimization"> + <option value="FVA" selected="true">FVA</option> + <option value="pFBA" selected="false">pFBA</option> + <option value="sensitivity" selected="false">Sensitivity reaction knock-out (Biomass)</option> + </param> + + <conditional name="fva_params"> + <param name="show_fva_options" type="boolean" display="checkboxes" checked="false" label="Configure FVA parameters" help="Show additional FVA configuration options"/> + <when value="true"> + <param name="optimality_fraction" argument="--fva_optimality" type="float" label="FVA Optimality (fraction):" value="0.90" min="0.0" max="1.0" + help="Fraction of optimality for FVA analysis. 1.0 means the flux must be optimal, lower values allow suboptimal solutions."/> + </when> + <when value="false"> + <param name="optimality_fraction" argument="--fva_optimality" type="hidden" value="1.0"/> + </when> + </conditional> + + </inputs> + + <outputs> + <data format="txt" name="log" label="Flux Simulation - Log" /> + + <collection name="fluxes_results" type="list" label="Fluxes"> + <filter>sampling_params['sampling_enabled'] and 'fluxes' in sampling_params['output_types']</filter> + <discover_datasets name="collection" pattern="__name_and_ext__" directory="flux_simulation"/> + </collection> + + <data format="tabular" name="mean_results" label="Mean"> + <filter>sampling_params['sampling_enabled'] and 'mean' in sampling_params['output_types']</filter> + </data> + + <data format="tabular" name="median_results" label="Median"> + <filter>sampling_params['sampling_enabled'] and 'median' in sampling_params['output_types']</filter> + </data> + + <data format="tabular" name="quantile_results" label="Quantiles"> + <filter>sampling_params['sampling_enabled'] and 'quantiles' in sampling_params['output_types']</filter> + </data> + + <data format="tabular" name="fva_results" label="FVA"> + <filter>output_types_analysis and 'FVA' in output_types_analysis</filter> + </data> + + <data format="tabular" name="pFBA_results" label="pFBA"> + <filter>output_types_analysis and 'pFBA' in output_types_analysis</filter> + </data> + + <data format="tabular" name="sensitivity_results" label="Sensitivity"> + <filter>output_types_analysis and 'sensitivity' in output_types_analysis</filter> + </data> + </outputs> + + <help> + <![CDATA[ +Overview +------------- + +This tool generates flux samples from a set of metabolic models. It supports two input modes: + - Model + bounds: upload a single base model and multiple bound files (one per context/cell type) + - Multiple complete models: upload multiple model files, each already containing its own bounds. + +In the first mode: + - the base model must be in tabular format as produced by the Import Metabolic Model tool. + - the bound files should come from the RAStoBounds tool. + +In the second mode, provide a separate tabular file for each complete model. + +Available analyses +------------- + +Two types of analysis are available: + - flux optimization + - flux sampling + +For flux optimization, one of the following methods can be performed: + - parsimonious-FBA + - Flux Variability Analysis + - Biomass sensitivity analysis (single reaction knock-out) +The objective function — a linear combination of fluxes weighted by specific coefficients — depends on the provided metabolic network. + +For flux sampling, one of the following methods can be performed: + - CBS (Corner-based sampling) + - OPTGP (Improved Artificial Centering Hit-and-Run sampler) algorithms. + + +Output: +------------- + +The tool produces: + - Samples: reporting the sampled fluxes for each reaction (reaction names on the rows and sample names on the columns). Format: tab-separated. + - a log file (.txt). + +The sampled fluxes can be reported as full datasets or summarized using descriptive statistics such as mean, median, and quantiles (0.25, 0.50, 0.75), computed for each model. + +**TIP**: Bounds generated by RAStoBound are grouped in a collection. You can select collections by clicking on "Dataset Collection" option in the "Bound file(s):" input parameter. + +**TIP**: The Batches parameter helps maintain memory efficiency. For example, for 10,000 samples, use n_samples=1,000 and n_batches=10. + +**TIP**: Adjust the Thinning parameter to improve convergence toward the stationary distribution. +Common thinning values are 100 or 1000.Note that if you set thinning = 100 and request 100 samples, the total number of generated flux samples will be 100 * 100. + +**TIP**: FVA optimality percentage allows you to explore suboptimal flux ranges. 100% restricts to optimal solutions, while lower values (e.g., 90%) allow broader flux ranges. +]]> + </help> + <expand macro="citations_fluxes" /> +</tool> \ No newline at end of file
