view waveica.xml @ 9:6fc9f6dbcef5 draft

planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/waveica commit bbcbf9c32acaedffb78f0caef47faeed8f68cb52
author recetox
date Fri, 16 May 2025 10:14:27 +0000
parents bf32ae95a06f
children 821062fc5782
line wrap: on
line source

<tool id="waveica" name="WaveICA" version="@TOOL_VERSION@+galaxy9" profile="23.0">
    <description>removal of batch effects for untargeted metabolomics data</description>
    <macros>
        <import>macros.xml</import>
    </macros>
    <expand macro="annotation"/>
    <expand macro="creator"/>

    <requirements>
        <requirement type="package" version="@TOOL_VERSION@">r-recetox-waveica</requirement>
        <requirement type="package" version="8.0.0">r-arrow</requirement>
    </requirements>
    <command detect_errors="aggressive"><![CDATA[
        Rscript
            -e 'source("${__tool_directory__}/waveica_wrapper.R")'

            #if $batch_correction.mode == "batchwise":
            -e 'normalized_data <- waveica(
                file = "$input_num.data",
                #if $input_num.input_choice == "2":
                    metadata = "$input_num.metadata",
                    ext = "$input_num.data.ext,$input_num.metadata.ext",
                    transpose = $input_num.transpose_feature_table,
                #else:
                    ext = "$input_num.data.ext",
                #end if
                wavelet_filter = "$wf.wavelet_filter",
                wavelet_length = "$wf.wavelet_length",
                k = $k,
                t = $batch_correction.t,
                t2 = $batch_correction.t2,
                alpha = $alpha,
                exclude_blanks = $exclude_blanks
            )'
            #else if $batch_correction.mode == "single_batch":
            -e 'normalized_data <- waveica_singlebatch( 
                file = "$input_num.data",
                #if $input_num.input_choice == "2":
                    metadata = "$input_num.metadata",
                    ext = "$input_num.data.ext,$input_num.metadata.ext",
                    transpose = $input_num.transpose_feature_table,
                #else:
                    ext = "$input_num.data.ext",
                #end if
                wavelet_filter = "$wf.wavelet_filter",
                wavelet_length = "$wf.wavelet_length",
                k = $k,
                alpha = $alpha,
                cutoff = $batch_correction.cutoff,
                exclude_blanks = $exclude_blanks
            )'
            #end if

            -e 'store_data(normalized_data, "$normalized_data", "$metadata", "$input_num.data.ext", $keep_two_output)'
    ]]></command>

    <inputs>
        <conditional name="input_num">
            <param name="input_choice" type="select" label="Choose input files:">
                    <option value="1" selected="true">1: intensity-by-feature table with metadata</option>
                    <option value="2">2: intensity-by-feature table and metadata table separately</option>
            </param>
            <when value="1">
                <expand macro="input_data"/>
            </when>
            <when value="2">
                <expand macro="input_data"/>
                <param name="metadata" label="Input metadata" type="data" format="csv,tsv,tabular,parquet" help="" />
                <param name = "transpose_feature_table" label="Transpose feature table" type="boolean" checked="false" 
                truevalue="TRUE" falsevalue="FALSE" help="Swap sample names with feature names as column headers (to fit recetox-aplcms outputs)." />
            </when>
        </conditional>
        <param type="integer" value="20" name="k" label="Number of components to decompose" help="maximal component that ICA decomposes"/>
        <param type="float" value="0" name="alpha" label="Alpha" help="trade-off value between the independence of samples (temporal ICA) and variables (spatial ICA), should be between 0 and 1"/>
        <expand macro="wf"/>
        <conditional name="batch_correction">
            <param name="mode" type="select" label="Batch correction mode" help="'multiple batches' takes into account
            inter- and intrabatch intensity drift; 'single batch' relies only on the injection order of the samples and
            requires no batch information [2]">
                <option value="batchwise" selected="true">Multiple batches</option>
                <option value="single_batch">Single batch (or no batch information)</option>
            </param>
            <when value="batchwise">
                <param type="float" value="0.05" name="t" label="Batch-association threshold" help="threshold to consider a component associate with the batch, should be between 0 and 1"/>
                <param type="float" value="0.05" name="t2" label="Group-association threshold" help="threshold to consider a component associate with the group, should be between 0 and 1"/>
            </when>
            <when value="single_batch">
                <param type="float" value="0" name="cutoff" label="Cutoff" help="threshold of the variation explained by the injection order for independent components, should be between 0 and 1"/>
            </when>
        </conditional>
        <param name="exclude_blanks" type="boolean" checked="false" truevalue="TRUE" falsevalue="FALSE" label="Remove blanks" help="Excludes blank samples from the output" />
        <expand macro="split_output"/>
    </inputs>

    <expand macro="outputs"/>

    <tests>
        <test expect_num_outputs="1"><!-- TEST 1 -->
            <conditional name="input_num">
                <param name="data" value="input_data.csv" ftype="csv"/>
            </conditional>
            <param name="alpha" value="0"/>
            <param name="k" value="20"/>
            <conditional name="wf">
                <param name="wavelet_filter" value="d"/>
                <param name="wavelet_length" value="2"/>
            </conditional>
            <conditional name="batch_correction">
                <param name="mode" value="batchwise"/>
                <param name="t" value="0.05"/>
                <param name="t2" value="0.05"/>
            </conditional>
            <output name="normalized_data" file="normalized_data.tsv" ftype="tabular"/>
        </test>
        <test expect_num_outputs="1"><!-- TEST 2 -->
            <conditional name="input_num">
                <param name="data" value="input_data.tsv" ftype="tsv"/>
            </conditional>
            <param name="alpha" value="0"/>
            <param name="k" value="20"/>
            <conditional name="wf">
                <param name="wavelet_filter" value="d"/>
                <param name="wavelet_length" value="2"/>
            </conditional>
            <conditional name="batch_correction">
                <param name="mode" value="batchwise"/>
                <param name="t" value="0.05"/>
                <param name="t2" value="0.05"/>
            </conditional>
            <output name="normalized_data" file="normalized_data.tsv" ftype="tabular"/>
        </test>
        <test expect_num_outputs="1"><!-- TEST 3 -->
            <conditional name="input_num">
                <param name="data" value="input_data.parquet" ftype="parquet"/>
            </conditional>
            <param name="k" value="20"/>
            <param name="alpha" value="0"/>
            <conditional name="wf">
                <param name="wavelet_filter" value="d"/>
                <param name="wavelet_length" value="2"/>
            </conditional>
            <conditional name="batch_correction">
                <param name="mode" value="batchwise"/>
                <param name="t" value="0.05"/>
                <param name="t2" value="0.05"/>
            </conditional>
            <output name="normalized_data" file="normalized_data.parquet" ftype="parquet"/>
        </test>
        <test expect_num_outputs="1"><!-- TEST 4 -->
            <conditional name="input_num">
                <param name="input_choice" value="2"/>
                <param name="data" value="feature_table.csv" ftype="csv"/>
                <param name="metadata" value="metadata.csv" ftype="csv"/>
            </conditional>
            <param name="alpha" value="0"/>
            <param name="k" value="20"/>
            <conditional name="wf">
                <param name="wavelet_filter" value="d"/>
                <param name="wavelet_length" value="2"/>
            </conditional>
            <conditional name="batch_correction">
                <param name="mode" value="batchwise"/>
                <param name="t" value="0.05"/>
                <param name="t2" value="0.05"/>
            </conditional>
            <output name="normalized_data" file="normalized_data.tsv" ftype="tabular"/>
        </test>
        <test expect_num_outputs="1"><!-- TEST 5 -->
            <conditional name="input_num">
                <param name="input_choice" value="2"/>
                <param name="data" value="feature_table.tsv" ftype="tabular"/>
                <param name="metadata" value="metadata.tsv" ftype="tabular"/>
            </conditional>
            <output name="normalized_data" file="normalized_data.tsv" ftype="tabular"/>
        </test>
        <test expect_num_outputs="1"><!-- TEST 6 -->
            <conditional name="input_num">
                <param name="input_choice" value="2"/>
                <param name="data" value="feature_table.parquet" ftype="parquet"/>
                <param name="metadata" value="metadata.csv" ftype="csv"/>
            </conditional>
            <output name="normalized_data" file="normalized_data.parquet" compare="sim_size" delta="200" ftype="parquet"/>
        </test>
        <test expect_num_outputs="1"><!-- TEST 7 -->
            <conditional name="input_num">
                <param name="input_choice" value="2"/>
                <param name="data" value="feature_table_transpose_version.parquet" ftype="parquet"/>
                <param name="metadata" value="metadata.parquet" ftype="parquet"/>
                <param name="transpose_feature_table" value="TRUE"/>
            </conditional>
            <output name="normalized_data" file="normalized_data.parquet" compare="sim_size" delta="200" ftype="parquet"/>
        </test>
        <test expect_num_outputs="1"><!-- TEST 8 -->
            <conditional name="input_num">
                <param name="input_choice" value="2"/>
                <param name="data" value="feature_table_transpose_version.csv" ftype="csv"/>
                <param name="metadata" value="metadata.csv" ftype="csv"/>
                <param name="transpose_feature_table" value="TRUE"/>
            </conditional>
            <output name="normalized_data" file="normalized_data.tsv" ftype="tabular"/>
        </test>
        <test expect_num_outputs="2"><!-- TEST 9 -->
            <conditional name="input_num">
                <param name="input_choice" value="2"/>
                <param name="data" value="feature_table_transpose_version.parquet" ftype="parquet"/>
                <param name="metadata" value="metadata.parquet" ftype="parquet"/>
                <param name="transpose_feature_table" value="TRUE"/>
            </conditional>
            <param name="keep_two_output" value="TRUE"/>
            <output name="normalized_data" file="test9_output1.parquet" ftype="parquet"/>
            <output name="metadata" file="test9_output2.parquet" ftype="parquet"/>
        </test>
        <test expect_num_outputs="2"><!-- TEST 10 -->
            <conditional name="input_num">
                <param name="input_choice" value="2"/>
                <param name="data" value="feature_table_transpose_version.csv" ftype="csv"/>
                <param name="metadata" value="metadata.csv" ftype="csv"/>
                <param name="transpose_feature_table" value="TRUE"/>
            </conditional>
            <param name="keep_two_output" value="TRUE"/>
            <output name="normalized_data" file="test10_output1.tsv" ftype="tabular"/>
            <output name="metadata" file="test10_output2.tsv" ftype="tabular"/>
        </test>
        <test expect_failure="true"><!-- TEST 11 -->
            <conditional name="input_num">
                <param name="data" value="na_data.csv" ftype="csv"/>
            </conditional>
        </test>
        <test expect_failure="true"><!-- TEST 12 -->
            <conditional name="input_num">
                <param name="data" value="incomplete_metadata_data.csv" ftype="csv"/>
            </conditional>
        </test>
    </tests>

    <help>
        <![CDATA[
        @HELP@
        ]]>
    </help>

    <citations>
        <citation type="doi">10.1016/j.aca.2019.02.010</citation>
        <citation type="doi">10.1007/s11306-021-01839-7</citation>
    </citations>

</tool>