view cherri_eval.xml @ 2:cef4148ac5f2 draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/cherri commit 8778c3f71e295ec5b62ef3998319d211fc864e35
author iuc
date Wed, 25 Jan 2023 18:33:29 +0000
parents 7c6c282ecf5a
children
line wrap: on
line source

<tool id="cherri_eval" name="Evaluation of RRIs using CheRRI" version="@VERSION@" profile="@PROFILE@">
    <macros>
        <import>macros.xml</import>
    </macros>
    <expand macro="requirements"/>
    <command detect_errors="exit_code"><![CDATA[
        export PYTHONHASHSEED=31337 &&
        ln -s '$ref_source.genome_fasta' genome.fa &&
        mkdir model_dir &&
        tar -C model_dir -xvf '$model_tar' > /dev/null &&
        cherri eval 
        -i1 '$rris_table'
        -g genome.fa
        -l '$chrom_len_file'
        -o . 
        -on cherri_eval
        -c '$context'
        -st $use_structure
        -hf $hand_feat
        -m 'model_dir/final_full.model'
        -mp 'model_dir/features.npz'
        #if $occupied_regions:
            -i2 '$occupied_regions'
        #end if
        #if $intarna_param_file:
            -p '$intarna_param_file'
        #end if
    ]]></command>
    <inputs>
        <param name="rris_table" type="data" format="csv" label="CSV file containing all RRIs that should be evaluated" />
        <expand macro="reference_source_conditional"/>
        <param name="model_tar" type="data" format="tgz" label="Model and feature files in a tar" />
        <param name="context" type="integer" value="150" label="How much context should be added at up- and downstream of each sequence" />
        <param name="use_structure" type="boolean" truevalue="on" falsevalue="off" checked="true" label="Set 'off' if you want to disable structure, default 'on'" />
        <param name="hand_feat" type="boolean" truevalue="on" falsevalue="off" checked="false" label="If you want to start from hand-curated feature files, use this for evaluating test set performance. Default: 'off'" />
        <param name="occupied_regions" optional="True" type="data" format="binary" label="Occupied regions python object file containing a dictionary" />
        <param name="intarna_param_file" optional="True" type="data" format="txt" label="IntaRNA parameters file" />
    </inputs>
    <outputs>
        <data name="eval_out" format="csv" from_work_dir="cherri_eval/evaluation/evaluation_results_eval_rri.csv" label="Evaluation results on ${on_string}"/>
    </outputs>
    <tests>
        <test>
            <param name="rris_table" value="test_evaluate_rris.csv"/>
            <conditional name="ref_source">
                <param name="ref_source_selector" value="history"/>
                <param name="genome_fasta" value="genome.fa"/>
            </conditional>  
            <param name="chrom_len_file" value="genome.sizes" />
            <param name="model_tar" value="context_150_model.tgz" />
            <output name="eval_out" file="evaluation_results_st_on.csv"/>
        </test>
    </tests>
    <help><![CDATA[

**What it does**

CheRRI detects functional RNA-RNA interaction (RRI) sites, by evaluating if an interaction site most likely occurs in nature. It helps to filter interaction sites generated either experimentally or by an RRI prediction algorithm, by removing false positive interactions.

**Inputs**
        
CheRRI takes a table of RNA-RNA interactions. It supports output of ChiRA or a csv files of interactions in the following format. The table needs the following header line:
        
    `chrom1,start1,stop1,strand1,chrom2,start2,stop2,strand2`
        
Following the header line, each subsequent line represents an RRI, with chromosome ID (format: 1,2,3 ...), interaction start, interaction end, and strand ("+" or "-") of the two interacting partners. For example, you might want to evaluate the following three RRI sites::
        
    19,18307518,18307539,-,14,90454500,90454521,+
    X,109054541,109054590,+,9,89178539,89178562,-
    10,123136102,123136122,+,5,1245880,1245902,+

The tool also additionally takes a genome FASTA file and a chromosome lengths file. User can select an in-built FASTA or a FASTA file from history.
A chromosome legths file is tabular file where each line contains a tab separated chromosome name and its length. Followin is an example:

    chr1    23200231
    chr2    12497572
    chr3    8387920

CheRRI also needs a model file (in binary format). It can be generated by using CheRRI train tool.

**Outputs**

This tool outputs a tabular file containing predictions for each input interaction.

    ]]></help>
    <expand macro="citations" />
</tool>