view PTModel.xml @ 12:3e9d04994968 draft default tip

planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/openms commit 3d1e5f37fd16524a415f707772eeb7ead848c5e3
author galaxyp
date Thu, 01 Dec 2022 19:05:16 +0000
parents b6db68398c9e
children
line wrap: on
line source

<?xml version='1.0' encoding='UTF-8'?>
<!--This is a configuration file for the integration of a tools into Galaxy (https://galaxyproject.org/). This file was automatically generated using CTDConverter.-->
<!--Proposed Tool Section: [Peptide property prediction]-->
<tool id="PTModel" name="PTModel" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="21.05">
  <description>Trains a model for the prediction of proteotypic peptides from a training set.</description>
  <macros>
    <token name="@EXECUTABLE@">PTModel</token>
    <import>macros.xml</import>
  </macros>
  <expand macro="requirements"/>
  <expand macro="stdio"/>
  <command detect_errors="exit_code"><![CDATA[@QUOTE_FOO@
@EXT_FOO@
#import re

## Preprocessing
mkdir in_positive &&
ln -s '$in_positive' 'in_positive/${re.sub("[^\w\-_]", "_", $in_positive.element_identifier)}.$gxy2omsext($in_positive.ext)' &&
mkdir in_negative &&
ln -s '$in_negative' 'in_negative/${re.sub("[^\w\-_]", "_", $in_negative.element_identifier)}.$gxy2omsext($in_negative.ext)' &&
mkdir out &&
#if "out_oligo_params_FLAG" in str($OPTIONAL_OUTPUTS).split(',')
  mkdir out_oligo_params &&
#end if
#if "out_oligo_trainset_FLAG" in str($OPTIONAL_OUTPUTS).split(',')
  mkdir out_oligo_trainset &&
#end if

## Main program call

set -o pipefail &&
@EXECUTABLE@ -write_ctd ./ &&
python3 '$__tool_directory__/fill_ctd.py' '@EXECUTABLE@.ctd' '$args_json' '$hardcoded_json' &&
@EXECUTABLE@ -ini @EXECUTABLE@.ctd
-in_positive
'in_positive/${re.sub("[^\w\-_]", "_", $in_positive.element_identifier)}.$gxy2omsext($in_positive.ext)'
-in_negative
'in_negative/${re.sub("[^\w\-_]", "_", $in_negative.element_identifier)}.$gxy2omsext($in_negative.ext)'
-out
'out/output.${gxy2omsext("txt")}'
#if "out_oligo_params_FLAG" in str($OPTIONAL_OUTPUTS).split(',')
  -out_oligo_params
  'out_oligo_params/output.${gxy2omsext("paramxml")}'
#end if
#if "out_oligo_trainset_FLAG" in str($OPTIONAL_OUTPUTS).split(',')
  -out_oligo_trainset
  'out_oligo_trainset/output.${gxy2omsext("txt")}'
#end if
#if len(str($OPTIONAL_OUTPUTS).split(',')) == 0
  | tee '$stdout'
#end if

## Postprocessing
&& mv 'out/output.${gxy2omsext("txt")}' '$out'
#if "out_oligo_params_FLAG" in str($OPTIONAL_OUTPUTS).split(',')
  && mv 'out_oligo_params/output.${gxy2omsext("paramxml")}' '$out_oligo_params'
#end if
#if "out_oligo_trainset_FLAG" in str($OPTIONAL_OUTPUTS).split(',')
  && mv 'out_oligo_trainset/output.${gxy2omsext("txt")}' '$out_oligo_trainset'
#end if
#if "ctd_out_FLAG" in $OPTIONAL_OUTPUTS
  && mv '@EXECUTABLE@.ctd' '$ctd_out'
#end if]]></command>
  <configfiles>
    <inputs name="args_json" data_style="paths"/>
    <configfile name="hardcoded_json"><![CDATA[{"log": "log.txt", "threads": "\${GALAXY_SLOTS:-1}", "no_progress": true}]]></configfile>
  </configfiles>
  <inputs>
    <param argument="-in_positive" type="data" format="idxml" optional="false" label="input file with positive examples" help=" select idxml data sets(s)"/>
    <param argument="-in_negative" type="data" format="idxml" optional="false" label="input file with negative examples" help=" select idxml data sets(s)"/>
    <param argument="-c" type="float" optional="true" value="1.0" label="the penalty parameter of the svm" help=""/>
    <param argument="-svm_type" type="select" optional="true" label="the type of the svm (NU_SVC or C_SVC)" help="">
      <option value="NU_SVC">NU_SVC</option>
      <option value="C_SVC" selected="true">C_SVC</option>
      <expand macro="list_string_san" name="svm_type"/>
    </param>
    <param argument="-nu" type="float" optional="true" min="0.0" max="1.0" value="0.5" label="the nu parameter [0..1] of the svm (for nu-SVR)" help=""/>
    <param argument="-kernel_type" type="select" optional="true" label="the kernel type of the svm" help="">
      <option value="LINEAR">LINEAR</option>
      <option value="RBF">RBF</option>
      <option value="POLY">POLY</option>
      <option value="OLIGO" selected="true">OLIGO</option>
      <expand macro="list_string_san" name="kernel_type"/>
    </param>
    <param argument="-degree" type="integer" optional="true" min="1" value="1" label="the degree parameter of the kernel function of the svm (POLY kernel)" help=""/>
    <param argument="-border_length" type="integer" optional="true" min="1" value="22" label="length of the POBK" help=""/>
    <param argument="-k_mer_length" type="integer" optional="true" min="1" value="1" label="k_mer length of the POBK" help=""/>
    <param argument="-sigma" type="float" optional="true" value="5.0" label="sigma of the POBK" help=""/>
    <param argument="-max_positive_count" type="integer" optional="true" min="1" value="1000" label="quantity of positive samples for training (randomly chosen if smaller than available quantity)" help=""/>
    <param argument="-max_negative_count" type="integer" optional="true" min="1" value="1000" label="quantity of positive samples for training (randomly chosen if smaller than available quantity)" help=""/>
    <param argument="-redundant" type="boolean" truevalue="true" falsevalue="false" checked="false" label="if the input sets are redundant and the redundant peptides should occur more than once in the training set, this flag has to be set" help=""/>
    <param argument="-additive_cv" type="boolean" truevalue="true" falsevalue="false" checked="false" label="if the step sizes should be interpreted additively (otherwise the actual value is multiplied with the step size to get the new value" help=""/>
    <section name="cv" title="Parameters for the grid search / cross validation:" help="" expanded="false">
      <param name="skip_cv" argument="-cv:skip_cv" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Has to be set if the cv should be skipped and the model should just be trained with the specified parameters" help=""/>
      <param name="number_of_runs" argument="-cv:number_of_runs" type="integer" optional="true" min="1" value="10" label="number of runs for the CV" help=""/>
      <param name="number_of_partitions" argument="-cv:number_of_partitions" type="integer" optional="true" min="2" value="10" label="number of CV partitions" help=""/>
      <param name="degree_start" argument="-cv:degree_start" type="integer" optional="true" min="1" value="1" label="starting point of degree" help=""/>
      <param name="degree_step_size" argument="-cv:degree_step_size" type="integer" optional="true" value="2" label="step size point of degree" help=""/>
      <param name="degree_stop" argument="-cv:degree_stop" type="integer" optional="true" value="4" label="stopping point of degree" help=""/>
      <param name="c_start" argument="-cv:c_start" type="float" optional="true" value="1.0" label="starting point of c" help=""/>
      <param name="c_step_size" argument="-cv:c_step_size" type="float" optional="true" value="100.0" label="step size of c" help=""/>
      <param name="c_stop" argument="-cv:c_stop" type="float" optional="true" value="1000.0" label="stopping point of c" help=""/>
      <param name="nu_start" argument="-cv:nu_start" type="float" optional="true" min="0.0" max="1.0" value="0.1" label="starting point of nu" help=""/>
      <param name="nu_step_size" argument="-cv:nu_step_size" type="float" optional="true" value="1.3" label="step size of nu" help=""/>
      <param name="nu_stop" argument="-cv:nu_stop" type="float" optional="true" min="0.0" max="1.0" value="0.9" label="stopping point of nu" help=""/>
      <param name="sigma_start" argument="-cv:sigma_start" type="float" optional="true" value="1.0" label="starting point of sigma" help=""/>
      <param name="sigma_step_size" argument="-cv:sigma_step_size" type="float" optional="true" value="1.3" label="step size of sigma" help=""/>
      <param name="sigma_stop" argument="-cv:sigma_stop" type="float" optional="true" value="15.0" label="stopping point of sigma" help=""/>
    </section>
    <expand macro="adv_opts_macro">
      <param argument="-force" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Overrides tool-specific checks" help=""/>
      <param argument="-test" type="hidden" optional="true" value="False" label="Enables the test mode (needed for internal use only)" help="">
        <expand macro="list_string_san" name="test"/>
      </param>
    </expand>
    <param name="OPTIONAL_OUTPUTS" type="select" optional="true" multiple="true" label="Optional outputs">
      <option value="out_oligo_params_FLAG">out_oligo_params (output file with additional model parameters when using the OLIGO kernel)</option>
      <option value="out_oligo_trainset_FLAG">out_oligo_trainset (output file with the used training dataset when using the OLIGO kernel)</option>
      <option value="ctd_out_FLAG">Output used ctd (ini) configuration file</option>
    </param>
  </inputs>
  <outputs>
    <data name="out" label="${tool.name} on ${on_string}: out" format="txt"/>
    <data name="out_oligo_params" label="${tool.name} on ${on_string}: out_oligo_params" format="paramxml">
      <filter>OPTIONAL_OUTPUTS is not None and "out_oligo_params_FLAG" in OPTIONAL_OUTPUTS</filter>
    </data>
    <data name="out_oligo_trainset" label="${tool.name} on ${on_string}: out_oligo_trainset" format="txt">
      <filter>OPTIONAL_OUTPUTS is not None and "out_oligo_trainset_FLAG" in OPTIONAL_OUTPUTS</filter>
    </data>
    <data name="ctd_out" format="xml" label="${tool.name} on ${on_string}: ctd">
      <filter>OPTIONAL_OUTPUTS is not None and "ctd_out_FLAG" in OPTIONAL_OUTPUTS</filter>
    </data>
  </outputs>
  <tests><!-- TOPP_PTModel_1 -->
    <test expect_num_outputs="2">
      <section name="adv_opts">
        <param name="force" value="false"/>
        <param name="test" value="true"/>
      </section>
      <param name="in_positive" value="PTModel_1_input_positive.idXML"/>
      <param name="in_negative" value="PTModel_1_input_negative.idXML"/>
      <output name="out" file="PTModel_1_output.tmp" compare="sim_size" delta_frac="0.7" ftype="txt"/>
      <param name="c" value="0.5"/>
      <param name="svm_type" value="C_SVC"/>
      <param name="nu" value="0.5"/>
      <param name="kernel_type" value="OLIGO"/>
      <param name="degree" value="1"/>
      <param name="border_length" value="22"/>
      <param name="k_mer_length" value="1"/>
      <param name="sigma" value="5.0"/>
      <param name="max_positive_count" value="1000"/>
      <param name="max_negative_count" value="1000"/>
      <param name="redundant" value="false"/>
      <param name="additive_cv" value="false"/>
      <section name="cv">
        <param name="skip_cv" value="true"/>
        <param name="number_of_runs" value="10"/>
        <param name="number_of_partitions" value="10"/>
        <param name="degree_start" value="1"/>
        <param name="degree_step_size" value="2"/>
        <param name="degree_stop" value="4"/>
        <param name="c_start" value="1.0"/>
        <param name="c_step_size" value="100.0"/>
        <param name="c_stop" value="1000.0"/>
        <param name="nu_start" value="0.1"/>
        <param name="nu_step_size" value="1.3"/>
        <param name="nu_stop" value="0.9"/>
        <param name="sigma_start" value="1.0"/>
        <param name="sigma_step_size" value="1.3"/>
        <param name="sigma_stop" value="15.0"/>
      </section>
      <param name="OPTIONAL_OUTPUTS" value="ctd_out_FLAG"/>
      <output name="ctd_out" ftype="xml">
        <assert_contents>
          <is_valid_xml/>
        </assert_contents>
      </output>
    </test>
  </tests>
  <help><![CDATA[Trains a model for the prediction of proteotypic peptides from a training set.


For more information, visit http://www.openms.de/doxygen/release/2.8.0/html/TOPP_PTModel.html]]></help>
  <expand macro="references"/>
</tool>