view CADDSuite/galaxyconfigs/tools/InputPartitioner.xml @ 3:bb26168c5715

author marcel
date Tue, 12 Jul 2011 10:53:07 -0400
children af446ca2d5c6
line wrap: on
line source

<!-- This is a configuration file for the integration of a CADDSuite tool into Galaxy. This file was automatically generated using GalaxyConfigGenerator, so do not bother to make too many manual modifications. -->
<tool id="inputpartitioner" name="InputPartitioner" version="0.95">
    <description>split QSAR data set</description>
    <!-- Command line template (Cheetah syntax inside CDATA).
         Each option (-i, -o, -n) is emitted only when its parameter is neither
         the empty string nor the string 'None'. The tool's output is piped
         through "tail -n 5", so only its last five lines are kept.
         NOTE(review): because of the pipe, the exit status reported to Galaxy
         is presumably that of tail rather than InputPartitioner; confirm. -->
    <command interpreter="bash"><![CDATA[../../InputPartitioner 
#if str( $i ) != ''  and str( $i ) != 'None' :
   -i "$i"
#end if
#if str( $o ) != ''  and str( $o ) != 'None' :
   -o "$o"
#end if
#if str( $n ) != ''  and str( $n ) != 'None' :
   -n "$n"
#end if
 | tail -n 5
]]></command>
    <!-- Parameters shown in the tool form; names match the $i and $n
         placeholders used in the command template. -->
    <inputs>
        <param name="i" optional="false" label="input data-file" type="data" format="dat"/>
        <param name="n" optional="false" label="number of partitions" type="text" area="true" size="1x5" value=""/>
    </inputs>
    <!-- Dataset declared as tool output; its path is substituted for $o. -->
    <outputs>
        <data name="o" format="dat"/>
    </outputs>
    <!-- User-facing help text for the tool. The angle brackets around the
         partition index are written as &lt; / &gt; entities so that they appear
         as literal characters instead of being parsed as markup. -->
    <help>InputPartitioner partitions a given QSAR data set into n partitions with evenly distributed response values.
Thus, this tool can be useful as part of a nested validation pipeline.
Input is a data file as generated by InputReader.
Output will be written to n files postfixed '_TRAIN&lt;i&gt;.dat' and '_TEST&lt;i&gt;.dat', where &lt;i&gt; is the ID of the resp. partition. For each of these partitions, the training set contains only those compounds that were not selected for the resp. test set.</help>