Mercurial > repos > fangly > grinder

--- a/grinder.xml	Thu Nov 03 23:58:59 2011 -0400
+++ b/grinder.xml	Tue Jan 17 20:15:09 2012 -0500
@@ -1,4 +1,4 @@
-<tool id="grinder" name="Grinder" version="0.4.0">
+<tool id="grinder" name="Grinder" version="0.4.3">

   <description>versatile omic shotgun and amplicon read simulator</description>

@@ -61,6 +61,12 @@
       #if str($chimera_perc):
         -chimera_perc     $chimera_perc
       #end if
+      #if str($chimera_dist):
+        -chimera_dist     $chimera_dist
+      #end if
+      #if str($chimera_kmer):
+        -chimera_kmer     $chimera_kmer
+      #end if
       #if str($abundance_file) != "None":
         -abundance_file   $abundance_file
       #end if
@@ -174,6 +180,10 @@
     <param name="chimera_perc" type="text" value="0" optional="true" label="Percentage of chimeras" help="Specify the percent of reads in amplicon libraries that should be chimeric sequences. The 'reference' field in the description of chimeric reads will
 contain the ID of all the reference sequences forming the chimeric template. A typical value is 10%." />

+    <param name="chimera_dist" type="text" value="314 38 1" optional="true" label="Multimera distribution" help="Specify the distribution of chimeras: bimeras, trimeras, quadrameras and multimeras of higher order. The default is the average values from Quince et al. 2011: '314 38 1', which corresponds to 89% of bimeras, 11% of trimeras and 0.3% of quadrameras. Note that this option only takes effect when you request the generation of chimeras with the chimera percentage option." />
+
+    <param name="chimera_kmer" type="text" value="10" optional="true" label="k-mer based chimeras" help="Activate a method to form chimeras by picking breakpoints at places where k-mers are shared between sequences. The value to provide to this option represents k, the length of the k-mers (in bp). The longer the kmer, the more similar the sequences have to be to be eligible to form chimeras. The more frequent a k-mer is in the pool of reference sequences (taking into account their relative abundance), the more often this k-mer will be chosen. For example, CHSIM (Edgar et al. 2011) uses a k-mer length of 10 bp. If you do not want to use k-mer information to form chimeras, use 0, which will result in the reference sequences and breakpoints to be taken randomly. Note that this option only takes effect when you request the generation of chimeras with the chimera percentage option." />
+
     <param name="abundance_file" type="data" format="tabular" optional="true" label="Abundance file" help="Specify the relative abundance of the reference sequencse manually in an input file. Each line of the file should contain a sequence name and its relative abundance (%), e.g. 'seqABC 82.1' or 'seqABC 82.1 10.2' if you are specifying two different libraries." />

     <param name="abundance_model" type="text" value="uniform 1" optional="true" label="Rank abundance model" help="Relative abundance model for the input reference sequences: uniform, linear, powerlaw, logarithmic or exponential. The uniform and linear models do not require a parameter, but the other models take a parameter in the range [0, infinity). If this parameter is not specified, then it is randomly chosen. Examples:
--- a/tool_data_table_conf.xml.sample	Thu Nov 03 23:58:59 2011 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,7 +0,0 @@
-<tables>
-    <!-- Locations of all fasta files under genome directory -->
-    <table name="all_fasta" comment_char="#">
-        <columns>value, dbkey, name, path</columns>
-        <file path="tool-data/all_fasta.loc" />
-    </table>
-</tables>