annotate grinder.xml @ 8:43def9fa33b9

Grinder 0.4.0
author fangly
date Thu, 03 Nov 2011 23:44:09 -0400
parents bac7e652a9aa
children 577e77853e8b
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
1 <tool id="grinder" name="Grinder" version="0.4.0">
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
2
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
3 <description>versatile omic shotgun and amplicon read simulator</description>
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
4
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
5 <requirements>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
6 <requirement type="binary">grinder</requirement>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
7 </requirements>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
8
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
9 <version_string>grinder --version</version_string>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
10
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
11 <command interpreter="python">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
12 stderr_wrapper.py
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
13 grinder
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
14 #if $reference_file.specify == "builtin":
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
15 -reference_file ${ filter( lambda x: str( x[0] ) == str( $reference_file.value ), $__app__.tool_data_tables[ 'all_fasta' ].get_fields() )[0][-1] }
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
16 #else if $reference_file.specify == "uploaded":
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
17 -reference_file $reference_file.value
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
18 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
19 #if str($coverage_fold):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
20 -coverage_fold $coverage_fold
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
21 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
22 #if str($total_reads):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
23 -total_reads $total_reads
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
24 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
25 #if str($read_dist):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
26 -read_dist $read_dist
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
27 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
28 #if str($insert_dist):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
29 -insert_dist $insert_dist
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
30 #end if
7
bac7e652a9aa Added mate orientation option
fangly
parents: 6
diff changeset
31 #if str($mate_orientation):
bac7e652a9aa Added mate orientation option
fangly
parents: 6
diff changeset
32 -mate_orientation $mate_orientation
bac7e652a9aa Added mate orientation option
fangly
parents: 6
diff changeset
33 #end if
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
34 #if str($exclude_chars):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
35 -exclude_chars $exclude_chars
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
36 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
37 #if str($delete_chars):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
38 -delete_chars $delete_chars
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
39 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
40 #if str($forward_reverse) != "None":
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
41 -forward_reverse $forward_reverse
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
42 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
43 #if str($unidirectional):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
44 -unidirectional $unidirectional
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
45 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
46 #if str($length_bias):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
47 -length_bias $length_bias
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
48 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
49 #if str($copy_bias):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
50 -copy_bias $copy_bias
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
51 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
52 #if str($mutation_dist):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
53 -mutation_dist $mutation_dist
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
54 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
55 #if str($mutation_ratio):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
56 -mutation_ratio $mutation_ratio
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
57 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
58 #if str($homopolymer_dist):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
59 -homopolymer_dist $homopolymer_dist
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
60 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
61 #if str($chimera_perc):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
62 -chimera_perc $chimera_perc
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
63 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
64 #if str($abundance_file) != "None":
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
65 -abundance_file $abundance_file
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
66 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
67 #if str($abundance_model):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
68 -abundance_model $abundance_model
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
69 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
70 #if str($num_libraries):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
71 -num_libraries $num_libraries
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
72 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
73 #if str($multiplex_ids) != "None":
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
74 -multiplex_ids $multiplex_ids
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
75 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
76 #if str($diversity):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
77 -diversity $diversity
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
78 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
79 #if str($shared_perc):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
80 -shared_perc $shared_perc
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
81 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
82 #if str($permuted_perc):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
83 -permuted_perc $permuted_perc
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
84 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
85 #if str($random_seed):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
86 -random_seed $random_seed
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
87 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
88 #if str($desc_track):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
89 -desc_track $desc_track
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
90 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
91 #if str($qual_levels):
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
92 -qual_levels $qual_levels
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
93 #end if
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
94 #if str($fastq_output) == '1':
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
95 -fastq_output $fastq_output
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
96 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
97 #if str($profile_file) != "None":
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
98 -profile_file $profile_file.value
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
99 #end if
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
100 <!-- When Galaxy bug #661 is resolved, then we can use the same method to check for all optional arguments -->
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
101 <!-- i.e. either if str($param) != "None": or if str($param): -->
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
102 <!-- URL: https://bitbucket.org/galaxy/galaxy-central/issue/661/optional-arguments-problems#comment-655611 -->
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
103 </command>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
104
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
105 <inputs>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
106
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
107 <conditional name="reference_file">
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
108 <param name="specify" type="select" label="Specify">
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
109 <option value="builtin">Built-in file</option>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
110 <option value="uploaded">Uploaded file</option>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
111 </param>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
112 <when value="builtin">
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
113 <param name="value" type="select" label="Reference sequences (genomes, genes, transcripts, proteins)" help="Galaxy built-in FASTA file">
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
114 <options from_data_table="all_fasta" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
115 </param>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
116 </when>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
117 <when value="uploaded">
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
118 <param name="value" type="data" format="fasta" label="Reference sequences" help="FASTA file that contains the input reference sequences" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
119 </when>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
120 </conditional>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
121
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
122 <param name="total_reads" type="text" value="100" optional="true" label="Number of reads" help="Number of shotgun or amplicon reads to generate for each library. Do not specify this if you specify the fold coverage." />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
123
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
124 <param name="coverage_fold" type="text" optional="true" label="Coverage fold" help="Desired fold coverage of the input reference sequences (the output FASTA length divided by the input FASTA length). Do not specify this if you specify the number of reads directly." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
125
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
126 <param name="read_dist" type="text" value="100" optional="true" label="Sequence length distribution" help="Desired sequence length distribution specified as:
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
127 average length, distribution ('uniform' or 'normal') and standard deviation
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
128 Only the first element is required.
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
129 Examples:
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
130 1/ All reads exactly 101 bp long (Illumina GA 2x): 101
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
131 2/ Uniform read distribution around 100+-10 bp: 100 uniform 10
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
132 3/ Reads normally distributed with an average of 800 and a standard deviation
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
133 of 100 bp (Sanger reads): 800 normal 100
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
134 4/ Reads normally distributed with an average of 450 and a standard deviation
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
135 of 50 bp (454 GS-FLX Ti): 450 normal 50
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
136 Reference sequences smaller than the specified read length are not used." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
137
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
138 <param name="insert_dist" type="text" value="0" optional="true" label="Insert size distribution" help="Create paired-end or mate-pair reads spanning the given insert length. Important: the insert is defined in the biological sense, i.e. its length includes the length of both reads and of the stretch of DNA between them:
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
139 0 : off,
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
140 or: insert size distribution in bp, in the same format as the read length
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
141 distribution (a typical value is 2,500 bp)
7
bac7e652a9aa Added mate orientation option
fangly
parents: 6
diff changeset
142 Two distinct reads are generated whether or not the mate pair overlaps." />
bac7e652a9aa Added mate orientation option
fangly
parents: 6
diff changeset
143
bac7e652a9aa Added mate orientation option
fangly
parents: 6
diff changeset
144 <param name="mate_orientation" type="text" value="FR" optional="true" label="Mate orientation" help="When generating paired-end or mate-pair reads (see the insert distribution parameter), specify the orientation of the reads (F: forward, R: reverse): FR for Sanger or Illumina paired-end, FF for 454, RF for Illumina mate-pairs, or RR" />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
145
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
146 <param name="exclude_chars" type="text" optional="true" label="Characters to exclude" help="Do not create reads containing any of the specified characters (case insensitive), e.g. 'N-' to prevent reads with gaps (-) or ambiguities (N)." />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
147
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
148 <param name="delete_chars" type="text" optional="true" label="Characters to delete" help="Remove the specified characters from the reference sequences (case insensitive), e.g. 'N-' to remove gaps (-) and ambiguities (N)." />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
149
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
150 <param name="forward_reverse" type="data" format="fasta" optional="true" label="Amplicon primers" help="Use DNA amplicon sequencing using a forward and reverse PCR primer sequence provided in a FASTA file. The primer sequences should use the IUPAC convention for degenerate residues and the reference sequences that do not match the specified primers are excluded. If your reference sequences are full genomes, it is recommended to turn the copy number bias option on and the length bias option off. To sequence from the forward strand, set the sequencing direction option to 1 and put the forward primer first and reverse primer second in the FASTA file. To sequence from the reverse strand, invert the primers in the FASTA file and use -1 for the sequencing direction option. The second primer sequence in the FASTA file is always optional. Example: AAACTYAAAKGAATTGRCGG and ACGGGCGGTGTGTRC for the 926F and 1392R primers that target the V6 to V9 region of the 16S rRNA gene." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
151
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
152 <param name="unidirectional" type="select" display="radio" value="0" label="Sequencing direction" help="Instead of producing reads bidirectionally, from the reference strand and its reverse complement, proceed unidirectionally, from one strand only (forward or reverse). Values: 0 (off, i.e. bidirectional), 1 (forward), -1 (reverse). Use the value 1 for strand specific transcriptomic or proteomic datasets.">
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
153 <option value="0">both strands</option>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
154 <option value="1">forward strand only</option>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
155 <option value="-1">reverse strand only</option>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
156 </param>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
157
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
158 <param name="length_bias" type="boolean" truevalue="1" falsevalue="0" checked="true" label="Length bias" help="In shotgun libraries, sample reference sequences proportionally to their length. For example, in simulated microbial datasets, this means that at the same relative abundance, larger genomes contribute more reads than smaller genomes. 0 = no, 1 = yes." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
159
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
160 <param name="copy_bias" type="boolean" truevalue="1" falsevalue="0" checked="true" label="Copy number bias" help="In amplicon libraries where full genomes are used as input, sample species proportionally to the number of copies of the target gene: at equal relative abundance, genomes that have multiple copies of the target gene contribute more amplicon reads than genomes that have a single copy. 0 = no, 1 = yes." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
161
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
162 <param name="mutation_dist" type="text" value="0" optional="true" label="Mutation distribution" help="Introduce sequencing errors in the reads, under the form of mutations (substitutions, insertions and deletions) at positions that follow a specified distribution (with replacement): model (uniform, linear, poly4), model parameters. For example, for a uniform 0.1% error rate, use: uniform 0.1. To simulate Sanger errors, use a linear model where the error rate is 1% at the 5' end of reads and 2% at the 3' end: linear 1 2. To model Illumina errors using the 4th degree polynomial 3e-3 + 3.3e-8 * i^4 (Korbel et al 2009), use: poly4 3e-3 3.3e-8. Use the mutation ratio option to alter how many of these mutations are substitutions
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
163 or indels." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
164
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
165 <param name="mutation_ratio" type="text" value="80 20" optional="true" label="Mutation ratio" help="Indicate the percentage of substitutions and the number of indels (insertions and deletions). For example, use '80 20' (4 substitutions for each indel) for Sanger reads. Note that this parameter has no effect unless you specify the mutation distribution option." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
166
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
167 <param name="homopolymer_dist" type="text" value="0" optional="true" label="Homopolymer distribution" help="Introduce sequencing errors in the reads under the form of homopolymeric stretches (e.g. AAA, CCCCC) using a specified model where the homopolymer length
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
168 follows a normal distribution N(mean, standard deviation) that is a function of
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
169 the homopolymer length n.
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
170 Margulies: N(n, 0.15 * n), Margulies et al. 2005.
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
171 Richter: N(n, 0.15 * sqrt(n)), Richter et al. 2008.
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
172 Balzer: N(n, 0.03494 + n * 0.06856), Balzer et al. 2010." />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
173
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
174 <param name="chimera_perc" type="text" value="0" optional="true" label="Percentage of chimeras" help="Specify the percent of reads in amplicon libraries that should be chimeric sequences. The 'reference' field in the description of chimeric reads will
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
175 contain the ID of all the reference sequences forming the chimeric template. A typical value is 10%." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
176
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
177 <param name="abundance_file" type="data" format="tabular" optional="true" label="Abundance file" help="Specify the relative abundance of the reference sequences manually in an input file. Each line of the file should contain a sequence name and its relative abundance (%), e.g. 'seqABC 82.1' or 'seqABC 82.1 10.2' if you are specifying two different libraries." />
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
178
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
179 <param name="abundance_model" type="text" value="uniform 1" optional="true" label="Rank abundance model" help="Relative abundance model for the input reference sequences: uniform, linear, powerlaw, logarithmic or exponential. The uniform and linear models do not require a parameter, but the other models take a parameter in the range [0, infinity). If this parameter is not specified, then it is randomly chosen. Examples:
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
180
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
181 uniform distribution: uniform
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
182 powerlaw distribution with parameter 0.1: powerlaw 0.1
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
183 exponential distribution with automatically chosen parameter: exponential" />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
184
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
185 <param name="num_libraries" type="text" value="1" optional="true" label="Number of libraries" help="Number of independent libraries to create. Specify how diverse and similar they should be using the diversity, shared percent and permuted percent options. Assign them different MID tags with the multiplex mids option. Note that in Galaxy, the maximum number of libraries is 10." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
186
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
187 <param name="multiplex_ids" type="data" format="fasta" optional="true" label="Specify MID tags file" help="Specify an optional FASTA file that contains sequence identifiers (a.k.a MIDs or barcodes) to add to the sequences (one sequence per library)."/>
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
188
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
189 <!-- When Galaxy bug #661 is resolved, then we can really have optional parameters of type "integer" or "float" -->
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
190 <!-- URL: https://bitbucket.org/galaxy/galaxy-central/issue/661/optional-arguments-problems#comment-655611 -->
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
191 <!-- Affected params: diversity (int), shared_perc (float), permuted_perc (float), random_seed (int), num_libraries (int), chimera_perc (float) -->
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
192 <param name="diversity" type="text" optional="true" label="Diversity (richness)" help="Richness, or number of reference sequences to include in the shotgun libraries. Use 0 for the maximum diversity possible (based on the number of reference sequences
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
193 available). Provide one value to make all libraries have the same diversity, or one diversity value per library otherwise." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
194
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
195 <param name="shared_perc" type="text" value="0" optional="true" label="Percent shared" help="For multiple libraries, percent of reference sequences they should have in common (relative to the diversity of the least diverse library)." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
196
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
197 <param name="permuted_perc" type="text" value="0" optional="true" label="Percent permuted" help="For multiple libraries, percent of the most-abundant reference sequences to permute in rank-abundance." />
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
198
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
199 <param name="random_seed" type="text" optional="true" label="Random seed" help="Seed number to use for the pseudo-random number generator." />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
200
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
201 <param name="desc_track" type="boolean" truevalue="1" falsevalue="0" checked="true" label="Read tracking" help="Track read information (reference sequence, position, errors, ...) by writing it in the FASTA read description." />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
202
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
203 <param name="qual_levels" type="text" optional="true" label="Quality score levels" help="Generate basic quality scores for the simulated reads. Good residues are given a specified good score (e.g. 30) and residues that are the result of an insertion or substitution are given a specified bad score (e.g. 10). Specify first the good score and then the bad score, e.g. '30 10'" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
204
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
205 <param name="fastq_output" type="boolean" truevalue="1" falsevalue="0" checked="false" label="FASTQ output" help="
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
206 Write the generated reads in FASTQ format (Sanger variant) instead of FASTA and
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
207 QUAL. Quality score levels need to be specified for this option to be effective." />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
208
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
209 <param name="profile_file" type="data" format="txt" optional="true" label="Profile file" help="A file that contains Grinder arguments. This is useful if you use many options or often use the same options. Lines with comments (#) are ignored. Consider the profile file, 'simple_profile.txt':
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
210
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
211 # A simple Grinder profile
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
212 -read_dist 105 normal 12
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
213 -total_reads 1000
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
214
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
215 Running: grinder -reference_file viral_genomes.fa -profile_file simple_profile.txt
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
216
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
217 Translates into: grinder -reference_file viral_genomes.fa -read_dist 105 normal 12 -total_reads 1000
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
218
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
219 Note that the arguments specified in the profile should not be specified again on the command line." />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
220
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
221 </inputs>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
222
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
223
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
224 <outputs>
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
225
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
226 <!-- single library output -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
227 <data format="tabular" name="ranks" from_work_dir="grinder-ranks.txt" label="${tool.name} ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
228 <filter>int(str(num_libraries)) == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
229 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
230 <data format="fasta" name="fasta" from_work_dir="grinder-reads.fa" label="${tool.name} reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
231 <filter>int(str(num_libraries)) == 1 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
232 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
233 <data format="qual" name="qual" from_work_dir="grinder-reads.qual" label="${tool.name} quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
234 <filter>int(str(num_libraries)) == 1 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
235 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
236 <data format="fastqsanger" name="fastq" from_work_dir="grinder-reads.fastq" label="${tool.name} reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
237 <filter>int(str(num_libraries)) == 1 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
238 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
239
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
240 <!-- When Galaxy bug #670 is resolved, then we won't have to hardcode the number of output datasets -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
241 <!-- URL: https://bitbucket.org/galaxy/galaxy-central/issue/670/better-support-for-multiple-outputs -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
242
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
243 <!-- multiple libraries: library 1 -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
244 <data format="tabular" name="ranks1" from_work_dir="grinder-1-ranks.txt" label="${tool.name} lib 1 ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
245 <filter>int(str(num_libraries)) >= 2</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
246 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
247 <data format="fasta" name="fasta1" from_work_dir="grinder-1-reads.fa" label="${tool.name} lib 1 reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
248 <filter>int(str(num_libraries)) >= 2 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
249 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
250 <data format="qual" name="qual1" from_work_dir="grinder-1-reads.qual" label="${tool.name} lib 1 quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
251 <filter>int(str(num_libraries)) >= 2 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
252 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
253 <data format="fastqsanger" name="fastq1" from_work_dir="grinder-1-reads.fastq" label="${tool.name} lib 1 reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
254 <filter>int(str(num_libraries)) >= 2 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
255 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
256
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
257 <!-- multiple libraries: library 2 -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
258 <data format="tabular" name="ranks2" from_work_dir="grinder-2-ranks.txt" label="${tool.name} lib 2 ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
259 <filter>int(str(num_libraries)) >= 2</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
260 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
261 <data format="fasta" name="fasta2" from_work_dir="grinder-2-reads.fa" label="${tool.name} lib 2 reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
262 <filter>int(str(num_libraries)) >= 2 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
263 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
264 <data format="qual" name="qual2" from_work_dir="grinder-2-reads.qual" label="${tool.name} lib 2 quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
265 <filter>int(str(num_libraries)) >= 2 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
266 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
267 <data format="fastqsanger" name="fastq2" from_work_dir="grinder-2-reads.fastq" label="${tool.name} lib 2 reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
268 <filter>int(str(num_libraries)) >= 2 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
269 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
270
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
271 <!-- multiple libraries: library 3 -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
272 <data format="tabular" name="ranks3" from_work_dir="grinder-3-ranks.txt" label="${tool.name} lib 3 ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
273 <filter>int(str(num_libraries)) >= 3</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
274 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
275 <data format="fasta" name="fasta3" from_work_dir="grinder-3-reads.fa" label="${tool.name} lib 3 reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
276 <filter>int(str(num_libraries)) >= 3 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
277 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
278 <data format="qual" name="qual3" from_work_dir="grinder-3-reads.qual" label="${tool.name} lib 3 quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
279 <filter>int(str(num_libraries)) >= 3 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
280 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
281 <data format="fastqsanger" name="fastq3" from_work_dir="grinder-3-reads.fastq" label="${tool.name} lib 3 reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
282 <filter>int(str(num_libraries)) >= 3 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
283 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
284
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
285 <!-- multiple libraries: library 4 -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
286 <data format="tabular" name="ranks4" from_work_dir="grinder-4-ranks.txt" label="${tool.name} lib 4 ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
287 <filter>int(str(num_libraries)) >= 4</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
288 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
289 <data format="fasta" name="fasta4" from_work_dir="grinder-4-reads.fa" label="${tool.name} lib 4 reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
290 <filter>int(str(num_libraries)) >= 4 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
291 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
292 <data format="qual" name="qual4" from_work_dir="grinder-4-reads.qual" label="${tool.name} lib 4 quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
293 <filter>int(str(num_libraries)) >= 4 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
294 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
295 <data format="fastqsanger" name="fastq4" from_work_dir="grinder-4-reads.fastq" label="${tool.name} lib 4 reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
296 <filter>int(str(num_libraries)) >= 4 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
297 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
298
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
299 <!-- multiple libraries: library 5 -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
300 <data format="tabular" name="ranks5" from_work_dir="grinder-5-ranks.txt" label="${tool.name} lib 5 ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
301 <filter>int(str(num_libraries)) >= 5</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
302 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
303 <data format="fasta" name="fasta5" from_work_dir="grinder-5-reads.fa" label="${tool.name} lib 5 reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
304 <filter>int(str(num_libraries)) >= 5 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
305 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
306 <data format="qual" name="qual5" from_work_dir="grinder-5-reads.qual" label="${tool.name} lib 5 quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
307 <filter>int(str(num_libraries)) >= 5 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
308 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
309 <data format="fastqsanger" name="fastq5" from_work_dir="grinder-5-reads.fastq" label="${tool.name} lib 5 reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
310 <filter>int(str(num_libraries)) >= 5 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
311 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
312
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
313 <!-- multiple libraries: library 6 -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
314 <data format="tabular" name="ranks6" from_work_dir="grinder-6-ranks.txt" label="${tool.name} lib 6 ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
315 <filter>int(str(num_libraries)) >= 6</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
316 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
317 <data format="fasta" name="fasta6" from_work_dir="grinder-6-reads.fa" label="${tool.name} lib 6 reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
318 <filter>int(str(num_libraries)) >= 6 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
319 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
320 <data format="qual" name="qual6" from_work_dir="grinder-6-reads.qual" label="${tool.name} lib 6 quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
321 <filter>int(str(num_libraries)) >= 6 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
322 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
323 <data format="fastqsanger" name="fastq6" from_work_dir="grinder-6-reads.fastq" label="${tool.name} lib 6 reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
324 <filter>int(str(num_libraries)) >= 6 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
325 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
326
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
327 <!-- multiple libraries: library 7 -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
328 <data format="tabular" name="ranks7" from_work_dir="grinder-7-ranks.txt" label="${tool.name} lib 7 ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
329 <filter>int(str(num_libraries)) >= 7</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
330 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
331 <data format="fasta" name="fasta7" from_work_dir="grinder-7-reads.fa" label="${tool.name} lib 7 reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
332 <filter>int(str(num_libraries)) >= 7 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
333 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
334 <data format="qual" name="qual7" from_work_dir="grinder-7-reads.qual" label="${tool.name} lib 7 quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
335 <filter>int(str(num_libraries)) >= 7 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
336 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
337 <data format="fastqsanger" name="fastq7" from_work_dir="grinder-7-reads.fastq" label="${tool.name} lib 7 reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
338 <filter>int(str(num_libraries)) >= 7 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
339 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
340
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
341 <!-- multiple libraries: library 8 -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
342 <data format="tabular" name="ranks8" from_work_dir="grinder-8-ranks.txt" label="${tool.name} lib 8 ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
343 <filter>int(str(num_libraries)) >= 8</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
344 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
345 <data format="fasta" name="fasta8" from_work_dir="grinder-8-reads.fa" label="${tool.name} lib 8 reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
346 <filter>int(str(num_libraries)) >= 8 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
347 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
348 <data format="qual" name="qual8" from_work_dir="grinder-8-reads.qual" label="${tool.name} lib 8 quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
349 <filter>int(str(num_libraries)) >= 8 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
350 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
351 <data format="fastqsanger" name="fastq8" from_work_dir="grinder-8-reads.fastq" label="${tool.name} lib 8 reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
352 <filter>int(str(num_libraries)) >= 8 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
353 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
354
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
355 <!-- multiple libraries: library 9 -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
356 <data format="tabular" name="ranks9" from_work_dir="grinder-9-ranks.txt" label="${tool.name} lib 9 ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
357 <filter>int(str(num_libraries)) >= 9</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
358 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
359 <data format="fasta" name="fasta9" from_work_dir="grinder-9-reads.fa" label="${tool.name} lib 9 reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
360 <filter>int(str(num_libraries)) >= 9 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
361 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
362 <data format="qual" name="qual9" from_work_dir="grinder-9-reads.qual" label="${tool.name} lib 9 quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
363 <filter>int(str(num_libraries)) >= 9 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
364 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
365 <data format="fastqsanger" name="fastq9" from_work_dir="grinder-9-reads.fastq" label="${tool.name} lib 9 reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
366 <filter>int(str(num_libraries)) >= 9 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
367 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
368
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
369 <!-- multiple libraries: library 10 -->
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
370 <data format="tabular" name="ranks10" from_work_dir="grinder-10-ranks.txt" label="${tool.name} lib 10 ranks from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
371 <filter>int(str(num_libraries)) >= 10</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
372 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
373 <data format="fasta" name="fasta10" from_work_dir="grinder-10-reads.fa" label="${tool.name} lib 10 reads from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
374 <filter>int(str(num_libraries)) >= 10 and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
375 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
376 <data format="qual" name="qual10" from_work_dir="grinder-10-reads.qual" label="${tool.name} lib 10 quals from ${on_string}">
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
377 <filter>int(str(num_libraries)) >= 10 and str(qual_levels) and fastq_output == 0</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
378 </data>
8
43def9fa33b9 Grinder 0.4.0
fangly
parents: 7
diff changeset
379 <data format="fastqsanger" name="fastq10" from_work_dir="grinder-10-reads.fastq" label="${tool.name} lib 10 reads from ${on_string}">
6
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
380 <filter>int(str(num_libraries)) >= 10 and fastq_output == 1</filter>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
381 </data>
68576b1d2d8b Uploaded
fangly
parents: 5
diff changeset
382
5
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
383 </outputs>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
384
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
385 <tests>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
386 <!-- no tests since they would not always return the same results -->
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
387 <!--
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
388 <test>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
389 <param name="specify" value="uploaded" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
390 <param name="value" value="ngs_simulation_in1.fasta" ftype="fasta" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
391 <output name="ranks" file="" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
392 <output name="fasta" file="" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
393 <output name="qual" file="" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
394 </test>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
395
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
396 <test>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
397 <param name="specify" value="builtin" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
398 <param name="builtin" value="pUC18" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
399 <output name="ranks" file="" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
400 <output name="fasta" file="" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
401 <output name="qual" file="" />
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
402 </test>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
403 -->
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
404 </tests>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
405
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
406 <help>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
407
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
408 **What it does**
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
409
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
410 Grinder is a program to create random shotgun and amplicon sequence libraries
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
411 based on reference sequences in a FASTA file. Features include:
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
412
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
413 * shotgun library or amplicon library
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
414 * arbitrary read length distribution and number of reads
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
415 * simulation of PCR and sequencing errors (chimeras, point mutations, homopolymers)
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
416 * support for creating paired-end (mate pair) datasets
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
417 * specific rank-abundance settings or manually given abundance for each genome
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
418 * creation of datasets with a given richness (alpha diversity)
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
419 * independent datasets can share a variable number of genomes (beta diversity)
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
420 * modeling of the bias created by varying genome lengths or gene copy number
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
421 * profile mechanism to store preferred options
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
422 * API to automate the creation of a large number of simulated datasets
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
423
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
424
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
425 **Input**
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
426
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
427 A variety of FASTA databases containing genes or genomes can be used as input
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
428 for Grinder, such as the NCBI RefSeq collection (ftp://ftp.ncbi.nih.gov/refseq/release/microbial/),
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
429 the GreenGenes 16S rRNA database (http://greengenes.lbl.gov/Download/Sequence_Data/Fasta_data_files/Isolated_named_strains_16S_aligned.fasta), the human genome and transcriptome (ftp://ftp.ncbi.nih.gov/refseq/H_sapiens/RefSeqGene/, ftp://ftp.ncbi.nih.gov/refseq/H_sapiens/mRNA_Prot/human.rna.fna.gz), ...
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
430
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
431 These input files can either be provided as a Galaxy dataset, or can be uploaded
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
432 by Galaxy users in their history.
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
433
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
434
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
435 **Output**
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
436
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
437 For each library requested, a first file contains the abundance of the species
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
438 in the simulated community created, e.g.::
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
439
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
440 # rank seqID rel. abundance
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
441 1 86715_Lachnospiraceae 0.367936925098555
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
442 2 6439_Neisseria_polysaccharea 0.183968462549277
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
443 3 103712_Fusobacterium_nucleatum 0.122645641699518
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
444 4 103024_Frigoribacterium 0.0919842312746386
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
445 5 129066_Streptococcus_pyogenes 0.0735873850197109
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
446 6 106485_Pseudomonas_aeruginosa 0.0613228208497591
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
447 7 13824_Veillonella_criceti 0.0525624178712221
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
448 8 28044_Lactosphaera 0.0459921156373193
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
449
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
450 The second file is a FASTA file containing shotgun or amplicon reads, e.g.::
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
451
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
452 >1 reference=13824_Veillonella_criceti position=89-1088 strand=+
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
453 ACCAACCTGCCCTTCAGAGGGGGATAACAACGGGAAACCGTTGCTAATACCGCGTACGAA
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
454 TGGACTTCGGCATCGGAGTTCATTGAAAGGTGGCCTCTATTTATAAGCTATCGCTGAAGG
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
455 AGGGGGTTGCGTCTGATTAGCTAGTTGGAGGGGTAATGGCCCACCAAGGCAA
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
456
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
457 >2 reference=103712_Fusobacterium_nucleatum position=2-1001 strand=+
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
458 TGAACGAAGAGTTTGATCCTGGCTCAGGATGAACGCTGACAGAATGCTTAACACATGCAA
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
459 GTCAACTTGAATTTGGGTTTTTAACTTAGGTTTGGG
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
460
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
461 If you specify the quality score levels option, a third file representing the
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
462 quality scores of the reads is created::
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
463
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
464 >1 reference=103712_Fusobacterium_nucleatum position=2-1001 strand=+
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
465 30 30 30 10 30 30 ...
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
466
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
467
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
468 </help>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
469
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
470 </tool>
5ba7c9ac056a Uploaded
fangly
parents:
diff changeset
471