annotate khmer_load_into_counting.xml @ 1:f491d18251e9 draft

planemo upload
author jowong
date Mon, 26 Nov 2018 02:14:27 -0500
parents 69d52f45c2fa
children ab0f91be3a90
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
f491d18251e9 planemo upload
jowong
parents: 0
diff changeset
1 <tool id="khmer_load_into_counting" name="Load Into Counting" version="1.0.5">
0
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
2 <description>Creates k-mer countgraph using reads</description>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
3 <requirements>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
4 <requirement type="package" version="2.1.2">khmer</requirement>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
5 </requirements>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
6 <command detect_errors="exit_code"><![CDATA[
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
7 load-into-counting.py
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
8 $advanced.b
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
9 $advanced.small
1
f491d18251e9 planemo upload
jowong
parents: 0
diff changeset
10 -k $kmer
0
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
11 -U $advanced.ukmer -T $advanced.thread
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
12 #if str( $advanced.max_mem ) != "0"
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
13 -M $advanced.max_mem
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
14 #end if
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
15 #if str( $advanced.fp_rate ) != "0"
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
16 --fp-rate $advanced.fp_rate
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
17 #end if
1
f491d18251e9 planemo upload
jowong
parents: 0
diff changeset
18 -N $advanced.num_table
f491d18251e9 planemo upload
jowong
parents: 0
diff changeset
19 -x $advanced.table_size
0
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
20 hash.ct.gz
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
21 #if str( $data_input.data_selector ) == "paired"
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
22 $data_input.input1.forward $data_input.input1.reverse
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
23 #end if
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
24 #if str( $data_input.data_selector ) == "single"
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
25 $data_input.input2
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
26 #end if
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
27 ]]></command>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
28 <inputs>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
29 <conditional name="data_input">
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
30 <param name="data_selector" type="select" label="Single or Paired-end Data" help="Select between paired and single end data to add name to dataset">
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
31 <option value="paired">Paired</option>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
32 <option value="single">Single</option>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
33 </param>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
34 <when value="paired">
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
35 <param name="input1" format="data" type="data_collection" collection_type="paired" label="Select a paired collection" help="a paired data"/>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
36 </when>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
37 <when value="single">
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
38 <param name="input2" format="data" type="data" label="input" help="Specify dataset with single reads"/>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
39 </when>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
40 </conditional>
1
f491d18251e9 planemo upload
jowong
parents: 0
diff changeset
41 <param name="kmer" type="integer" value="32" label="K-mer" help="K-mer size to use (default: 32)" />
0
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
42 <section name="advanced" title="Advanced options" expanded="false">
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
43 <param type="boolean" argument="--small" label="Small count" checked="false" truevalue="--small-count" falsevalue="" help="Reduce memory usage by using a smaller counter for individual kmers. (default: False)"/>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
44 <param type="boolean" argument="-b" label="big count" checked="true" truevalue="" falsevalue="--no-bigcount" help="Count k-mers past 255 using bigcount. Unchecking this passes -b/--no-bigcount, which limits counts to 255. (default: True)"/>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
45 <param name="thread" type="integer" value="1" label="Threads" help="Number of simultaneous threads to execute (default: 1)" />
1
f491d18251e9 planemo upload
jowong
parents: 0
diff changeset
46
0
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
47 <param name="ukmer" type="integer" value="0" label="Unique K-mer" help="approximate number of unique kmers in the input set (default: 0)" />
1
f491d18251e9 planemo upload
jowong
parents: 0
diff changeset
48 <param name="num_table" type="integer" value="1" label="Number of tables" help="number of tables to use (default: 1)" />
f491d18251e9 planemo upload
jowong
parents: 0
diff changeset
49 <param name="table_size" type="integer" value="1000000000" label="Maximum size of table" help="maximum size of tables to use (default: 1000000000)" />
0
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
50 <param name="max_mem" type="integer" value="0" label="Maximum Memory" help="maximum amount of memory to use for data structure (0 = no limit passed; -M is omitted)" />
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
<!-- NOTE(review): this is declared as an integer, so only whole numbers can be entered; a false-positive rate is presumably fractional. TODO confirm whether type="float" is intended. The command template skips the option when str(value) is "0", so that test must be revisited if the type changes. -->
51 <param name="fp_rate" type="integer" value="0" label="FP rate override" help="Override the automatic FP rate setting for the current script" />
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
52 </section>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
53 </inputs>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
54 <outputs>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
55 <data name="hash_output" label="Hash output" format="data" from_work_dir="hash.ct.gz"/>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
56 </outputs>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
57 <help><![CDATA[
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
58 || This is the script load-into-counting.py in khmer.
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
59 || You are running khmer version 2.1.2
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
60 || You are also using screed version 1.0
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
61 ||
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
62 || If you use this script in a publication, please cite EACH of the following:
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
63 ||
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
64 || * MR Crusoe et al., 2015. http://dx.doi.org/10.12688/f1000research.6924.1
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
65 || * Q Zhang et al., http://dx.doi.org/10.1371/journal.pone.0101271
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
66 || * A. Döring et al. http://dx.doi.org:80/10.1186/1471-2105-9-11
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
67 ||
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
68 || Please see http://khmer.readthedocs.io/en/latest/citations.html for details.
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
69
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
70 usage: load-into-counting.py [--version] [--info] [-h] [-k KSIZE]
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
71 [-U UNIQUE_KMERS] [--fp-rate FP_RATE]
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
72 [-M MAX_MEMORY_USAGE] [--small-count]
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
73 [-T THREADS] [-b] [-s FORMAT] [-f] [-q]
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
74 output_countgraph_filename
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
75 input_sequence_filename
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
76 [input_sequence_filename ...]
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
77
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
78 Build a k-mer countgraph from the given sequences.
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
79
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
80 positional arguments:
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
81 output_countgraph_filename
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
82 The name of the file to write the k-mer countgraph to.
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
83 input_sequence_filename
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
84 The names of one or more FAST[AQ] input sequence
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
85 files.
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
86
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
87 optional arguments:
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
88 --version show program's version number and exit
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
89 --info print citation information
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
90 -h, --help show this help message and exit
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
91 -k KSIZE, --ksize KSIZE
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
92 k-mer size to use (default: 32)
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
93 -U UNIQUE_KMERS, --unique-kmers UNIQUE_KMERS
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
94 approximate number of unique kmers in the input set
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
95 (default: 0)
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
96 --fp-rate FP_RATE Override the automatic FP rate setting for the current
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
97 script (default: None)
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
98 -M MAX_MEMORY_USAGE, --max-memory-usage MAX_MEMORY_USAGE
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
99 maximum amount of memory to use for data structure
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
100 (default: None)
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
101 --small-count Reduce memory usage by using a smaller counter for
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
102 individual kmers. (default: False)
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
103 -T THREADS, --threads THREADS
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
104 Number of simultaneous threads to execute (default: 1)
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
105 -b, --no-bigcount The default behaviour is to count past 255 using
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
106 bigcount. This flag turns bigcount off, limiting
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
107 counts to 255. (default: True)
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
108 -s FORMAT, --summary-info FORMAT
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
109 What format should the machine readable run summary be
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
110 in? (`json` or `tsv`, disabled by default) (default:
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
111 None)
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
112 -f, --force Overwrite output file if it exists (default: False)
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
113 -q, --quiet
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
114
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
115 Note: with `-b`/`--no-bigcount` the output will be the exact size of the k-mer
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
116 countgraph and this script will use a constant amount of memory. In exchange
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
117 k-mer counts will stop at 255. The memory usage of this script with `-b` will
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
118 be about 1.15x the product of the `-x` and `-N` numbers.
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
119
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
120 Example:
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
121
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
122 load-into-counting.py -k 20 -x 5e7 out data/100k-filtered.fa
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
123
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
124 Multiple threads can be used to accelerate the process, if you have extra cores
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
125 to spare.
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
126
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
127 Example:
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
128
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
129 load-into-counting.py -k 20 -x 5e7 -T 4 out data/100k-filtered.fa
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
130
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
131
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
132 ]]></help>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
133 <citations>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
134 <citation type="bibtex">
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
135 @misc{githubkhmer,
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
136 author = {Crusoe, Michael},
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
137 year = {2015},
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
138 title = {khmer},
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
139 publisher = {GitHub},
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
140 journal = {GitHub repository},
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
141 url = {https://github.com/dib-lab/khmer},
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
142 }</citation>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
143 </citations>
69d52f45c2fa planemo upload
jowong
parents:
diff changeset
144 </tool>