Repository 'stacks'
hg clone https://toolshed.g2.bx.psu.edu/repos/avowinkel/stacks

Changeset 0:af879fc0d734 (2015-06-26)
Next changeset 1:228d0cbc14f9 (2015-06-29)
Commit message:
Uploaded
added:
process_radtags.xml
process_radtags_macros.xml
process_radtags_rename.sh
test-data/barcodes.tbl
test-data/input-se-inline.fastqsanger
tool_dependencies.xml
b
diff -r 000000000000 -r af879fc0d734 process_radtags.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/process_radtags.xml Fri Jun 26 16:48:45 2015 -0400
[
b'@@ -0,0 +1,252 @@\n+<?xml version="1.0"?>\n+<tool id="process_radtags" name="process_radtags" version="0.1.0">\n+\n+    <description>from Stacks toolbox</description>\n+\n+    <macros>\n+        <import>process_radtags_macros.xml</import>\n+    </macros>\n+\n+    <requirements>\n+        <requirement type="package" version="1.32">stacks</requirement>\n+    </requirements>\n+\n+    <command>\n+    <![CDATA[\n+\n+    mkdir output &&\n+\n+    process_radtags\n+    \n+    #if $analysis_type.analysis_type_select == \'se\'\n+        -f ${analysis_type.fastq_input1}\n+    #elif $analysis_type.analysis_type_select == \'pe\'\n+        -1 ${analysis_type.fastq_input1}\n+        -2 ${analysis_type.fastq_input2}\n+    #end if\n+\n+    -b ${barcode_file}\n+    -o output\n+\n+    #if $analysis_type.fastq_input1.is_of_type(\'fastqsanger\')\n+        -E "phred33"\n+    #elif $analysis_type.fastq_input1.is_of_type(\'fastqillumina\')\n+        -E "phred64"\n+    #end if\n+\n+    #if $double_digest.double_digest_enabled\n+        --renz_1 ${enzyme}\n+        --renz_2 ${double_digest.enzyme}\n+    #else\n+        -e ${enzyme}\n+    #end if\n+    \n+    ${c} ${q} ${r}\n+\n+    #if $t > 0\n+        -t ${t}\n+    #end if\n+    -w ${w}\n+    -s ${s}\n+\n+    -D\n+\n+    #if $analysis_type.adapter_options.adapter_options_enabled\n+        #if $analysis_type.analysis_type_select == \'se\'\n+            --adapter_1 ${$analysis_type.adapter_options.adapter_1}\n+        #elif $analysis_type.analysis_type_select == \'pe\'\n+            --adapter_1 ${$analysis_type.adapter_options.adapter_1}\n+            --adapter_2 ${$analysis_type.adapter_options.adapter_2}\n+        #end if\n+        --adapter_mm ${$analysis_type.adapter_options.adapter_mm}\n+    #end if\n+\n+    #if $advanced_options.advanced_options_enabled\n+        ${advanced_options.filter_illumina}\n+        ${advanced_options.disable_rad_check}\n+        --barcode_dist_1 ${advanced_options.barcode_dist}\n+    #end if\n+\n+    > ${log_file} 2>&1 &&\n+\n+    bash $__tool_directory__/process_radtags_rename.sh ${analysis_type.fastq_input1.ext}\n+\n+    ]]>\n+    </command>\n+\n+    <inputs>\n+        <conditional name="analysis_type">\n+            <param name="analysis_type_select" type="select" label="Analysis type">\n+                <option value="se" selected="true">Single End Reads</option>\n+                <option value="pe">Paired End Reads (NOT IMPLEMENTED)</option>\n+            </param>\n+\n+            <when value="se">\n+                <param name="fastq_input1" type="data" format="fasta,fastqsanger,fastqillumina" label="Select the fastq/a file" help="Specify fastq/a file with reads"/>\n+                \n+                <param name="barcode_type" type="select" label="Barcode type">\n+                    <option value="--inline_null">inline barcode</option>\n+                    <option value="--index_null">barcode in header</option>\n+                </param>\n+\n+                <expand macro="macro_adapter_options_se"/>\n+            </when>\n+\n+            <when value="pe">\n+                <param name="fastq_input1" type="data" format="fasta,fastqsanger,fastqillumina" label="Select first fastq/a file" help="Specify fastq/a file with forward reads"/>\n+                <param name="fastq_input2" type="data" format="fasta,fastqsanger,fastqillumina" label="Select second fastq/a file" help="Specify fastq/a file with reverse reads"/>\n+\n+                <param name="barcode_type" type="select" label="Barcode type">\n+                    <option value="--inline_inline">inline barcode</option>\n+                    <option value="--index_index">barcode in header</option>\n+                    <option value="--inline_index">forward read: inline; reverse read: header</option>\n+                    <option value="--index_inline">forward read: header; reverse read: inline</option>\n+                </param>\n+\n+                <expand macro="macro_adapter_options_pe"/>\n+            </when>\n+        </conditional>\n+        \n+        <param name="barcode_file" type="data" format="tabular" label="Select t'..b"[\n+\n+**Tool website (with examples)**:\n+\n+http://catchenlab.life.illinois.edu/stacks/comp/process_radtags.php\n+\n+----\n+\n+**Tool help output**::\n+\n+    process_radtags 1.32\n+    process_radtags [-f in_file | -p in_dir [-P] [-I] | -1 pair_1 -2 pair_2] -b barcode_file -o out_dir -e enz [-c] [-q] [-r] [-t len] [-D] [-w size] [-s lim] [-h]\n+    f: path to the input file if processing single-end sequences.\n+    i: input file type, either 'bustard' for the Illumina BUSTARD format, 'bam', 'fastq' (default), or 'gzfastq' for gzipped FASTQ.\n+    y: output type, either 'fastq', 'gzfastq', 'fasta', or 'gzfasta' (default is to match the input file type).\n+    p: path to a directory of files.\n+    P: files contained within directory specified by '-p' are paired.\n+    I: specify that the paired-end reads are interleaved in single files.\n+    1: first input file in a set of paired-end sequences.\n+    2: second input file in a set of paired-end sequences.\n+    o: path to output the processed files.\n+    b: path to a file containing barcodes for this run.\n+    c: clean data, remove any read with an uncalled base.\n+    q: discard reads with low quality scores.\n+    r: rescue barcodes and RAD-Tags.\n+    t: truncate final read length to this value.\n+    E: specify how quality scores are encoded, 'phred33' (Illumina 1.8+, Sanger, default) or 'phred64' (Illumina 1.3 - 1.5).\n+    D: capture discarded reads to a file.\n+    w: set the size of the sliding window as a fraction of the read length, between 0 and 1 (default 0.15).\n+    s: set the score limit. If the average score within the sliding window drops below this value, the read is discarded (default 10).\n+    h: display this help messsage.\n+\n+    Barcode options:\n+    --inline_null:   barcode is inline with sequence, occurs only on single-end read (default).\n+    --index_null:    barcode is provded in FASTQ header, occurs only on single-end read.\n+    --inline_inline: barcode is inline with sequence, occurs on single and paired-end read.\n+    --index_index:   barcode is provded in FASTQ header, occurs on single and paired-end read.\n+    --inline_index:  barcode is inline with sequence on single-end read, occurs in FASTQ header for paired-end read.\n+    --index_inline:  barcode occurs in FASTQ header for single-end read, is inline with sequence on paired-end read.\n+\n+    Restriction enzyme options:\n+    -e <enz>, --renz_1 <enz>: provide the restriction enzyme used (cut site occurs on single-end read)\n+    --renz_2 <enz>: if a double digest was used, provide the second restriction enzyme used (cut site occurs on the paired-end read).\n+    Currently supported enzymes include:\n+      'aluI', 'apeKI', 'apoI', 'bamHI', 'bgIII', 'bstYI', 'claI', 'ddeI', \n+      'dpnII', 'eaeI', 'ecoRI', 'ecoRV', 'ecoT22I', 'hindIII', 'kpnI', 'mluCI', \n+      'mseI', 'mspI', 'ndeI', 'nheI', 'nlaIII', 'notI', 'nsiI', 'pstI', \n+      'rsaI', 'sacI', 'sau3AI', 'sbfI', 'sexAI', 'sgrAI', 'speI', 'sphI', \n+      'taqI', 'xbaI', or 'xhoI'\n+    Adapter options:\n+    --adapter_1 <sequence>: provide adaptor sequence that may occur on the single-end read for filtering.\n+    --adapter_2 <sequence>: provide adaptor sequence that may occur on the paired-read for filtering.\n+      --adapter_mm <mismatches>: number of mismatches allowed in the adapter sequence.\n+\n+    Output options:\n+    --merge: if no barcodes are specified, merge all input files into a single output file.\n+\n+    Advanced options:\n+    --filter_illumina: discard reads that have been marked by Illumina's chastity/purity filter as failing.\n+    --disable_rad_check: disable checking if the RAD site is intact.\n+    --len_limit &lt;limit&gt;: specify a minimum sequence length (useful if your data has already been trimmed).\n+    --barcode_dist_1: the number of allowed mismatches when rescuing single-end barcodes (default 1).\n+    --barcode_dist_2: the number of allowed mismatches when rescuing paired-end barcodes (defaults to --barcode_dist_1).\n+\n+]]>\n+    </help>\n+</tool>\n"
b
diff -r 000000000000 -r af879fc0d734 process_radtags_macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/process_radtags_macros.xml Fri Jun 26 16:48:45 2015 -0400
b
@@ -0,0 +1,108 @@
+<macros>
+    
+    <token name="@OUTPUT_NAME_PREFIX@">${tool.name}</token>
+
+    <xml name="macro_enzyme_selector">
+        <param name="enzyme" type="select" label="Select Enzyme">
+            <option value="aluI">aluI</option>
+            <option value="apeKI">apeKI</option>
+            <option value="apoI">apoI</option>
+            <option value="bamHI">bamHI</option>
+            <option value="bgIII">bgIII</option>
+            <option value="bstYI">bstYI</option>
+            <option value="claI">claI</option>
+            <option value="ddeI">ddeI</option>
+            <option value="dpnII">dpnII</option>
+            <option value="eaeI">eaeI</option>
+            <option value="ecoRI">ecoRI</option>
+            <option value="ecoRV">ecoRV</option>
+            <option value="ecoT22I">ecoT22I</option>
+            <option value="hindIII">hindIII</option>
+            <option value="kpnI">kpnI</option>
+            <option value="mluCI">mluCI</option>
+            <option value="mseI">mseI</option>
+            <option value="mspI">mspI</option>
+            <option value="ndeI">ndeI</option>
+            <option value="nheI">nheI</option>
+            <option value="nlaIII">nlaIII</option>
+            <option value="notI">notI</option>
+            <option value="nsiI">nsiI</option>
+            <option value="pstI">pstI</option>
+            <option value="rsaI">rsaI</option>
+            <option value="sacI">sacI</option>
+            <option value="sau3AI">sau3AI</option>
+            <option value="sbfI">sbfI</option>
+            <option value="sexAI">sexAI</option>
+            <option value="sgrAI">sgrAI</option>
+            <option value="speI">speI</option>
+            <option value="sphI">sphI</option>
+            <option value="taqI">taqI</option>
+            <option value="xbaI">xbaI</option>
+            <option value="xhoI">xhoI</option>
+        </param>
+    </xml>
+
+    <xml name="macro_enzyme_selector2">
+        <param name="enzyme2" type="select" label="Select Second Enzyme (on reverse end only)">
+            <option value="aluI">aluI</option>
+            <option value="apeKI">apeKI</option>
+            <option value="apoI">apoI</option>
+            <option value="bamHI">bamHI</option>
+            <option value="bgIII">bgIII</option>
+            <option value="bstYI">bstYI</option>
+            <option value="claI">claI</option>
+            <option value="ddeI">ddeI</option>
+            <option value="dpnII">dpnII</option>
+            <option value="eaeI">eaeI</option>
+            <option value="ecoRI">ecoRI</option>
+            <option value="ecoRV">ecoRV</option>
+            <option value="ecoT22I">ecoT22I</option>
+            <option value="hindIII">hindIII</option>
+            <option value="kpnI">kpnI</option>
+            <option value="mluCI">mluCI</option>
+            <option value="mseI">mseI</option>
+            <option value="mspI">mspI</option>
+            <option value="ndeI">ndeI</option>
+            <option value="nheI">nheI</option>
+            <option value="nlaIII">nlaIII</option>
+            <option value="notI">notI</option>
+            <option value="nsiI">nsiI</option>
+            <option value="pstI">pstI</option>
+            <option value="rsaI">rsaI</option>
+            <option value="sacI">sacI</option>
+            <option value="sau3AI">sau3AI</option>
+            <option value="sbfI">sbfI</option>
+            <option value="sexAI">sexAI</option>
+            <option value="sgrAI">sgrAI</option>
+            <option value="speI">speI</option>
+            <option value="sphI">sphI</option>
+            <option value="taqI">taqI</option>
+            <option value="xbaI">xbaI</option>
+            <option value="xhoI">xhoI</option>
+        </param>
+    </xml>
+
+    <xml name="macro_adapter_options_se">
+        <expand macro="macro_adapter_options">
+            <param name="adapter_1" type="text" label="provide adaptor sequence that may occur on the read for filtering" />
+        </expand>
+    </xml>
+
+    <xml name="macro_adapter_options_pe">
+        <expand macro="macro_adapter_options">
+            <param name="adapter_1" type="text" label="provide adaptor sequence that may occur on the single-end read for filtering" />
+            <param name="adapter_2" type="text" label="provide adaptor sequence that may occur on the paired-read for filtering" />
+        </expand>
+    </xml>
+
+    <xml name="macro_adapter_options">
+        <conditional name="adapter_options">
+            <param name="adapter_options_enabled" type="boolean" label="Specify adapter options?" />
+            <when value="true">
+                <yield />
+                <param name="adapter_mm" type="integer" value="1" size="2" label="number of mismatches allowed in the adapter sequence" />
+            </when>
+            <when value="false" />
+        </conditional>
+    </xml>
+</macros>
b
diff -r 000000000000 -r af879fc0d734 process_radtags_rename.sh
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/process_radtags_rename.sh Fri Jun 26 16:48:45 2015 -0400
b
@@ -0,0 +1,10 @@
+#!/bin/bash
+
+EXT=$1
+
+mv output/process_radtags.log output/Report.log
+mv output/*.discards output/Discards.${EXT}.discards
+mkdir splits
+mv output/sample_* splits
+#ls -lah output splits
+for i in splits/*.fq; do mv "$i" "${i/.fq}".${EXT}; done
b
diff -r 000000000000 -r af879fc0d734 test-data/barcodes.tbl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/barcodes.tbl Fri Jun 26 16:48:45 2015 -0400
b
@@ -0,0 +1,9 @@
+TAGCAG
+CCTTGCCATT
+ACTGCGAT
+GCAAGCCAT
+AACGTGCCT
+GAAGTG
+TCTTGG
+AACTGG
+ATGAGCAA
b
diff -r 000000000000 -r af879fc0d734 test-data/input-se-inline.fastqsanger
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/input-se-inline.fastqsanger Fri Jun 26 16:48:45 2015 -0400
b
@@ -0,0 +1,44 @@
+@HWI-ST397:425:C563WACXX:1:1101:3568:2226 1:N:0:
+CCACTCATGCATAGAGAGTGCTGACATAGAGCAACAGATTTTAAGTTCCTTATTACTTTGCTAAGCCTAGTGGCATTGTTGGAATTTCAGCACTAGAATGG
++
+@@@DDBD;DDACFH@GDD3A?<@@AFIGCEH@3CDCFIIGIIEBHFIGGHG9FC@FHIIHEEFIFFHHGG=CCEGCHBECHFEEED;C@DCCCC:CCCCCA
+@HWI-ST397:425:C563WACXX:1:1101:3702:2227 1:N:0:
+TAGCAGTGCATTGCACAATTGTAGCTTAGGGTTGCTTATGTGATAGTTCTATTATGATGATATGATCTTGGTATGTAATTATGCAAGATCGGAAGAGCGGT
++
+@CCFFFFFHHHHHJJJJJJJJHJJJJJJIJJFHIIIJIJIBFDHEHIIGJGIJFIIGIJIJJJJIJJJJJJHIIJJHGJJJJJJJJHHHHHFFFDEEEDDB
+@HWI-ST397:425:C563WACXX:1:1101:3652:2228 1:N:0:
+ACTGCGATTGCATTCCCAAAATCAAAAGAGTGGGATCATGCAAGATCGGAAGAGCGGTTCAGCAGGAATGCCGAGACCGATCTCGTATGCCGTCTTCTGCT
++
+@B@FDFFFHHHHHJJIJIIJJJJJJJJIGG:EGGGJJJCGEHIJIGGGIIIGAEEGIAHHFHG@DDBE:@CEDBDBDBDD><BCBDDCDDDD9@<BCCCCD
+@HWI-ST397:425:C563WACXX:1:1101:3631:2229 1:N:0:
+CCTTGCCATTTGCATTGCTGAGTGTTTCAGTTTTTTATGCAAGATCGGAAGAGCGGTTCAGCAGGAATGCCGAGACCGATCTCGTATGCCGTCTTCTGCTT
++
+CCCFFFFFHHHHGJJJJJJJIJFEEJJJJJIIIIJJIIJJJJIJJJJJGGGHJFJJ5AEHHJHHHFFFFFFDDDDDBDB@BDDDBDDDDDD>BDDAC@CCC
+@HWI-ST397:425:C563WACXX:1:1101:3672:2229 1:N:0:
+GCAAGCCATTGCATGACTACTTAACGGGGGGATTCACCGCAAATACTACCTTGGCTCATTATTGCCGAGATAATGGTCTACTTCTTCACATCCACCGTGCA
++
+@@@FFFFFHHGHHJIJJJJJJJIJIJIJJJDBBDDDDDDDDDDDDDDDDDDDCCDCDDDEEEEDDDDBD>BDDDDCCCDDDEDDDDDDDCCDDDCDDDDDD
+@HWI-ST397:425:C563WACXX:1:1101:3742:2234 1:N:0:
+GCAAGCCATTGCATGAATTTTTCCTCTTGCAATGTATGAATTTTTTCCAGCAATGCAAGATCGGAAGAGCGGTTCAGCAGGAATGCCGAGACCGATCTCGT
++
+CCCFFFFFHHHHHJJJJJJJJJJJJJJJJJHJJJHIIJJJJJJJJJIJJJJJJJJJJJJIJJJJIJJJJDHF@DDECEEDDDDDDDDDDDDB@BBDDDDDD
+@HWI-ST397:425:C563WACXX:1:1101:3538:2245 1:N:0:
+GGAAGACATTGCATGTCCTTTTGATGAGATTGATGTAAATGAAGTTAGGGATGCAAGATCGGAAGAGCGGTTCAGCAGGAATGCCGAGACCGATCTCGTAT
++
+CCCFFFFFHHHHHJJHIJJJJJJIJJJJIJJJIJJGGGJJJIIJIIEIJJIGIHIJJJJJJJIJJJJJJJBHFFFEFFDDEEDDDDDBD:?BBDDDDDDDC
+@HWI-ST397:425:C563WACXX:1:1101:3974:2048 1:N:0:
+NACGTGCCTTGCATTGTTTGGTTTGATCCATTAAAAATAGAATGCAAGATCGGAAGAGCGGTTCAGCAGGAATGCCGAGACCGATCTCGTATGCCGTCTTC
++
+#1=DDDDFHHHHFJJJHIJIJFGHIIIJJJJIIIIJJEIIIJGIGIJJIGDGIGIGGHGII;AAEHEFFFFECECCBDBB?<B35>DDB??ACDDB0<AB:
+@HWI-ST397:425:C563WACXX:1:1101:3920:2053 1:N:0:
+NAAGTGTGCATCAACTATCTCAAACACAATTTGTATCCAAAACCATCATTCTAACATGCAAGGATCAATATATGACATCTCATTACTCACAGCCGACCATG
++
+#1=DDFDFHHHHHJJJJJJJJIJJJJJJJJJJJGIIJJIIJJJJJJJIJJIJJJJIJJJJJJJGIJJJJJJJJJIHJJHHHHHHFFFFFFEEDDDDDDDDD
+@HWI-ST397:425:C563WACXX:1:1101:3945:2061 1:Y:0:
+NCTTGGTGCATCAAAAACTCCGGGATCCTCGGGGCAAATGAAAGATCGGAAGAGCGGTTCAGCAGGAATGCCGAGACCGATCTCGTATGCCGTCTTCTGCT
++
+#08@9@@@@@@??########################################################################################
+@HWI-ST397:425:C563WACXX:1:1101:3801:2062 1:N:0:
+NACTGGTGCATGTATTAGTTATGTAGGATTTAGTAATGCAGGGTTTAATTATGCAAGTATTAGTTATGCAAGATCGGAAGAGCGGTTCAGCAGGAATGCCG
++
+#1:DDDFFHHHFFIIIEGCEEFHEEHGGFEHIICFHHGHEHGG1CFGGEHIGDHIIIBEHIIIGGHIIIIIIGGGFHIGFFHEDC=ABCCCCBB?B@CCC@
b
diff -r 000000000000 -r af879fc0d734 tool_dependencies.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_dependencies.xml Fri Jun 26 16:48:45 2015 -0400
b
@@ -0,0 +1,6 @@
+<?xml version="1.0"?>
+<tool_dependency>
+    <package name="stacks" version="1.32">
+        <repository changeset_revision="1e53d7d44ed6" name="package_stacks_1_32" owner="avowinkel" toolshed="https://toolshed.g2.bx.psu.edu" />
+    </package>
+</tool_dependency>