changeset 0:2fe2d2b9e8e4 draft

Uploaded tool tarball.
author devteam
date Wed, 25 Sep 2013 11:07:38 -0400
parents
children 8192b4014977
files fastx_clipper.xml test-data/fastx_clipper1.fastq test-data/fastx_clipper1a.out tool-data/fastx_clipper_sequences.txt.sample tool_dependencies.xml
diffstat 5 files changed, 192 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/fastx_clipper.xml	Wed Sep 25 11:07:38 2013 -0400
@@ -0,0 +1,117 @@
+<tool id="cshl_fastx_clipper" name="Clip" version="1.0.1" >
+  <description>adapter sequences</description>
+  <requirements>
+      <requirement type="package" version="0.0.13">fastx_toolkit</requirement>
+  </requirements>
+  <command>
+    zcat -f $input | fastx_clipper -l $minlength -a $clip_source.clip_sequence -d $keepdelta -o $output -v $KEEP_N $DISCARD_OPTIONS
+#if $input.ext == "fastqsanger":
+ -Q 33
+#end if
+  </command>
+  
+  <inputs>
+    <param format="fasta,fastqsanger,fastqsolexa,fastqillumina" name="input" type="data" label="Library to clip" />
+  
+    <param name="minlength" size="4" type="integer" value="15">
+      <label>Minimum sequence length (after clipping, sequences shorter than this length will be discarded)</label>
+    </param>
+
+	<conditional name="clip_source">
+		<param name="clip_source_list" type="select" label="Source">
+			<option value="prebuilt" selected="true">Standard (select from the list below)</option>
+			<option value="user">Enter custom sequence</option>
+		</param>
+
+		<when value="user">
+			<param name="clip_sequence" size="30" label="Enter custom clipping sequence" type="text" value="AATTGGCC" />
+		</when>
+
+		<when value="prebuilt">
+			<param name="clip_sequence" type="select" label="Choose Adapter">
+				<options from_file="fastx_clipper_sequences.txt">
+					<column name="name" index="1"/>
+					<column name="value" index="0"/>
+				</options>
+			</param> 
+		</when>
+	</conditional>
+
+	<param name="keepdelta" size="2" type="integer" value="0">
+		<label>enter non-zero value to keep the adapter sequence and x bases that follow it</label>
+		<help>use this for hairpin barcoding. keep at 0 unless you know what you're doing.</help>
+	</param>
+
+	<param name="KEEP_N" type="select" label="Discard sequences with unknown (N) bases">
+		<option value="">Yes</option>
+		<option value="-n">No</option>
+	</param>
+
+	<param name="DISCARD_OPTIONS" type="select" label="Output options">
+		<option value="-c">Output only clipped sequences (i.e. sequences which contained the adapter)</option>
+		<option value="-C">Output only non-clipped sequences (i.e. sequences which did not contained the adapter)</option>
+		<option value="">Output both clipped and non-clipped sequences</option>
+	</param>
+
+  </inputs>
+	<!--
+	#functional test with param value starting with - fails.	
+	-->
+	<tests>
+		<test>
+			<param name="input" value="fastx_clipper1.fastq" ftype="fastqsolexa"/>
+			<param name="maxmismatches" value="2" />
+			<param name="minlength" value="15" />
+			<param name="clip_source_list" value="user" />
+			<param name="clip_sequence" value="CAATTGGTTAATCCCCCTATATA" />
+			<param name="keepdelta" value="0" />
+			<param name="KEEP_N" value="+-n" />
+			<param name="DISCARD_OPTIONS" value="+-c" />
+			<output name="output" file="fastx_clipper1a.out" />
+		</test>
+	</tests>
+  <outputs>
+    <data format="input" name="output" metadata_source="input" />
+  </outputs>
+  
+<help>
+**What it does**
+
+This tool clips adapters from the 3'-end of the sequences in a FASTA/FASTQ file.
+
+--------
+
+
+**Clipping Illustration:**
+
+.. image:: ${static_path}/fastx_icons/fastx_clipper_illustration.png 
+ 
+ 
+ 
+ 
+ 
+ 
+ 
+
+**Clipping Example:**
+
+.. image:: ${static_path}/fastx_icons/fastx_clipper_example.png 
+
+
+    
+**In the above example:**
+
+* Sequence no. 1 was discarded since it wasn't clipped (i.e. didn't contain the adapter sequence). (**Output** parameter).
+* Sequence no. 5 was discarded --- it's length (after clipping) was shorter than 15 nt (**Minimum Sequence Length** parameter).
+
+
+
+
+------
+
+This tool is based on `FASTX-toolkit`__ by Assaf Gordon.
+
+ .. __: http://hannonlab.cshl.edu/fastx_toolkit/
+ 
+</help>
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/fastx_clipper1.fastq	Wed Sep 25 11:07:38 2013 -0400
@@ -0,0 +1,36 @@
+@CSHL_3_FC042AGLLWW:1:2:7:203
+GTACGCATGACCGAACCCCCCNCCCCCCAATTGGTT
++CSHL_3_FC042AGLLWW:1:2:7:203
+aab^V^aU]`aa^aZaaabbXEZabaaaaaaaa]]`
+@CSHL_3_FC042AGLLWW:1:2:7:33
+CAATGCCTCCAATTGGTTAATCCCCCTATATATACT
++CSHL_3_FC042AGLLWW:1:2:7:33
+Waaa^aZaaW^U_XaWaa\WMEP^KEZXRPEEEGaa
+@CSHL_3_FC042AGLLWW:1:2:7:169
+GCAGCAGGCGCGTCAGAGAGCCCCCCCCCCCCCCCC
++CSHL_3_FC042AGLLWW:1:2:7:169
+a_M^a\Uaaa_M_aaaaaaaaaaaaaaaV\ZUGUUR
+@CSHL_3_FC042AGLLWW:1:2:7:1436
+AATTATTTATTAAATTTTAATAATATGGGAGACACT
++CSHL_3_FC042AGLLWW:1:2:7:1436
+a^aaaaaaaaaaaaaaa_U`aaaaa_S_aaaaaVV[
+@CSHL_3_FC042AGLLWW:1:2:7:292
+GGAGAAATACACACAATTGGTTAATCCCCCTATATA
++CSHL_3_FC042AGLLWW:1:2:7:292
+babaaaaaaaUMaaaaaaaaaaa\XEUUEP_]UERE
+@CSHL_3_FC042AGLLWW:1:2:7:1819
+AATTCAAACCACCCCAACCCACACACAGAGATACAA
++CSHL_3_FC042AGLLWW:1:2:7:1819
+a\\QVVVLaaLOEXUWUUEKUULEMUEUUKULIQMU
+@CSHL_3_FC042AGLLWW:1:2:7:1875
+GCAAAAGAGTAGTGTACCCCCCCCCCCCCCCCCCCC
++CSHL_3_FC042AGLLWW:1:2:7:1875
+aaaaaaaaaXUXXEXaaaaa`_ZaaaaaaaaaXEXU
+@CSHL_3_FC042AGLLWW:1:2:8:624
+ACTGCAATTGGTTAATCCCCCTATATAGCGCTGTGG
++CSHL_3_FC042AGLLWW:1:2:8:624
+aa[S^`X`aa_]]OOXMU^_[MU_aaaaaaaaaaaa
+@CSHL_3_FC042AGLLWW:1:2:8:250
+TGCCGCGCACACTGATGCAATTGGTTAATCCCCCTA
++CSHL_3_FC042AGLLWW:1:2:8:250
+aaaaaaaa^aaaaaabbb[KXPEU[RXZ^JUKRKXE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/fastx_clipper1a.out	Wed Sep 25 11:07:38 2013 -0400
@@ -0,0 +1,20 @@
+@CSHL_3_FC042AGLLWW:1:2:7:203
+GTACGCATGACCGAACCCCCCNCCCCC
++CSHL_3_FC042AGLLWW:1:2:7:203
+aab^V^aU]`aa^aZaaabbXEZabaa
+@CSHL_3_FC042AGLLWW:1:2:7:169
+GCAGCAGGCGCGTCAGAGAGCCCCCCCCCCCCCCC
++CSHL_3_FC042AGLLWW:1:2:7:169
+a_M^a\Uaaa_M_aaaaaaaaaaaaaaaV\ZUGUU
+@CSHL_3_FC042AGLLWW:1:2:7:1819
+AATTCAAACCACCCCAACCCACACACAGAGATA
++CSHL_3_FC042AGLLWW:1:2:7:1819
+a\\QVVVLaaLOEXUWUUEKUULEMUEUUKULI
+@CSHL_3_FC042AGLLWW:1:2:7:1875
+GCAAAAGAGTAGTGTACCCCCCCCCCCCCCCCCCC
++CSHL_3_FC042AGLLWW:1:2:7:1875
+aaaaaaaaaXUXXEXaaaaa`_ZaaaaaaaaaXEX
+@CSHL_3_FC042AGLLWW:1:2:8:250
+TGCCGCGCACACTGATG
++CSHL_3_FC042AGLLWW:1:2:8:250
+aaaaaaaa^aaaaaabb
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/fastx_clipper_sequences.txt.sample	Wed Sep 25 11:07:38 2013 -0400
@@ -0,0 +1,13 @@
+#
+# Adapter/Linker sequences for FASTX-Clipper tool.
+#
+# Format:
+#    Adapter Sequence <TAB> Descriptive name
+#
+# Example:
+#     AAATTTGATAAGATA   Our-Adapter
+#
+# Some adapters can be found here:
+# http://seqanswers.com/forums/showthread.php?t=198
+#
+#TGTAGGCC	Dummy-Adapter (don't use me)
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_dependencies.xml	Wed Sep 25 11:07:38 2013 -0400
@@ -0,0 +1,6 @@
+<?xml version="1.0"?>
+<tool_dependency>
+    <package name="fastx_toolkit" version="0.0.13">
+        <repository changeset_revision="ec66ae4c269b" name="package_fastx_toolkit_0_0_13" owner="devteam" toolshed="http://toolshed.g2.bx.psu.edu" />
+    </package>
+</tool_dependency>