Repository 'mageck_count'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/mageck_count

Changeset 1:4d72d204dcfa (2018-02-17)
Previous changeset 0:b80c0e046539 (2018-02-14) Next changeset 2:9527a3d6ebd2 (2018-04-04)
Commit message:
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/mageck commit 2eea865fe331694058922292e5681b96f4f0b4c7
modified:
mageck_count.xml
test-data/out.count.bam.txt
test-data/out.count.fastq.txt
b
diff -r b80c0e046539 -r 4d72d204dcfa mageck_count.xml
--- a/mageck_count.xml Wed Feb 14 06:42:18 2018 -0500
+++ b/mageck_count.xml Sat Feb 17 10:41:26 2018 -0500
[
b'@@ -1,5 +1,5 @@\n <?xml version="1.0"?>\n-<tool id="mageck_count" name="MAGeCK count" version="@VERSION@" >\n+<tool id="mageck_count" name="MAGeCK count" version="@VERSION@.1" >\n     <description>- collect sgRNA read counts from read mapping files</description>\n     <macros>\n         <import>mageck_macros.xml</import>\n@@ -30,16 +30,16 @@\n #if str($reads.format_select) == "files":\n     --fastq $infile\n     -l \'$reads.sgrna_library_file\'\n-#if $reads.sample_label:\n-    --sample-label \'$reads.sample_label\'\n-#end if\n-\n+    #if $reads.sample_label:\n+        --sample-label \'$reads.sample_label\'\n+    #else:\n+        --sample-label \'$reads.sample.element_identifier\'\n+    #end if\n #elif str($reads.format_select) == "table":\n     -k \'$reads.counts\'\n     #if \'$sgrna_library_file\':\n         -l \'$sgrna_library_file\'\n     #end if\n-\n #end if\n \n -n output\n@@ -54,13 +54,21 @@\n #if $adv.trim5:\n    --trim-5 $adv.trim5\n #end if\n+\n --norm-method $adv.norm_method\n+\n #if $adv.control_sgrna:\n     --control-sgrna $adv.control_sgrna\n #end if\n---sgrna-len $adv.sgrna_len\n+\n+#if $adv.sgrna_len:\n+    --sgrna-len $adv.sgrna_len\n+#end if\n+\n $adv.count_n\n+\n $adv.reverse_complement\n+\n $adv.test_run\n \n #if $adv.gmt_file:\n@@ -81,7 +89,7 @@\n             <when value="files">\n                 <param name="sample" argument="--fastq" type="data" format="fastq,fastq.gz,bam" multiple="false" label="Sample reads" help="The input reads must be in FASTQ, FASTQ.GZ or BAM format and all files must be in the same format." />\n                 <param name="sgrna_library_file" type="data" argument="--list-seq" format="txt,tabular,tsv,csv" label="sgRNA library file" help="A library file must be provided with three columns containing the sgRNA ID, sequence, and gene it is targeting, see Help below for more information." />\n-                <param name="sample_label" argument="--sample-label" type="text" optional="true" value="" label="Sample label" help="Optionally, you can specify a sample label to use in the output file header."/>\n+                <param name="sample_label" argument="--sample-label" type="text" optional="true" value="" label="Specify sample label" help="By default, the input filename will be used as the sample label. Optionally you can specify a different sample label to use."/>\n             </when>\n             <when value="table">\n                 <param name="counts" argument="-k"  type="data" format="tabular" optional="true" label="Counts Table" help="Alternatively, a tab-separated file of read counts can be used as input. See Help below for format" />\n@@ -94,12 +102,12 @@\n             <param name="pdfreportOpt" argument="--pdf-report" type="boolean" truevalue="--pdf-report" falsevalue="" checked="false" optional="true" label="Output PDF report" help="Generate pdf report of the input file. Default: No" />\n             <param name="unmappedOpt" argument="--unmapped-to-file" type="boolean" truevalue="--unmapped-to-file" falsevalue="" checked="false" optional="true" label="Output unmapped reads" help="Save unmapped reads to file. Default: No" />\n             <param name="rscriptOpt" type="boolean" truevalue="True" falsevalue="" checked="false" optional="true" label="Output R script" help="Output the R script used to generate the plots in the pdf report. Default: No" />\n-            <param name="logOpt" type="boolean" truevalue="True" falsevalue="" checked="false" label="Output logfile" help="This file includes the logging information, it will list some basic statistics of the dataset at the end" />\n+            <param name="logOpt" type="boolean" truevalue="True" falsevalue="" checked="false" label="Output Log file" help="This file includes the logging information, it will list some basic statistics of the dataset at the end" />\n         </section>\n \n         <section name="adv" title="Advanced Options">\n             <param name="gmt_file" argument="--gmt-file" type="data" format="tabular" optional="true" value="" label="Pathway file for QC" help="TThe pathway fi'..b'" />\n             <param name="count_n" argument="--count-n" type="boolean" truevalue="--count-n" falsevalue="" checked="false" optional="true" label="Count sgRNAs with Ns" help="By default, sgRNAs containing Ns will be discarded" />\n-            <param name="reverse_complement" argument="--reverse-complement" type="boolean" truevalue="--reverse-complement" falsevalue="" checked="false" optional="true" label="Reverse complement the sequences in library for read mapping" />\n+            <param name="reverse_complement" argument="--reverse-complement" type="boolean" truevalue="--reverse-complement" falsevalue="" checked="false" optional="true" label="Reverse complement" help="Reverse complement the sequences in library for read mapping" />\n             <param name="test_run" argument="--test-run" type="boolean" truevalue="--test-run" falsevalue="" checked="false" optional="true" label="Test running" help="If this option is on, MAGeCK will only process the first 1M records for each file" />\n         </section>\n     </inputs>\n@@ -125,19 +133,12 @@\n         <data name="unmapped" format="tabular" from_work_dir="*.unmapped.txt" label="${tool.name} on ${on_string}: Unmapped" >\n             <filter>out[\'unmappedOpt\'] is True</filter>\n         </data>\n-        <data name="log" format="txt" from_work_dir="*.log" label="${tool.name} on ${on_string}: Log" >\n+        <data name="log" format="txt" from_work_dir="output.log" label="${tool.name} on ${on_string}: Log" >\n             <filter>out[\'logOpt\'] is True</filter>\n         </data>\n     </outputs>\n \n     <tests>\n-        <!-- Ensure fastq works -->\n-        <test expect_num_outputs="1">\n-            <param name="sgrna_library_file" value="demo/demo2/library.txt" ftype="tabular" />\n-            <param name="format_select" value="files" />\n-            <param name="sample" value="demo/demo2/test1.fastq" ftype="fastq"/>\n-            <output name="counts" file="out.count.fastq.txt"/>\n-        </test>\n         <!-- Ensure fastq.gz input works -->\n         <test expect_num_outputs="1">\n             <param name="sgrna_library_file" value="demo/demo2/library.txt" ftype="tabular" />\n@@ -145,6 +146,14 @@\n             <param name="sample" value="test1.fastq.gz" ftype="fastq.gz"/>\n             <output name="counts" file="out.count.fastq.txt"/>\n         </test>\n+        <!-- Ensure fastq input works -->\n+        <test expect_num_outputs="1">\n+            <param name="sgrna_library_file" value="demo/demo2/library.txt" ftype="tabular" />\n+            <param name="format_select" value="files" />\n+            <param name="sample" value="demo/demo2/test1.fastq" ftype="fastq"/>\n+            <param name="sample_label" value="test1.fastq.gz" />\n+            <output name="counts" file="out.count.fastq.txt"/>\n+        </test>\n         <!-- Ensure BAM input works -->\n         <test expect_num_outputs="1">\n             <param name="sgrna_library_file" value="demo/demo2/library.txt" ftype="tabular" />\n@@ -181,7 +190,17 @@\n \n **Inputs**\n \n-By default, MAGeCK count command will automatically determine the trimming length of the fastq file.\n+**Read file(s)**\n+\n+**MAGeCK count** accepts one or more FASTQ.GZ, FASTQ or BAM files as input.\n+\n+Since version 0.5.5, MAGeCK count module supports collecting read counts from BAM files. This will allow you to use a third-party aligner to map reads to the library with mismatches, providing more usable reads for the analysis. However, it is still recommended to directly use the fastq file in the count module (which does not allow any mismatches), because:\n+\n+* Some mismatches in the sgRNAs may have unwanted behaviors (have no on-target cleavages or have other off-target cleavages);\n+* In most cases the read counts are enough if we allow no mismatches;\n+* The mapping procedure is more complicated; for example, you need to know the exact length of 3\' adapter sequence.\n+\n+It is also possible to input a Count Table to normalize counts and get statistics.\n \n **sgRNA library file**\n \n'
b
diff -r b80c0e046539 -r 4d72d204dcfa test-data/out.count.bam.txt
--- a/test-data/out.count.bam.txt Wed Feb 14 06:42:18 2018 -0500
+++ b/test-data/out.count.bam.txt Sat Feb 17 10:41:26 2018 -0500
b
@@ -1,4 +1,4 @@
-sgRNA Gene sample1
+sgRNA Gene test1.bam
 s_10007 CCNA1 0
 s_10008 CCNA1 0
 s_10027 CCNC 0
b
diff -r b80c0e046539 -r 4d72d204dcfa test-data/out.count.fastq.txt
--- a/test-data/out.count.fastq.txt Wed Feb 14 06:42:18 2018 -0500
+++ b/test-data/out.count.fastq.txt Sat Feb 17 10:41:26 2018 -0500
b
@@ -1,4 +1,4 @@
-sgRNA Gene sample1
+sgRNA Gene test1.fastq.gz
 s_47512 RNF111 1
 s_24835 HCFC1R1 1
 s_14784 CYP4B1 4