changeset 8:4fa9d5e748d4 draft

planemo upload for repository https://github.com/phac-nml/biohansel commit 759c65786566b73806fccaed05802fe01ec4226a
author nml
date Tue, 21 May 2019 15:05:40 -0400
parents 3360158bb0c5
children e305df0b1af7
files biohansel.xml test-data/SRR1002850_SMALL.fasta-match_results.tab test-data/SRR1002850_SMALL.fasta-results.tab test-data/SRR5646583_SMALL-match_results.tab test-data/SRR5646583_SMALL-results.tab test-data/SRR5646583_SMALL-tech_results.tab
diffstat 6 files changed, 34 insertions(+), 31 deletions(-) [+]
line wrap: on
line diff
--- a/biohansel.xml	Mon May 13 09:42:08 2019 -0400
+++ b/biohansel.xml	Tue May 21 15:05:40 2019 -0400
@@ -1,7 +1,7 @@
-<tool id="biohansel" name="biohansel" version="2.1.6">
+<tool id="biohansel" name="biohansel" version="2.2.0">
   <description>SNP subtyping of genome sequence reads or assemblies</description>
   <requirements>
-    <requirement type="package" version="2.1.1">bio_hansel</requirement>
+    <requirement type="package" version="2.2.0">bio_hansel</requirement>
   </requirements>
   <command detect_errors="exit_code">
 <![CDATA[
@@ -129,14 +129,14 @@
 #if $qc_vals.low_cov_depth_freq
   --low-cov-depth-freq $qc_vals.low_cov_depth_freq
 #end if
-#if $qc_vals.max_missing_tiles
-  --max-missing-tiles $qc_vals.max_missing_tiles
+#if $qc_vals.max_missing_kmers
+  --max-missing-kmers $qc_vals.max_missing_kmers
 #end if
-#if $qc_vals.min_ambiguous_tiles
-  --min-ambiguous-tiles $qc_vals.min_ambiguous_tiles
+#if $qc_vals.min_ambiguous_kmers
+  --min-ambiguous-kmers $qc_vals.min_ambiguous_kmers
 #end if
-#if $qc_vals.max_intermediate_tiles
-  --max-intermediate-tiles $qc_vals.max_intermediate_tiles
+#if $qc_vals.max_intermediate_kmers
+  --max-intermediate-kmers $qc_vals.max_intermediate_kmers
 #end if
 #if $qc_vals.low_coverage_warning
   --low-cov-warning $qc_vals.low_coverage_warning
@@ -200,6 +200,9 @@
           label="Included SNP Subtyping Scheme">
           <option value="heidelberg">Salmonella Heidelberg subtyping scheme</option>
           <option value="enteritidis">Salmonella Enteritidis subtyping scheme</option>
+          <option value="typhi">Salmonella Typhi subtyping scheme</option>
+          <option value="typhimurium">Salmonella Typhimurium subtyping scheme</option>
+          <option value="tb_speciation">Mycobacterium Tuberculosis subtyping scheme</option>
         </param>
       </when>
       <when value="custom">
@@ -237,28 +240,28 @@
         optional="true"
         label="QC: Frequency below this coverage are considered low coverage"
         help="default = 20"/>
-      <param name="min_ambiguous_tiles" type="integer"
-        argument="--min-ambiguous-tiles"
+      <param name="min_ambiguous_kmers" type="integer"
+        argument="--min-ambiguous-kmers"
         optional="true"
         value="3" min="0"
-        label="QC: Min number of tiles missing for Ambiguous Result"
+        label="QC: Min number of kmers missing for Ambiguous Result"
         help="default = 3"/>
-      <param name="max_missing_tiles" type="float"
-        argument="--max-missing-tiles"
+      <param name="max_missing_kmers" type="float"
+        argument="--max-missing-kmers"
         optional="true"
         value="0.05" min="0" max="1"
-        label="QC: Decimal Proportion of max allowed missing tiles" help="default = 0.05, valid values {0.0 - 1.0}"/>
-      <param name="max_intermediate_tiles" type="float"
-        argument="--max-intermediate-tiles"
+        label="QC: Decimal Proportion of max allowed missing kmers" help="default = 0.05, valid values {0.0 - 1.0}"/>
+      <param name="max_intermediate_kmers" type="float"
+        argument="--max-intermediate-kmers"
         optional="true"
         value="0.05" min="0" max="1"
-        label="QC: Decimal Proportion of max allowed missing tiles for an intermediate subtype"
+        label="QC: Decimal Proportion of max allowed missing kmers for an intermediate subtype"
         help="default = 0.05, valid values {0.0 - 1.0}"/> 
       <param name="low_coverage_warning" type="integer"
         argument="--low-cov-warning"
         optional="true"
         value="20"
-        label="QC: Overall tile coverage below this value will trigger a low coverage warning"
+        label="QC: Overall kmer coverage below this value will trigger a low coverage warning"
         help="default = 20"/> 
     </section>
     <section name="dev_args" title="Developer Options" expanded="False">
@@ -342,11 +345,11 @@
 **Usage**
 
 1) Select the sequence data you wish to subtype (FASTAs or FASTQs)
-2) Select subtyping scheme (e.g. *Salmonella enterica* serovar Heidelberg subtyping scheme, *Salmonella enterica* serovar Enteritidis subtyping scheme, or your own custom `biohansel` compatible subtyping scheme)
+2) Select subtyping scheme (e.g. *Salmonella enterica* serovar Heidelberg, Enteritidis, Typhimurium, or Typhi subtyping scheme, or your own custom `biohansel` compatible subtyping scheme)
 3) [Optional] Select your subtype metadata information table to include subtype metadata along with your subtype results
 4) Click ``Execute``
 
-For more information, visit `the biohansel project page <https://github.com/phac-nml/biohansel>`_.
+For more information, visit `the biohansel project page <https://github.com/phac-nml/biohansel>`_ or the `biohansel read the docs page <https://bio-hansel.readthedocs.io/en/readthedocs/>`_.
 
 
 **Example analysis results of a single FASTA file**
@@ -354,7 +357,7 @@
 Contents of ``results.tab``:
 
     +------------------+------------+----------------+-------------+------------------------------------------------+---------------------------------------------------------------+-------------------------+-----------------------+----------------------+-------------------------------+---------------------------+------------------------------------+--------------------------+-----------------------------------+------------------------+-----------+------------+
-    | sample           | scheme     | scheme_version | subtype     | all_subtypes                                   | tiles_matching_subtype                                        | are_subtypes_consistent | inconsistent_subtypes | n_tiles_matching_all | n_tiles_matching_all_expected | n_tiles_matching_positive | n_tiles_matching_positive_expected | n_tiles_matching_subtype | n_tiles_matching_subtype_expected | file_path              | qc_status | qc_message |
+    | sample           | scheme     | scheme_version | subtype     | all_subtypes                                   | kmers_matching_subtype                                        | are_subtypes_consistent | inconsistent_subtypes | n_kmers_matching_all | n_kmers_matching_all_expected | n_kmers_matching_positive | n_kmers_matching_positive_expected | n_kmers_matching_subtype | n_kmers_matching_subtype_expected | file_path              | qc_status | qc_message |
     +------------------+------------+----------------+-------------+------------------------------------------------+---------------------------------------------------------------+-------------------------+-----------------------+----------------------+-------------------------------+---------------------------+------------------------------------+--------------------------+-----------------------------------+------------------------+-----------+------------+
     | SRR1002850_SMALL | heidelberg | 0.5.0          | 2.2.2.2.1.4 | 2; 2.2; 2.2.2; 2.2.2.2; 2.2.2.2.1; 2.2.2.2.1.4 | 2154958-2.2.2.2.1.4; 1037658-2.2.2.2.1.4; 3785187-2.2.2.2.1.4 | True                    |                       | 202                  | 202                           | 17                        | 17                                 | 3                        | 3                                 | SRR1002850_SMALL.fasta | PASS      |            |
     +------------------+------------+----------------+-------------+------------------------------------------------+---------------------------------------------------------------+-------------------------+-----------------------+----------------------+-------------------------------+---------------------------+------------------------------------+--------------------------+-----------------------------------+------------------------+-----------+------------+
@@ -363,7 +366,7 @@
 Contents of ``match_results.tab``:
 
     +---------------------------+-----------------------------------+------------+---------------------------------------+-------------+-------------+-------------+-------------+------------------+------------------------+------------+----------------+-----------+------------+
-    | tilename                  | seq                               | is_revcomp | contig_id                             | match_index | refposition | subtype     | is_pos_tile | sample           | file_path              | scheme     | scheme_version | qc_status | qc_message |
+    | kmername                  | seq                               | is_revcomp | contig_id                             | match_index | refposition | subtype     | is_pos_kmer | sample           | file_path              | scheme     | scheme_version | qc_status | qc_message |
     +---------------------------+-----------------------------------+------------+---------------------------------------+-------------+-------------+-------------+-------------+------------------+------------------------+------------+----------------+-----------+------------+
     | 2154958-2.2.2.2.1.4       | GGCGCGCCACGGTTACTCCCCGGTGGTCAGCCG | True       | NODE_1_length_726282_cov_40.4705_ID_1 | 13732       | 2154958     | 2.2.2.2.1.4 | True        | SRR1002850_SMALL | SRR1002850_SMALL.fasta | heidelberg | 0.5.0          | PASS      |            |
     +---------------------------+-----------------------------------+------------+---------------------------------------+-------------+-------------+-------------+-------------+------------------+------------------------+------------+----------------+-----------+------------+
@@ -380,7 +383,7 @@
 Contents of ``results.tab``:
 
     +------------------+------------+----------------+-------------+------------------------------------------------+------------------------------------------+-------------------------+-----------------------+----------------------+-------------------------------+---------------------------+------------------------------------+--------------------------+-----------------------------------+----------------------------------------------------------+-------------------+-----------+------------+
-    | sample           | scheme     | scheme_version | subtype     | all_subtypes                                   | tiles_matching_subtype                   | are_subtypes_consistent | inconsistent_subtypes | n_tiles_matching_all | n_tiles_matching_all_expected | n_tiles_matching_positive | n_tiles_matching_positive_expected | n_tiles_matching_subtype | n_tiles_matching_subtype_expected | file_path                                                | avg_tile_coverage | qc_status | qc_message |
+    | sample           | scheme     | scheme_version | subtype     | all_subtypes                                   | kmers_matching_subtype                   | are_subtypes_consistent | inconsistent_subtypes | n_kmers_matching_all | n_kmers_matching_all_expected | n_kmers_matching_positive | n_kmers_matching_positive_expected | n_kmers_matching_subtype | n_kmers_matching_subtype_expected | file_path                                                | avg_kmer_coverage | qc_status | qc_message |
     +------------------+------------+----------------+-------------+------------------------------------------------+------------------------------------------+-------------------------+-----------------------+----------------------+-------------------------------+---------------------------+------------------------------------+--------------------------+-----------------------------------+----------------------------------------------------------+-------------------+-----------+------------+
     | SRR5646583_SMALL | heidelberg | 0.5.0          | 2.2.1.1.1.1 | 2; 2.2; 2.2.1; 2.2.1.1; 2.2.1.1.1; 2.2.1.1.1.1 | 1983064-2.2.1.1.1.1; 4211912-2.2.1.1.1.1 | True                    |                       | 202                  | 202                           | 20                        | 20                                 | 2                        | 2                                 | ['SRR5646583_SMALL_1.fastq', 'SRR5646583_SMALL_2.fastq'] | 42.631            | PASS      |            |
     +------------------+------------+----------------+-------------+------------------------------------------------+------------------------------------------+-------------------------+-----------------------+----------------------+-------------------------------+---------------------------+------------------------------------+--------------------------+-----------------------------------+----------------------------------------------------------+-------------------+-----------+------------+
@@ -388,7 +391,7 @@
 Contents of ``match_results.tab``:
 
     +---------------------+-----------------------------------+------+-------------+-----------+-------------+-------------------+------------------+------------+----------------+-----------+------------+
-    | tilename            | seq                               | freq | refposition | subtype   | is_pos_tile | is_kmer_freq_okay | sample           | scheme     | scheme_version | qc_status | qc_message |
+    | kmername            | seq                               | freq | refposition | subtype   | is_pos_kmer | is_kmer_freq_okay | sample           | scheme     | scheme_version | qc_status | qc_message |
     +---------------------+-----------------------------------+------+-------------+-----------+-------------+-------------------+------------------+------------+----------------+-----------+------------+
     | negative4642573-1.2 | TACCAGGAAGTGCTGGAAGAGTTTAACGAACAT | 62   | 4642573     | 1.2       | False       | True              | SRR5646583_SMALL | heidelberg | 0.5.0          | PASS      |            |
     +---------------------+-----------------------------------+------+-------------+-----------+-------------+-------------------+------------------+------------+----------------+-----------+------------+
@@ -424,8 +427,8 @@
   <citations>
     <citation type="bibtex">@ARTICLE{a1,
       title = {A robust genotyping scheme for Salmonella enterica serovar Heidelberg clones circulating in North America},
-      author = {Geneviève Labbé, James Robertson, Peter Kruczkiewicz, Marisa Rankin, Matthew Gopez, Chad R. Laing, Philip Mabon, Kim Ziebell, Aleisha R. Reimer, Lorelee Tschetter, Gary Van Domselaar, Sadjia Bekal, Kimberley A. MacDonald, Linda Hoang, Linda Chui, Danielle Daignault, Durda Slavic, Frank Pollari, E. Jane Parmley, Elissa Giang, Lok Kan Lee, Jonathan Moffat, Joanne MacKinnon, Roger Johnson, John H.E. Nash},
-      url = {https://github.com/phac-nml/bio_hansel}
+      author = {Geneviève Labbé, James Robertson, Peter Kruczkiewicz, Marisa Rankin, Matthew Gopez, Chad R. Laing, Philip Mabon, Kim Ziebell, Aleisha R. Reimer, Lorelee Tschetter, Gary Van Domselaar, Sadjia Bekal, Kimberley A. MacDonald, Linda Hoang, Linda Chui, Danielle Daignault, Durda Slavic, Frank Pollari, E. Jane Parmley, David Son, Darian Hole, Elissa Giang, Lok Kan Lee, Jonathan Moffat, Joanne MacKinnon, Roger Johnson, John H.E. Nash},
+      url = {https://github.com/phac-nml/biohansel}
       }
     }</citation>
   </citations>
--- a/test-data/SRR1002850_SMALL.fasta-match_results.tab	Mon May 13 09:42:08 2019 -0400
+++ b/test-data/SRR1002850_SMALL.fasta-match_results.tab	Tue May 21 15:05:40 2019 -0400
@@ -1,4 +1,4 @@
-tilename	seq	is_revcomp	contig_id	match_index	refposition	subtype	is_pos_tile	sample	file_path	scheme	scheme_version	qc_status	qc_message
+kmername	seq	is_revcomp	contig_id	match_index	refposition	subtype	is_pos_kmer	sample	file_path	scheme	scheme_version	qc_status	qc_message
 2154958-2.2.2.2.1.4	GGCGCGCCACGGTTACTCCCCGGTGGTCAGCCG	True	NODE_1_length_726282_cov_40.4705_ID_1	13732	2154958	2.2.2.2.1.4	True	SRR1002850_SMALL	SRR1002850_SMALL.fasta	heidelberg	0.5.0	PASS	
 negative2131791-2.2.3.1.3	GCTGGGCGAAATGATGCAGTTCACCACTTGCTC	True	NODE_1_length_726282_cov_40.4705_ID_1	36900	2131791	2.2.3.1.3	False	SRR1002850_SMALL	SRR1002850_SMALL.fasta	heidelberg	0.5.0	PASS	
 2069216-2.2.2	ATACTTAGGCTGTCAGTAACCCGTGAGGTAGTG	True	NODE_1_length_726282_cov_40.4705_ID_1	99475	2069216	2.2.2	True	SRR1002850_SMALL	SRR1002850_SMALL.fasta	heidelberg	0.5.0	PASS	
--- a/test-data/SRR1002850_SMALL.fasta-results.tab	Mon May 13 09:42:08 2019 -0400
+++ b/test-data/SRR1002850_SMALL.fasta-results.tab	Tue May 21 15:05:40 2019 -0400
@@ -1,2 +1,2 @@
-sample	scheme	scheme_version	subtype	all_subtypes	tiles_matching_subtype	are_subtypes_consistent	inconsistent_subtypes	n_tiles_matching_all	n_tiles_matching_all_expected	n_tiles_matching_positive	n_tiles_matching_positive_expected	n_tiles_matching_subtype	n_tiles_matching_subtype_expected	file_path	qc_status	qc_message
+sample	scheme	scheme_version	subtype	all_subtypes	kmers_matching_subtype	are_subtypes_consistent	inconsistent_subtypes	n_kmers_matching_all	n_kmers_matching_all_expected	n_kmers_matching_positive	n_kmers_matching_positive_expected	n_kmers_matching_subtype	n_kmers_matching_subtype_expected	file_path	qc_status	qc_message
 SRR1002850_SMALL	heidelberg	0.5.0	2.2.2.2.1.4	2; 2.2; 2.2.2; 2.2.2.2; 2.2.2.2.1; 2.2.2.2.1.4	2154958-2.2.2.2.1.4; 1037658-2.2.2.2.1.4; 3785187-2.2.2.2.1.4	True		202	202	17	17	3	3	SRR1002850_SMALL.fasta	PASS	
--- a/test-data/SRR5646583_SMALL-match_results.tab	Mon May 13 09:42:08 2019 -0400
+++ b/test-data/SRR5646583_SMALL-match_results.tab	Tue May 21 15:05:40 2019 -0400
@@ -1,4 +1,4 @@
-tilename	seq	freq	refposition	subtype	is_pos_tile	is_kmer_freq_okay	sample	scheme	scheme_version	qc_status	qc_message
+kmername	seq	freq	refposition	subtype	is_pos_kmer	is_kmer_freq_okay	sample	scheme	scheme_version	qc_status	qc_message
 negative4642573-1.2	TACCAGGAAGTGCTGGAAGAGTTTAACGAACAT	62	4642573	1.2	False	True	SRR5646583_SMALL	heidelberg	0.5.0	PASS	
 21097-2.2.1.1.1	GCAAATCGCGCCAGTCAAGTCCTCTTTTACCGT	42	21097	2.2.1.1.1	True	True	SRR5646583_SMALL	heidelberg	0.5.0	PASS	
 negative3647258-2.2.2.2.2.1	TACGGGTAACTGTTATCGGTAACATTGTCCAAC	64	3647258	2.2.2.2.2.1	False	True	SRR5646583_SMALL	heidelberg	0.5.0	PASS	
--- a/test-data/SRR5646583_SMALL-results.tab	Mon May 13 09:42:08 2019 -0400
+++ b/test-data/SRR5646583_SMALL-results.tab	Tue May 21 15:05:40 2019 -0400
@@ -1,2 +1,2 @@
-sample	scheme	scheme_version	subtype	all_subtypes	tiles_matching_subtype	are_subtypes_consistent	inconsistent_subtypes	n_tiles_matching_all	n_tiles_matching_all_expected	n_tiles_matching_positive	n_tiles_matching_positive_expected	n_tiles_matching_subtype	n_tiles_matching_subtype_expected	file_path	avg_tile_coverage	qc_status	qc_message
+sample	scheme	scheme_version	subtype	all_subtypes	kmers_matching_subtype	are_subtypes_consistent	inconsistent_subtypes	n_kmers_matching_all	n_kmers_matching_all_expected	n_kmers_matching_positive	n_kmers_matching_positive_expected	n_kmers_matching_subtype	n_kmers_matching_subtype_expected	file_path	avg_kmer_coverage	qc_status	qc_message
 SRR5646583_SMALL	heidelberg	0.5.0	2.2.1.1.1.1	2; 2.2; 2.2.1; 2.2.1.1; 2.2.1.1.1; 2.2.1.1.1.1	1983064-2.2.1.1.1.1; 4211912-2.2.1.1.1.1	True		202	202	20	20	2	2	['SRR5646583_SMALL_1.fastq', 'SRR5646583_SMALL_2.fastq']	42.631	PASS	
--- a/test-data/SRR5646583_SMALL-tech_results.tab	Mon May 13 09:42:08 2019 -0400
+++ b/test-data/SRR5646583_SMALL-tech_results.tab	Tue May 21 15:05:40 2019 -0400
@@ -1,2 +1,2 @@
-sample	subtype	avg_tile_coverage	qc_status	qc_message
+sample	subtype	avg_kmer_coverage	qc_status	qc_message
 SRR5646583_SMALL	2.2.1.1.1.1	42.631	PASS