Repository 'hifiasm_meta'
hg clone https://toolshed.g2.bx.psu.edu/repos/galaxy-australia/hifiasm_meta

Changeset 0:6b86c86eab26 (2023-01-12)
Next changeset 1:15dbb444df71 (2023-01-18)
Commit message:
planemo upload for repository https://github.com/usegalaxy-au/tools-au commit 64c69504c3c9d78544ff708c1c8c819981913a7d
added:
hifiasm_meta.xml
macros.xml
test-data/asm.a_ctg.gfa
test-data/asm.p_ctg.gfa
test-data/zymoD6331std-ecoli-ten-percent.42.1.fq.gz
b
diff -r 000000000000 -r 6b86c86eab26 hifiasm_meta.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/hifiasm_meta.xml Thu Jan 12 23:07:53 2023 +0000
[
@@ -0,0 +1,104 @@
+<tool id="hifiasm_meta" name="Hifiasm_meta" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@" license="MIT">
+    <description>for metagenome assembly using Hifi reads.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+    <expand macro="requirements"/>
+    <command detect_errors="exit_code"><![CDATA[
+        ##################
+        ## SET UP FILES ##
+        ##################
+
+        #set reads_fn = 'reads.' + $reads.ext
+        ln -s '$reads' '$reads_fn' &&
+
+        #################
+        ## RUN HIFIASM ##
+        #################
+
+        hifiasm_meta 
+        --lowq-10 '$read_selection.lowq_10'
+        --lowq-3 '$read_selection.lowq_3'
+        --lowq-5 '$read_selection.lowq_5'
+        -a '$assembly.a'
+        -k '$overlap_correction.k'
+        -o asm
+        -r '$overlap_correction.r'
+        #if '$read_selection.S':
+            -S
+        #end if
+        -t \${GALAXY_SLOTS:-4}
+        '$reads_fn'
+
+    ]]></command>
+    <inputs>
+        <!-- fastq files (could be a repeat or a collection) -->
+        <param name="reads" format="fastqsanger,fastqsanger.gz" type="data" label="HiFi reads" help="Input reads for assembly" />
+        <section name="read_selection" title="Read selection" expanded="false">
+            <param argument='-S' type="boolean" checked="true" label="Enable read selection" help="If enabled, hifiasm_meta will estimate the total number of read overlaps." />
+            <param argument='--lowq-10' type="integer" value='50' label="lower 10% runtime kmer frequency threshold." />
+            <param argument='--lowq-5' type="integer" value='50' label="lower 5% runtime kmer frequency threshold." />
+            <param argument='--lowq-3' type="integer" value='10' label="lower 3% runtime kmer frequency threshold." />
+        </section>
+        <section name="overlap_correction" title="Overlap/Error correction" expanded="false">
+            <param argument='-k' type="integer" value='51' min="1" max="63" label="k-mer length" />
+            <param argument='-r' type="integer" value='3' min="1" max="10" label="rounds of correction" />
+        </section>
+        <section name="assembly" title="Assembly" expanded="false">
+            <param argument='-a' type="integer" value='4' min="1" max="10" label="rounds of assembly cleaning" />
+        </section>
+    </inputs>
+    <outputs>
+        <!-- contig graph files -->
+        <collection name="contig_graphs" type="list" label="hifiasm_meta on ${on_string}: contig graphs">
+            <data name="Alternate contigs" label="Alternate contigs" from_work_dir="asm.a_ctg.gfa" format="gfa2" />
+            <data name="Primary contigs" label="Primary contigs" from_work_dir="asm.p_ctg.gfa" format="gfa2" />
+        </collection>
+        <!-- unitig graph files -->
+        <collection name="unitig_graphs" type="list" label="hifiasm_meta on ${on_string}: unitig graphs">
+            <data name="Raw unitigs" label="Raw unitigs" from_work_dir="asm.r_utg.gfa" format="gfa2" />
+            <data name="Processed unitigs" label="Processed unitigs" from_work_dir="asm.p_utg.gfa" format="gfa2" />
+        </collection>
+        <!-- Simplified graphs for visualisation -->
+        <collection name="simple_graphs" type="list" label="hifiasm_meta on ${on_string}: graphs for visualisation">
+            <discover_datasets pattern="(?P&lt;designation&gt;.+)\.noseq.gfa" format="gfa2" visible="false" />
+        </collection>
+    </outputs>
+    <tests>
+        <!-- 01: basic function -->
+        <test>
+            <param name="reads" value="zymoD6331std-ecoli-ten-percent.42.1.fq.gz" />
+            <param name='S' value="False" />
+            <param name='r' value="1" />
+            <output_collection name="contig_graphs" type="list">
+                <element name="Primary contigs" file="asm.p_ctg.gfa"/>
+                <element name="Alternate contigs" file="asm.a_ctg.gfa"/>
+            </output_collection>
+        </test>
+    </tests>
+        <help><![CDATA[
+hifiasm_meta
+------------
+
+de novo metagenome assembler, based on hifiasm, a haplotype-resolved de novo assembler for PacBio Hifi reads.
+
+
+Hifiasm is an ultrafast haplotype-resolved de novo assembler for PacBio
+Hifi reads. Unlike most existing assemblers, hifiasm starts from uncollapsed
+genome. Thus, it is able to keep the haplotype information as much as possible.
+The input of hifiasm is the PacBio Hifi reads in fasta/fastq format, and its
+outputs consist of multiple types of assembly graph in GFA format.
+
+Hifiasm_meta is a fork of hifiasm. It comes with a read selection module, which
+enables the assembly of dataset of high redundancy without compromising overall
+assembly quality, and meta-centric graphcleaning modules. Currently hifiasm_meta 
+does not take bining info.
+
+--------------
+
+hifiasm_meta's home page is
+`xfengnefx/hifiasm-meta <https://github.com/xfengnefx/hifiasm-meta>`__.
+
+This tool was wrapped by the Galaxy Australia team.
+        ]]></help>
+</tool>
\ No newline at end of file
b
diff -r 000000000000 -r 6b86c86eab26 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Thu Jan 12 23:07:53 2023 +0000
b
@@ -0,0 +1,11 @@
+<macros>
+    <token name="@TOOL_VERSION@">hamtv0.3</token>
+    <token name="@VERSION_SUFFIX@">0</token>
+    <token name="@PROFILE@">22.05</token>
+    <xml name="requirements">
+        <requirements>
+            <requirement type="package" version="@TOOL_VERSION@">hifiasm_meta</requirement>
+        </requirements>
+    </xml>
+    <!-- no citation or bio.tools id yet! -->
+</macros>
b
diff -r 000000000000 -r 6b86c86eab26 test-data/asm.p_ctg.gfa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/asm.p_ctg.gfa Thu Jan 12 23:07:53 2023 +0000
b
b'@@ -0,0 +1,7 @@\n+S\ts0.ctg000001l\tGCGACCTGTGATGCTCTGGTTCAGGCGCACGGCGCGTTGAAAGGGTTGGCTGCGTCACTGATGAAAATCGCCAATGATGTCCGCTGGCTGGCCTCTGGCCCCGCGCTGCGGAATTGGTGAAATCTCAATCCCGGAAAATGAGCCGGGCAGCTCAATCATGCCGGGGAAAGTGAATCCAACACAGTGTGAGGCATTAACCATGCTCTGCTGTCAGGTGATGGGGAACGACGTGGCGATCAACATGGGGGGCGCTTCCGGTAACTTTGAACTGAACGTCTTCCGTCCAATGGTGATCCACAATTTCCTGCAATCGGTGCGCTTGCTGGCAGATGGCATGGAAAGTTTTAACAAACACTGCGCAGTGGGTATTGAACCGAATCGTGAGCGAATCAATCAATTACTCAATGAATCGCTGATGCTGGTGACTGCGCTTAACACCCACATTGGTTATGACAAAGCCGCGGAGATCGCCAAAAAAGCGCATAAAGAAGGGCTGACCTTAAAAGCTGCGGCCTTGCGCTGGGGTATCTTAGCGAAGCCGAGTTTGACAGCTGGGTACGGCCAGAACAGATGGTCGGCAGTATGAAAGCCGGGCGTTAATCCGCAACATACAGGTGCAGCCGGGGAATGATCAAACGAAGCGGCTGCGCCTGTGGTTTATAACGGTGTTGCACATTGTCGGCATCGTAATTTAACAACTCCCCAACATCCGGCACGCCCGCGCCATTATCCCGATTAATCAGCGCAATAAGCGGTGTAGGGCAAGCGTGTTGTACTTGTTTTTGATCTCCTTTGTACCAGACGCGGGCAATCGGCTGCACCTTCACCGGACGTTTGATTTTTAACTTCGCGTTCTGTGGCAGGGCAGCGATATCCTGATACTCTCGCTCCAGTTTTCTTTGCCACTCCTCGCGCGTCCACGGTGCGACACTGCGTGGTGATTTCAGGCTTTTTTCCAGCTGTGCCAGGACTTCATCACGATGCAAATTTTTTAATGATATGTTTATTAGCCCAGCCAAAACGTAAAGTGGCGGGGTCGTGCAGAACGGTGAGCGTGCGGTAAGCATTAAGGGTGATCAGCCCCGGCAAATGACGATGCACCCCATTCAAAACGTGCCGCGGTGGGGAGTTCTGATTCAACCGTGACGATATGCTCGAACGTGGTCTTGAGTTTATTGATGTGCTGAATATGACTGACCAACGCTGCTTGCGAAAGGTTATCGACCTGGTAACACAACACGCCAGGCAGACGGACAGCGGCCTTGCTGCTGCGATTTTCGGACTGTTGTTGAATAAATAAATGGCGGAAATGACGCAACGCCAGCGACTGCGCGTCGTTGCCGAGATGTTGTTTTACCTCAATACGATTAAGCGGATTATGCTCATCCTCTTTTTTTACCTCCGGCAAAGAGAACACGCGGGCAACCAATAGCTTGTGTTGCTCAAGATGAGCGGCAAATGCAGCCAGCTCTTGTTCCATCTGGCGAAAAGTAGTGTTGAGTCGGTCTACGAGATCGTAACGCGCCATAATATTAACCACTTTAGTTACAACATCCTTAATTTATAGCACAGTGGTGGTGACTTGACCACCGTGCGCGTAGTGTCAAGCAGAGGGTAAATTGCGGGATGTTATGCCATAACGGCCAGCTAAACGAGAAGCGGGCACCACCCAGTTCGCTGGTGCCACAATTAACCGTACCGCCCATTGCCAGTGCTATAGAGTGGACAATTGCCAGTCCCAGCCCGCAGCCGCCGGTTGAGCGACCCCGGCTGGGATCGAGGCGAACAAAAGGTTCAAAGATATGTTCGCGGTTTTCTGGGCAATCCCTGAGCCATCATCCTCAACAATTAATGTCGCTTTATTCCCCGACAGTAGCAGGCTGGTTTCAACCGTTGAATGGCAGTAGCGCAGGGCGTTATTGAGCAAATTATCCAGCACGCGCTCCATTAAGCGCATATCCAACGCCGCATAATGGCCTTGCATGAGCGTTTTTATCCGTACCGTTTTATCGGGGCGTTACTGCCTGAATATCTGCCAGATGCGTTGACAGCCACAACGGCAGGTCTGGTTCGCTAAGATGAAGCTCGTTTTGTGGGCGATCGAGTCGGGCATAAGTCAGCAGCTCTTCAATTAAAGCTTCAAGTTGACTGATATCACGATTCAACGCCTGGGATTCGGCGGCGCTCAGGTTATCGCTCATCTCCAGTCGATAACGCAGGCGCACTAACGGTGTTCGCAGTTCGTGAGCGATACCGTCAATAAGCTGTTTTTTGCTGGCAATTAAGGCGTTGATATTGTCCGCCATCTGGTTAAATGCGACGCCAAGTCGTTCAAAGCTCGAACCCTCATCAAAGTGGATACGTTCATTGAGATGCCCATCGCCAAATCGTTGCGCCGCTGCTTCCAGTTTTAACATATCCTGCCAGTGCGGACGCATCCAGATAAACACCGGAAAGGCGAGGGAAATAGCAATAAAAGCGATCAGGGCGATATCCAGCAATCGCATTTGATGGAGGTAATAAAGATAAGGAACAGGACCAACTGCCAGCACGTAGTGGCTGCGCGGGATACGCTGCAAAAACGTGTACTGATCGTCCAGGGCGACAATTTCGCCGCCACGCAGTCGGTGCATGGAAATATCATCAAGATGGTATTTACTCAGTGGCTCGACACGCAGATCGAAAGAGAGATTTAAATCCATCTCTTTCAGCGTCTTACCCCAGTCGTGTGGGGGGATCTCACGCAATTCGCTGCGCATCAGATACAGCGAACTGTTCATCAAATCATCCAGCGACTGTTTGCCCGCGCGTTCGGCGGTAAATTTGTACACCAGCCCAACCAGCAGAGACATCACAAGGAAGCAGACAAACAATAACAGGTAAAACTGGATAAACAATTTTTTCATCGCTTATTCCCATGCATGAGGCGCAAAAAGATAGCCCTTTGTTACGCACGGTTTTAATGCGATAAGGTTCTGCGGCGTTATCGAGTAGTTTTTTTCTTAACCGCGAAATAGCCACGTCCACGCTACGATCCAGTCCGTCATAACTGACGCCGCGTAAATTTTTCAGCAATGCATCGCGGTCCATGATTTGCCCGGCATGGGTAGCTAATTCCCACAATAATTCGAAATCAGCTGTCGAGAGCGAGATTTCAGTGTTAGCCAGGGTGACTACGCGGTTGATGGGATCGATGGTCAACGTGCCGAAATGCAGGGCTTTGTAGGGAGTCAGAGACGTTTCCTGAAGACCTTTGGTCAGTGTGGCTTGCTCATTCTGACGCAAATGCAAACGTAAACGCGCTAGCAAAACAGCAGGGGGCGTCGTTTTGAGAATATAGTCGCAGGCACCCATTTCCAGTGCCAGGATGTGGTTCATATCGCTATCGAGAGAGGTTAGAAGAACAATCGGTCCAGACCACTTTGCGCGTAAATCACGACAAATGGTCATGCCGTCCTTGCCTGGTAGCATGATGTCGAGTAACACCAAATCCGGATTTTCTCGCAAAATGGTTTCTTCGGCCTGGTCGCCGCGCGGCTCTACGGTAACCTGCATATCATGTTTTGCCAGGTACGCGGCAATCAGTGAACCGACTTCCCGCATCATCTTCCACAAATACGATAGTGTTCATAACATTCACGGTAGATATAAAAACGTCACAATACACCGCGCTGTTTTTACTTACTATCAATCGTTTCTAAACAAGTTTTCATCAGGTATTCTACTGATGACTTGTTATGGAAGTGTTAAGGTAAAAAGATGGGGCTGGTAATCAAAGCCGCGCTCGGTGCGCTGGTAGTGCTGTTGATTGGTGTTTTAGCAAAAACGAAAAATTATTATATCGCCGGGCTGATTCCACTTTTCCCGACCTTTGCGCTTATCGCGCATTATATTGTTGCCAGCGAACGCGGCATTGAAGCCTTACGCGCAACCATCATTTTTAGTATGTGGTCGATTATTCCCTAT'..b'GACAATATTCACCCGAATACCTTTCTTCGCGACCTGTTTTGCCAAGCCACGGCTGTAGTTCAGAATCGCCGCCTTCGTAGCCGCATAGTCCCAGTAAATGCGGACTTGGCTGGTATGCCTGGATTGACGAAGTGGTGATGATACTTGCACCTTTCGGTAGCAGGGGGATCGCTTCCTGGGTTAGCCAGAACAGCGCGAAAACGTTAATGGCAAAGGTCTTTTGAAACTGTTCGCTGGTGAGGTCTGCAATATCCGGAATGGCAACCTGTTTCCCGGCGACCAGCGCCATAATATCCAGCCCGCCTAACGCCTTGTGCGCTTCGTGAACCAGCGAACGGGCAAATTTCTCATCGCTTAAATCGCCTGGCAGCAGAACGGCTTTGCGTCCGCATTCTTCAATGATCTTTTTCACATCCTGAGCGTCTTCTTCTTCCACGGGAAGATAACTGATCGCCACGTCAGCCCCTTCACGCGCGTAAGCGATGGCGGCAGCGCGACCTATTCCGGAATCGCCCCCTGTCACCAGTGCTTTACGATCTTTCAGGCGACCGCTACCAACATAGGTTTTCTCGCCGCAATCCGGTACCGGTGTCATCTTCGCCTGGATGCCTGGCGTCGGTTGTTTCTGTTTGGGATATTCACCAGTGTAATACTGCGTGGTCGGGTCTTTTAAATGAGACATCGTTTTTCTCCCTTCAGGTTCAACGTCCTTTAAGGGTAGACGTTCTCGATGCGTTGATAAGGGAACCAGGAAGATCCCTAAACCTCAGAATTATGCGACAAAGGTTTAACGTATATGTTGATTTGCTGTTGCGTGCTGTTTACTCAATTGCGATATACTGTTGCCCGTTTTAACTACACGACAGGAATGTATGGAACGTTTTCTTGAAAATGCAATGTATGCTTCTCGCTGGCTGCTTGCCCCCGTGTACTTTGGCCTTTCGCTGGCGTTAGTTGCCCTGGCGCTGAAGTTCTTCCAGGAGATTATTCACGTACTGCCGAATATCTTCTCGATGGCGGAATCAGATTTGATCCTCGTGTTGCTGTCGCTGGTGGATATGACGCTGGTTGGCGGTTTGCTGGTGATGGTGATGTTTTCCGGTTATGAGAATTTCGTCTCACAGCTGGATATCTCCGAGAACAAAGAGAAGCTGAACTGGCTGGGGAAAATGGACGCAACGTCGCTGAAAAACAAAGTAGCAGCGTCGATTGTGGCAATTTCTTCCATTCACTTACTGCGCGTCTTTATGGATGCGAAAAATGTCCCGGATAACAAACTGATGTGGTACGTCATTATCCATCTGACGTTTGTGCTTTCTGCATTTGTGATGGGCTATCTTGACCGACTGACTCGTCATAATCACTGATCTGATTCGGGCGCGGTTCGCGCGCCCGTTATTAACAGGTCATTTATCGGAAGACGCCTGCCACAGATTCAGCTCGCCATCGGCGATATGCTGATCAATCTGCGCCAGCTCCTTGGTGCTAAATGTCAGATTATTCAGCGCCTGCACGTTCTCCTCTAGTTGCTCCGCGCGGCTGGCACCAATCAATACCGACGTCACGCGATCATCTTTCAGCAACCAGCTTAACGCCATTTGCGCCATTGATTGTCCACGCTGCTGTGCCATTTCATTCAATAAGCGCAGGCTGTTGAGGTTGGCTTCGGTAAGCATTTTCGGTGTCAGACCACGAACTTTATTCCCTTCACGATGCATCCGTGAATCTTGCGGAATGCCGTTGAGATATTTTCCGGTCAGCAATCCCTGAGCCAGAGGAGTAAAGGCAATACAGCCCACGCCGTTATTTTGCAGGGTATCCAGCAGGCCGCTTTTATCCACCCAGCGGTTCAGTAAATTGTACGAAGGTTGATGAATTAACAGCGGAATTTTCCACTCGCGCAGCAACTCGACCATTTTTTGCGTCCGCTCTGGCGAGTAAGAGGAGATCCCGACATACAGCGCCTTACCGCTTTGTACCGCATGAGCCAGCGCAGAGGCGGTTTCTTCCATCGGCGTATTTTCATCGACGCGATGAGAGTAAAAGATATCGACATACTCAAGCCCCATACGCTTCAGGCTTTGGTCGAGGCTGGCGAGCAGGTATTTACGTGAACCGCCAGAGCCCGTAAGGGCCGGGCCACATATCGTAGCCAGCCTTGGTAGAGATAATCAGTTCATCGCGATAAGCGGCAAAATCCTCCCGCAGCAGGCGACCAAAGTTCTCTTCTGCGCTTCCTGGAGGCGGCCCGTAATTGTTGGCTAAATCAAAGTGCGTAATGCCCAAATCAAACGCTTTACGCAGGATCGCACGCTGTGATTCCAGCGCGTTAACGTGACCGAAATTGTGCCATAAACCGAGCGATAACGCGGGCAGGCGTAAACCACTTTTTCCGCAATAGCGGTATTGCATCTGCCCGTAACGTTCGGGATTCGCTAACCAGACCATGACCTCTCCTTTCCACCGTTCAATTTCGAAACAATGTTTCTAGTTTAGCGATTCGCCAGCGCGTATCCCGTAGTCTGGCTCACAGAGTGACGAAAAACTGGGCAAAAATACGTGCTTATGCTTTGCTTAAAAAAACACCAACTGAGGAGTGCAACGATGCCCGCGTTTAACCGCCAAAGATTTCCCACAAGAGTTGCTGGATTACTATGACTATTACGCTCACGGGAAAATCTCGAAACGTGAGTTCCTCAACCTTGCGGCGAAGTGCGGTAGGCGGGATGACGGCATTAGCGTTGTTTGATTTGCTCAAGCCAAATTATGCGCTGGCGACTCAGGTAGAGTTTACCGACCCGGAAATTGTTGCTGAGTACATCACGTATCCTTCGCCAAATGGTCACGGCGAGGTGCGGGGTTATCTGGTGAAGCCCGCAAAGATGAGCGGCAAAACGCCAGCCGTAGTGGTGGTGCATGAGAATCGTGGACTGAATCCGTATATCGAAGATGTGGCACGGCGAGTGGCGAAGGCGGGGTATATCGCCCTGGCACCTGACGGCTTAAGTTCCGTTGGAGGTTATCCGGGAAATGATGATAAAGGTCGTGAGCTGCAACAGCAGGTTGATCCAACAAACTGATGAATGATTTCTTTGCCGCAATTGAGTTTATGCAACGCTATCCGCAAGCGACAGGCAAAGTGGGTATTACCGGATTTTGCTATGGCGGTGGCGTATCGAACGCGGCGGCTGTCGCGTATCCGGAACTGGCCTGCGCGGTGCCGTTTTATGGTCGTCAGGCACCCCACTGCCGATGTGGCGAAGATTGAAGCGCCTTTACTACTCCACTTCGCGGAACTGGACACCCGAATCAACGAGGGCTGGCCTGCTTACGAGGCGGCGTTGAAAGCCAATAATAAGGTTTATGAGGCGTATATCTATCCGGGGGTTAATCACGGATTCCATAATGATTCCACGCCCCGTTATGACAAATCTGCCGCCGATCTTGCCTGGCAAAGGACACTGAAATGGTTCGATAAATATCTCTCCTGATAGGTTTATCTCTTACGGGATTACGTCTTAAACAAGCATGAAAAAATAGCGTGCGCAAAAGTCGTTCTTTGCCTAAAATATCGCTATATATGACAATATATAGCGAATGAGGTGAACGATGAATAACCATTTTGGTAAAGGCTTAATGGCGGGATTAAAAGCAACGCATGCCGACAGTGCGGTTAATGTGACAAAATTCTGTGCCGATTATAAACGCGGTTTTGTATTAGGCTACTCACACCGGATGTACGAAAAGACCGGAGATCGCCAGCTTAGCGCCTGGGAAGCGGGTATTCTGACGCGCCGCTATGGACTGG\tLN:i:41858\tdp:f:1\tts:B:I,1\n+A\ts1.ctg000002l\t0\t+\tm64015_200911_223407/148179444/ccs\t0\t22379\tid:i:31\tHG:A:a\n+A\ts1.ctg000002l\t18954\t+\tm64015_200911_223407/145754697/ccs\t0\t22904\tid:i:193\tHG:A:a\n'
b
diff -r 000000000000 -r 6b86c86eab26 test-data/zymoD6331std-ecoli-ten-percent.42.1.fq.gz
b
Binary file test-data/zymoD6331std-ecoli-ten-percent.42.1.fq.gz has changed