Repository 'sanntis_marine'
hg clone https://toolshed.g2.bx.psu.edu/repos/ecology/sanntis_marine

Changeset 0:12870a79d56b (2024-07-26)
Next changeset 1:9d689f8c9ce4 (2024-08-08)
Commit message:
planemo upload for repository https://github.com/galaxyecology/tools-ecology/tree/master/tools/marine_omics commit 3b5d66e71ee273061f579c8715fc085ea9d0b99e
added:
sanntis.xml
test-data/BGC0001472.fna.prodigal.faa.gb
test-data/BGC0001472.fna.prodigal.faa.ip.tsv
test-data/Sanntis_output_data.gff3
b
diff -r 000000000000 -r 12870a79d56b sanntis.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/sanntis.xml Fri Jul 26 14:31:32 2024 +0000
[
@@ -0,0 +1,53 @@
+<tool id="sanntis_marine" name="Sanntis biosynthetic gene clusters" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="20.01" license="MIT">
+    <description>in genomic and metagenomic data</description>
+    <macros><!-- @TOOL_VERSION@ is shared by the tool version string and the package requirement below -->
+        <token name="@TOOL_VERSION@">0.9.3.5</token>
+        <token name="@VERSION_SUFFIX@">0</token>
+    </macros>
+    <edam_topics>
+        <edam_topic>topic_3387</edam_topic>
+    </edam_topics>
+    <requirements>
+        <requirement type="package" version="@TOOL_VERSION@">sanntis</requirement>
+    </requirements>
+    <command detect_errors="exit_code"><![CDATA[
+        sanntis --ip-file '$input_interpro' --outfile 'output_sanntis.gff' '$input_genbank'
+    ]]></command>
+    <inputs>
+        <param name="input_interpro" type="data" format="tabular" label="Input the TSV file from InterProScan" help="Before using this tool you need to retrieve the right data by using the InterProScan tool"/>
+        <param name="input_genbank" type="data" format="genbank" label="Input a Genbank .gb file" help="It needs to have the right structure and fit the protein fasta file used in InterProScan"/>
+    </inputs>
+    <outputs><!-- the command writes a fixed file name; from_work_dir picks that file up as the dataset -->
+        <data name="output_sanntis" from_work_dir="output_sanntis.gff" format="gff3" label="Sanntis output data"/>
+    </outputs>
+    <tests><!-- regression test: bundled BGC0001472 inputs compared against the stored GFF3 -->
+        <test expect_num_outputs="1">
+            <param name="input_interpro" value="BGC0001472.fna.prodigal.faa.ip.tsv"/>
+            <param name="input_genbank" value="BGC0001472.fna.prodigal.faa.gb"/>
+            <output name="output_sanntis" value="Sanntis_output_data.gff3"/>
+        </test>
+    </tests>
+    <help><![CDATA[
+.. class:: infomark
+
+**What it does**
+
+SMBGC Annotation using Neural Networks Trained on Interpro Signatures (SanntiS).
+A tool for identifying biosynthetic gene clusters (BGCs) in genomic & metagenomic data.
+
+.....
+
+**Input**
+
+- A tsv file coming from InterProScan tool from which you can retrieve the right data.
+- The right Genbank file with the right structure that fits the protein fasta file used to run InterProScan tool
+
+**Output**
+
+- A Gff3 file
+
+    ]]></help>
+    <citations>
+        <citation type="doi">10.1101/2023.05.23.540769</citation>
+    </citations>
+</tool>
b
diff -r 000000000000 -r 12870a79d56b test-data/BGC0001472.fna.prodigal.faa.gb
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/BGC0001472.fna.prodigal.faa.gb Fri Jul 26 14:31:32 2024 +0000
b
b'@@ -0,0 +1,155 @@\n+LOCUS       BGC0001472                32 bp    DNA              UNK 01-JAN-1980\n+DEFINITION  BGC0001472.\n+ACCESSION   BGC0001472\n+VERSION     BGC0001472\n+KEYWORDS    .\n+SOURCE      .\n+  ORGANISM  .\n+            .\n+FEATURES             Location/Qualifiers\n+     CDS             312..683\n+                     /translation="MPTIQQLVRKGRQDKVEKNKTPALEGSPQRRGVCTRVFTTTPKKP\n+                     NSALRKVARVRLTSGIEVTAYIPGEGHNLQEHSIVLVRGGRVKDLPGVRYKIIRGSLDT\n+                     QGVKNRKQARSRYGAKKEK"\n+                     /protein_id="BGC0001472_1"\n+     CDS             686..1156\n+                     /translation="MPRKGPAPKRPVIIDPVYSSPLVTSLINKILLDGKRSTAERIVYG\n+                     AMEGLREKTGADPVITLKRALENVKPSLEVKSRRVGGATYQVPIEVKPGRAATLALRWV\n+                     VGYSRARREKTMTERLMNELLDASNGLGAAVKKREDTHKMAESNKAFAHYRW"\n+                     /protein_id="BGC0001472_2"\n+     CDS             1195..3324\n+                     /translation="MATTSLDLAKVRNIGIMAHIDAGKTTTTERILFYTGVSYKIGEVH\n+                     DGAATMDWMEQEQERGITITSAATTCHWPLNDVDHTINIIDTPGHVDFTVEVERSLRVL\n+                     DGAVTVFDGVAGVEPQSETVWRQADRYGVPRICFVNKLDRTGADFLRCVDMIVQRLGAV\n+                     PIVMQLPIGAEADFRGVVDLVSMKAFVYPEEAVKGEMYDTVEIPDNLKEAAEEWRGKLL\n+                     EAVSENDDQMMELYLEGEEPTEEQLHEAIRRITLASKGSADSVTVTPVFCGTAFKNKGV\n+                     QPLLDAVVRYLPSPLDVEAIEGHDVKDPEKVVQRKPSDDEPFSGLAFKIASDPHLGKLT\n+                     FVRIYSGRLEAGTAVLNSVKGKKERIGKIYRMHANKREEIPSVGAGDIVAVMGLKQTTT\n+                     GETLCDDKNPVILESMDFPAPVIQVAIEPKSKGDQEKLGVAIQRLSEEDPSFQVHSDEE\n+                     TGQTIIGGMGELHLEVLVDRMKREFRVEANVGKPQVAYRETIRKAVERIDYTHKKQTGG\n+                     TGQFAKVQIAIEPIEGGDASYEFVNKVTGGRIPREYIPSVDAGAQEAMQFGILAGYEMV\n+                     GVRVTLLDGGYHEVDSSELAFKIAGSQAFKEGARKASPVLLEPMMAVEVTTPEDYMGEV\n+                     VGDINSRRGQIQAMEERHGARVVKGLVPLSEMFGYVGDLRSKTSGRASYSMQFDSYAEV\n+                     PRNVAEEIIAKAKGE"\n+                     
/protein_id="BGC0001472_3"\n+     CDS             3472..4665\n+                     /translation="MAKAKFERTKPHVNIGTIGHIDHGKTTLTAAITKVLHDAYPDLNE\n+                     ASAFDQIDKAPEERQRGITISIAHVEYQTESRHYAHVDCPGHADYIKNMITGAAQMDGA\n+                     ILVVAATDGPMPQTKEHVLLARQVGVPYIVVALNKADMVDDEEILELVELEVRELLSEY\n+                     EFPGDDLPVVKVSALKALEGDAEWGQTVLDLMKAVDESIPQPERDVEKPFLMPIEDVFT\n+                     ITGRGTVVTGRIERGVLKVNETVDIVGIKTEKTTTTVTGIEMFRKLLDEGQAGENVGLL\n+                     LRGIKREDVERGQVIIKPGSVTPHTEFQAQAYILSKDEGGRHTPFFNNYRPQFYFRTTD\n+                     VTGVVTLPEGTEMVMPGDNTLMDVALIQPVAMEEGLKFAIREGGRTVGAGQVTKITK"\n+                     /protein_id="BGC0001472_4"\n+     CDS             4869..5570\n+                     /translation="MRNDVTSMTAVLEGFTSRTPTSDGLAAERRPVPFADSVPVEPQPS\n+                     AEDLRPVHDLRGTLERRRSSLHYAPLPVRTDVILSLLRDVLRRDRDDWGLDASAGALEG\n+                     FVFAFRSEGAEPGLYRVTAEETCYLAGLDEIGPAENLGVQREFSTGAGIVALYASLDRA\n+                     DTWAGSHGYRISALRASMATYDLNLRCQALGLVGTLFGGFVPSSVHHLVHSDGATRHSL\n+                     LATTYARPPES"\n+                     /protein_id="BGC0001472_5"\n+     CDS             5567..7195\n+                     /translation="MVAEMKAEQIGRAARTDMQLTVPARPVLRRGVRLRRAGESVVLDG\n+                     ADRAQVFSGAFAREGLVPLTEACDGTRDHTELALKTGFDEATVYKCLALLSTAGAVEEA\n+                     MSGEEPDVTPEWAVFLSRLGNSTGSNPSWADAAARLVSRSVRLEGDAALVAGARRSLRE\n+                     VCPVVTEPAGPPGPGDELTVFFETPASAPLLAATEERCRQDGRPLLRVRADARTITIGP\n+                     YADLSITPCLDCGRHGEADLSGEPPEYLHDLVVGLASHHVTALLARATISHLPGDFTVI\n+                     DTATLSTVYRPVAVRPGCPRCSYARGPVAPQAPAGAVYEASVAMPPRAFLAPKDHQAHY\n+                     YASNLRLQSQFKDWPSRPHTPLPALDISVLAGSERHDPSHGDTPLTLSSLGLLLKVAFG\n+                     VKEDETTPERVKRWTAASGNIGSTTAYAVVRDDRIMPPGVYAYAQGSHTLVTVSGEVPP\n+                     GDSPCDIIITGDLKKVMTKYGTFGFRLVFLDAGCNLASLRELAQHLGLGFTPRSDWDDD\n+                     ALARLLGTSPADEPVAAFASLGGTA"\n+                     
/protein_id="BGC0001472_6"\n+     CDS             7210..7821\n+         '..b'GLRDLV\n+                     AGDEASALKPSKARLRESSLVNFAYRASLKPSPFGRFTEIGAFPPDDPRPADPGGRHGG\n+                     TQESVTTLNRLLVNWGPPGLPLVPGGMEPGHLVLNSTLRAGTEYVEYVGVAPGSREDGR\n+                     MATERVLRVRREGLFDALLAAMPEGSAPAATVLRDLTAVTGKAETSRKVVQGLIRAGIL\n+                     FFRPEIDDHDPDYSMKLDRVLAAGGTPETAALRGHFSELRRLETDFSEAAADERQKLLD\n+                     SAYAAIGGIAELCKVSPPPEEVLKSPVFEDTPASTAPQAWNLPTVEGSIPALTGLWRLA\n+                     SMMDNGQVKRLGLYSFATRVLGDRSTMPFLEFFQAFSSLTDQEQVDVFMGRDVEEAERY\n+                     TRQRAEALRTIRQRLVPGDGTVHLDPSVIEKACEGVEDLLDTESVTFRAQFAQGVLPDR\n+                     DRTLVVNGLLTGYGVYFSRFGSFVEGTDEWSLPAAQREHLARRFPGQVDLNSVLGFNFN\n+                     LHPSVTRRVVNYPGAVSLGAERTVYGLARLEVRADQATRSLRLWDPEAQETLDLVPMNF\n+                     MTPIGVPLLYRLLEALSPSNRYLWKPLDDIRDAGGPTVYGETAPRLVVGDVVADRRSWN\n+                     VAAAEIPMLQDLSRDVPEALVAFDAWRLTRGLPRHAFVLCQTPEERDVMAGRSRKVTRQ\n+                     WADYAHLRRASVHKPMYVDFRNPFLVRSFAKSALSRGDVVASIRECLPSVDDYGPDTGW\n+                     TAAEEFFVELCTDN"\n+                     /protein_id="BGC0001472_11"\n+     CDS             13612..14571\n+                     /translation="MNCVPTTSGQTGTREWRTVHIHVPHSLHTPFLCDVVEPLLRSEGL\n+                     QDHFFFLRYWQGGPHLRLRMLCGPGAGSAEAAERVVAGLARAMPEFGAQAREEYALGLT\n+                     LQDELARLEKETSEEGRPIGALDRVAYEPEYRKYGGTEGLQIAETVFRKSSVAVLGLLG\n+                     GQPRAWVDERRAPIGEAARIMAMFLHGAGLDPRAAGLFLREYEDWWRTYAPDDMQRAWP\n+                     KLFGGVSAQMTNLCAAVWRDGATDVFHDISAEAAARARSVCGAEPGGDVRDLRLDGTPY\n+                     PGCLSNYVHTTNNRLGLVPAAEGLVAYLVRRGLEAMDG"\n+                     /protein_id="BGC0001472_12"\n+     CDS             14692..15894\n+                     /translation="MTDRQDSAYPYPRTCPLHPPKEYASLRAEQPITKVTLASGRTAWL\n+                     LTRHEHIRQLLADPHVSSNLAHPGYPLHFDAPPEVMEQMRPVLLAMDPPVHTAQRKMVI\n+                     
PEFTVKRVLQLRPRVEEIVDECISSMLAGEGPADLVEALALPVPSLVICELLGVPRSDR\n+                     AFFQDRTNKLVSVDADPQERNSAHQELHAYFSELVTAQEADPGDDLLGRLVVKNRETGT\n+                     FDHGELVGMANVLLVGGHETTANMISLGVVGLLENPDQLAKLRADPGLAPQAVDELLRY\n+                     FSIADQVTSRVATADLEIGGVLIRAGEGVIGLSASGNHDEAVFPDPDRLDIERGGRHHL\n+                     AFGHGIHQCIGQNLAKLELEVVFNALLARIPGLKLATPVAELPFKDSMGVYGLHKLPVS\n+                     W"\n+                     /protein_id="BGC0001472_13"\n+     CDS             16220..16564\n+                     /translation="MYLSIVMWDLKKSEATVESLREYLRDYAVDAYSALDGMRLKAWFS\n+                     DSARQLWGAVYLWDSPEQMPGLYKVSRVIDLIGYPPTSVGGFTLEATAEGKSVHETLAG\n+                     LGIALEGGTQ"\n+                     /protein_id="BGC0001472_14"\n+     CDS             17019..17729\n+                     /translation="MLIEDIEPLLQSIRAGVEFIEIYGLDTVPVPDSLLAECERRRIPV\n+                     RLLAASVANQVFKTEKKPKVFGIAKVPRPRRLSDLSDMTGDLILLDGVKIVGNIGAIVR\n+                     TSFALGASGIVLVDSDLGSIADRRLIRASRGYVFSLPIVLASRAEALQYFQDNAMRPVV\n+                     FEADGDLGVADLDGMDERLVLMFGSERIGPSGEFSDIAAKSVSIPMNPAAESLNVSVSA\n+                     GIALHARARRNLSR"\n+                     /protein_id="BGC0001472_15"\n+     CDS             17815..19485\n+                     /translation="ALLGLRPFTPWEVSVAELGPDHRAEVNVLAADGRRVELIFLNTAM\n+                     HTGRHRLGLPSLWQDRRLVLRTVVADGSPLRRAGSYTYDGLVGVLTGLMESYRPTVVHT\n+                     LDPDPDIQHSTEAVRRRDSEQPGYSDHADHTAAACFAWAAMIRWVARATADGGRIPGFV\n+                     TVAYRGYYNRHWPKNLPQGVLARKAAHLVPYGGSPDWDCGNPSGCGDYNVGGDRPLTNR\n+                     KGWVRSTHHRYPGTRTVLTAEPDGRLAAYAVLGLRVVRWQETGPGSGAWGPPHDLGGGP\n+                     LAPALGSATTRDGRLLLFGLRFAALGGHGADNEREIVVLEQSAPGRGFRPWRGLGSPSP\n+                     GRDEVRRTGVPVAVAAPDGQIHLFVRDAEKGVSTRVRDGAGRWSAWRDMGGGEVQDGLH\n+                     TAVDEGGRVHVFGAGHHAVHHWTQDTPSAGLTARTQLTAAPVPAHAPAALPAPDGSVSL\n+                     
YYRAAAGSGLTTARAGTAVPGARFDGYXXVDAAPSPRGPVLLGRTAEGLVQLLMGGGLH\n+                     VRTDGPAALDGASLRLGPDGRPSVAGLGPDAAPWMWRPR"\n+                     /protein_id="BGC0001472_16"\n+ORIGIN\n+        1 gatcgatcga tcgatcgatc gatcgatcga tc\n+//\n'
b
diff -r 000000000000 -r 12870a79d56b test-data/BGC0001472.fna.prodigal.faa.ip.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/BGC0001472.fna.prodigal.faa.ip.tsv Fri Jul 26 14:31:32 2024 +0000
b
b'@@ -0,0 +1,81 @@\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tProSitePatterns\tPS00086\tCytochrome P450 cysteine heme-iron ligand signature.\t342\t351\t-\tT\t13-08-2021\tIPR017972\tCytochrome P450, conserved site\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00385\tP450 superfamily signature\t340\t349\t3.1E-7\tT\t13-08-2021\tIPR001128\tCytochrome P450\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00385\tP450 superfamily signature\t238\t255\t3.1E-7\tT\t13-08-2021\tIPR001128\tCytochrome P450\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00385\tP450 superfamily signature\t273\t284\t3.1E-7\tT\t13-08-2021\tIPR001128\tCytochrome P450\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00385\tP450 superfamily signature\t349\t360\t3.1E-7\tT\t13-08-2021\tIPR001128\tCytochrome P450\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPfam\tPF00067\tCytochrome P450\t272\t368\t4.0E-18\tT\t13-08-2021\tIPR001128\tCytochrome P450\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00359\tB-class P450 signature\t273\t284\t8.3E-58\tT\t13-08-2021\tIPR002397\tCytochrome P450, B-class\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00359\tB-class P450 signature\t319\t334\t8.3E-58\tT\t13-08-2021\tIPR002397\tCytochrome P450, B-class\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00359\tB-class P450 signature\t291\t318\t8.3E-58\tT\t13-08-2021\tIPR002397\tCytochrome P450, B-class\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00359\tB-class P450 signature\t340\t349\t8.3E-58\tT\t13-08-2021\tIPR002397\tCytochrome P450, B-class\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00359\tB-class P450 signature\t349\t360\t8.3E-58\tT\t13-08-2021\tIPR002397\tCytochrome P450, B-class\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00359\tB-class P450 
signature\t138\t154\t8.3E-58\tT\t13-08-2021\tIPR002397\tCytochrome P450, B-class\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00359\tB-class P450 signature\t192\t214\t8.3E-58\tT\t13-08-2021\tIPR002397\tCytochrome P450, B-class\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00359\tB-class P450 signature\t155\t170\t8.3E-58\tT\t13-08-2021\tIPR002397\tCytochrome P450, B-class\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tPRINTS\tPR00359\tB-class P450 signature\t91\t102\t8.3E-58\tT\t13-08-2021\tIPR002397\tCytochrome P450, B-class\n+BGC0001472_13\t874c0f534839f521f055a275c391567a\t400\tGene3D\tG3DSA:1.10.630.10\tCytochrome P450\t2\t400\t7.0E-113\tT\t13-08-2021\tIPR036396\tCytochrome P450 superfamily\n+BGC0001472_11\t67b7792659aca4f0747f903233e4f593\t885\tPfam\tPF04738\tLantibiotic dehydratase, N terminus\t141\t791\t2.4E-20\tT\t13-08-2021\tIPR006827\tLantibiotic dehydratase, N-terminal\n+BGC0001472_6\t76d1387ac73417cb91ccfb11c2c5229e\t542\tGene3D\tG3DSA:3.40.50.720\t-\t132\t304\t8.2E-16\tT\t13-08-2021\t-\t-\n+BGC0001472_6\t76d1387ac73417cb91ccfb11c2c5229e\t542\tGene3D\tG3DSA:3.40.109.10\tNADH Oxidase\t348\t542\t3.1E-35\tT\t13-08-2021\tIPR000415\tNitroreductase-like\n+BGC0001472_3\t4b28e769738231bbe9f69d4979528f4d\t709\tGene3D\tG3DSA:3.40.50.300\t-\t3\t304\t1.4E-121\tT\t13-08-2021\tIPR027417\tP-loop containing nucleoside triphosphate hydrolase\n+BGC0001472_3\t4b28e769738231bbe9f69d4979528f4d\t709\tPfam\tPF00009\tElongation factor Tu GTP binding domain\t10\t294\t1.2E-65\tT\t13-08-2021\tIPR000795\tTranslational (tr)-type GTP-binding domain\n+BGC0001472_3\t4b28e769738231bbe9f69d4979528f4d\t709\tTIGRFAM\tTIGR00231\tsmall_GTP: small GTP-binding protein domain\t11\t184\t1.5E-33\tT\t13-08-2021\tIPR005225\tSmall GTP-binding protein domain\n+BGC0001472_3\t4b28e769738231bbe9f69d4979528f4d\t709\tPfam\tPF03144\tElongation factor Tu domain 2\t337\t404\t9.3E-16\tT\t13-08-2021\tIPR004161\tTranslation elongation factor EFTu-like, domain 
2\n+BGC0001472_3\t4b28e769738231bbe9f69d4979528f4d\t709\tPfam\tPF00679\tElongation factor G C-terminus\t615\t701\t2.7E-29\tT\t13-08-2021\tIPR000640\tElongation factor EFG, domain V-like\n+BGC0001472_3\t4b28e769738231bbe9f69d4979528f4d\t709\tPfam\tPF14492\tElongation Factor G, domain III\t417\t491\t2.5E-33\tT\t13-08-2021\tIPR041095\tElongation Factor G, domain II\n+BGC0001472_3\t4b28e76973'..b'rpsG_bact: ribosomal protein uS7\t3\t156\t4.4E-64\tT\t13-08-2021\tIPR005717\tRibosomal protein S7, bacterial/organellar-type\n+BGC0001472_2\tfc82bb58d52c83068b7ca785129b2384\t156\tPfam\tPF00177\tRibosomal protein S7p/S5e\t1\t149\t4.0E-59\tT\t13-08-2021\tIPR023798\tRibosomal protein S7 domain\n+BGC0001472_2\tfc82bb58d52c83068b7ca785129b2384\t156\tGene3D\tG3DSA:1.10.455.10\tRibosomal protein S7 domain\t1\t155\t7.0E-60\tT\t13-08-2021\tIPR036823\tRibosomal protein S7 domain superfamily\n+BGC0001472_2\tfc82bb58d52c83068b7ca785129b2384\t156\tProSitePatterns\tPS00052\tRibosomal protein S7 signature.\t20\t46\t-\tT\t13-08-2021\tIPR020606\tRibosomal protein S7, conserved site\n+BGC0001472_15\t206c74fd5c80ef02123ab090a4b6cfa4\t236\tPfam\tPF04705\tThiostrepton-resistance methylase, N terminus\t1\t82\t5.8E-30\tT\t13-08-2021\tIPR006795\tThiostrepton-resistance methylase, N-terminal\n+BGC0001472_15\t206c74fd5c80ef02123ab090a4b6cfa4\t236\tGene3D\tG3DSA:3.40.1280.10\t-\t75\t235\t1.3E-37\tT\t13-08-2021\tIPR029026\ttRNA (guanine-N1-)-methyltransferase, N-terminal\n+BGC0001472_15\t206c74fd5c80ef02123ab090a4b6cfa4\t236\tGene3D\tG3DSA:3.30.1330.30\t-\t1\t73\t2.3E-26\tT\t13-08-2021\tIPR029064\t50S ribosomal protein L30e-like\n+BGC0001472_15\t206c74fd5c80ef02123ab090a4b6cfa4\t236\tPfam\tPF00588\tSpoU rRNA Methylase family\t88\t227\t1.8E-26\tT\t13-08-2021\tIPR001537\ttRNA/rRNA methyltransferase, SpoU 
type\n+BGC0001472_8\t2149eda482fc77a076bb0eb91c55bd5d\t448\tGene3D\tG3DSA:3.30.40.250\t-\t104\t186\t3.5E-36\tT\t13-08-2021\t-\t-\n+BGC0001472_8\t2149eda482fc77a076bb0eb91c55bd5d\t448\tTIGRFAM\tTIGR03604\tTOMM_cyclo_SagD: thiazole/oxazole-forming peptide maturase, SagD family component\t75\t448\t1.4E-100\tT\t13-08-2021\tIPR027624\tThiazole/oxazole-forming peptide maturase, SagD family component\n+BGC0001472_8\t2149eda482fc77a076bb0eb91c55bd5d\t448\tPfam\tPF02624\tYcaO cyclodehydratase, ATP-ad Mg2+-binding\t75\t406\t8.3E-62\tT\t13-08-2021\tIPR003776\tYcaO-like domain\n+BGC0001472_8\t2149eda482fc77a076bb0eb91c55bd5d\t448\tGene3D\tG3DSA:3.30.1330.230\t-\t82\t405\t3.5E-36\tT\t13-08-2021\t-\t-\n+BGC0001472_8\t2149eda482fc77a076bb0eb91c55bd5d\t448\tGene3D\tG3DSA:3.30.160.660\t-\t223\t357\t3.5E-36\tT\t13-08-2021\t-\t-\n+BGC0001472_1\tf4269c94863705a842e7252b96e5f27d\t123\tTIGRFAM\tTIGR00981\trpsL_bact: ribosomal protein uS12\t1\t123\t5.4E-69\tT\t13-08-2021\tIPR005679\tRibosomal protein S12, bacterial-type\n+BGC0001472_1\tf4269c94863705a842e7252b96e5f27d\t123\tProSitePatterns\tPS00055\tRibosomal protein S12 signature.\t43\t50\t-\tT\t13-08-2021\tIPR006032\tRibosomal protein S12/S23\n+BGC0001472_1\tf4269c94863705a842e7252b96e5f27d\t123\tPfam\tPF00164\tRibosomal protein S12/S23\t12\t123\t8.3E-44\tT\t13-08-2021\tIPR006032\tRibosomal protein S12/S23\n+BGC0001472_1\tf4269c94863705a842e7252b96e5f27d\t123\tPRINTS\tPR01034\tRibosomal protein S12 signature\t27\t42\t8.4E-59\tT\t13-08-2021\tIPR006032\tRibosomal protein S12/S23\n+BGC0001472_1\tf4269c94863705a842e7252b96e5f27d\t123\tPRINTS\tPR01034\tRibosomal protein S12 signature\t42\t57\t8.4E-59\tT\t13-08-2021\tIPR006032\tRibosomal protein S12/S23\n+BGC0001472_1\tf4269c94863705a842e7252b96e5f27d\t123\tPRINTS\tPR01034\tRibosomal protein S12 signature\t58\t77\t8.4E-59\tT\t13-08-2021\tIPR006032\tRibosomal protein S12/S23\n+BGC0001472_1\tf4269c94863705a842e7252b96e5f27d\t123\tPRINTS\tPR01034\tRibosomal protein S12 
signature\t77\t94\t8.4E-59\tT\t13-08-2021\tIPR006032\tRibosomal protein S12/S23\n+BGC0001472_1\tf4269c94863705a842e7252b96e5f27d\t123\tPRINTS\tPR01034\tRibosomal protein S12 signature\t94\t110\t8.4E-59\tT\t13-08-2021\tIPR006032\tRibosomal protein S12/S23\n+BGC0001472_1\tf4269c94863705a842e7252b96e5f27d\t123\tPRINTS\tPR01034\tRibosomal protein S12 signature\t110\t122\t8.4E-59\tT\t13-08-2021\tIPR006032\tRibosomal protein S12/S23\n+BGC0001472_1\tf4269c94863705a842e7252b96e5f27d\t123\tGene3D\tG3DSA:2.40.50.140\t-\t1\t123\t1.6E-66\tT\t13-08-2021\t-\t-\n+BGC0001472_7\t80ec0c524f263f553a78952ff4408537\t203\tGene3D\tG3DSA:3.40.50.720\t-\t16\t185\t5.5E-22\tT\t13-08-2021\t-\t-\n+BGC0001472_14\tb47c649341e9af373f88df5f17e9dc46\t114\tGene3D\tG3DSA:3.30.70.100\t-\t1\t92\t1.6E-30\tT\t13-08-2021\t-\t-\n+BGC0001472_5\t8eb61811b90411be4123c98a64e16860\t233\tGene3D\tG3DSA:3.40.109.10\tNADH Oxidase\t12\t230\t5.1E-18\tT\t13-08-2021\tIPR000415\tNitroreductase-like\n'
b
diff -r 000000000000 -r 12870a79d56b test-data/Sanntis_output_data.gff3
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/Sanntis_output_data.gff3 Fri Jul 26 14:31:32 2024 +0000
b
@@ -0,0 +1,2 @@
+##gff-version 3
+BGC0001472 SanntiSv0.9.3.5 CLUSTER 312 19485 . . . ID=BGC0001472_sanntis_1;nearest_MiBIG=BGC0001472;nearest_MiBIG_class=RiPP;nearest_MiBIG_diceDistance=0.037;score=0.900;partial=11