changeset 5:66617be450bd draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/tooldistillator commit 164bcc563f8495d4bb1ce14b574aef9287904f40
author iuc
date Thu, 10 Apr 2025 15:02:10 +0000
parents ea93df4b3df2
children dfd6fa2637ba
files macro.xml test-data/checkm2/DIAMOND_RESULTS.tsv test-data/checkm2/checkm2.log test-data/checkm2/quality_report.tsv tooldistillator.xml
diffstat 5 files changed, 219 insertions(+), 19 deletions(-) [+]
line wrap: on
line diff
--- a/macro.xml	Thu Oct 17 08:00:15 2024 +0000
+++ b/macro.xml	Thu Apr 10 15:02:10 2025 +0000
@@ -1,7 +1,7 @@
 <?xml version="1.0"?>
 <macros>
-    <token name="@TOOL_VERSION@">0.9.1</token>
-    <token name="@VERSION_SUFFIX@">1</token>
+    <token name="@TOOL_VERSION@">0.9.2</token>
+    <token name="@VERSION_SUFFIX@">0</token>
     <token name="@PROFILE@">21.05</token>
     <xml name="version_command">
         <version_command><![CDATA[tooldistillator --version]]></version_command>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkm2/DIAMOND_RESULTS.tsv	Thu Apr 10 15:02:10 2025 +0000
@@ -0,0 +1,100 @@
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49428_2	UniRef100_A0A0N7IEW1~K00616	91.7	218	18	0	1	218	1	218	3.7e-113	412.5
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49428_3	UniRef100_B5R745~K05776	39.4	358	206	4	14	367	49	399	3.5e-63	247.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_28292_2	UniRef100_E6STV5~K03402	94.3	157	9	0	1	157	1	157	3.4e-76	289.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_28292_4	UniRef100_A0A1A9I3U8~K05970	45.9	427	197	7	12	409	12	433	1.2e-101	375.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_14200_2	UniRef100_E6SQC7~K01200	86.9	665	87	0	1	665	1	665	0.0e+00	1218.0
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_63629_1	UniRef100_E6SR16~K03711	95.1	162	7	1	1	161	1	162	6.6e-83	311.6
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_114_1	UniRef100_A0A139LU84~K01952	94.2	1011	59	0	1	1011	38	1048	0.0e+00	1941.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_21313_3	UniRef100_E6SMX3~K06950	78.4	208	45	0	1	208	1	208	3.4e-92	342.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_21313_4	UniRef100_E6SMX8~K06942	94.6	367	20	0	1	367	1	367	3.7e-198	695.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_21322_2	UniRef100_A0A0P0G6A0~K05349	80.0	862	172	0	1	862	2	863	0.0e+00	1431.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7210_2	UniRef100_A0A0P0GLB2~K14742	92.2	230	18	0	1	230	1	230	8.7e-121	438.0
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7210_4	UniRef100_E6SRP6~K00942	90.9	187	17	0	1	187	1	187	1.5e-91	340.5
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7222_2	UniRef100_A0A127AYQ9~K21573	33.3	1066	648	24	3	1045	1	1026	8.1e-142	510.0
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7222_5	UniRef100_S4XS10~K15921	31.9	467	248	23	20	442	84	524	4.9e-48	197.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_63747_1	UniRef100_A0A1T5DC71~K02343	70.7	362	106	0	4	365	3	364	6.5e-146	522.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_14378_2	UniRef100_Q7UNN1~K01134	43.8	491	265	6	28	512	40	525	6.7e-113	412.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_42512_3	UniRef100_A3U9J4~K08316	38.8	165	97	3	2	164	16	178	5.3e-27	125.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_42512_4	UniRef100_T1YCJ1~K06131	44.5	272	148	3	1	269	33	304	6.9e-61	239.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_14415_3	UniRef100_E6STG4~K02619	68.2	201	58	1	1	201	1	195	1.1e-71	274.6
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_14415_4	UniRef100_X2K1F6~K01665	56.5	248	108	0	5	252	30	277	4.2e-76	289.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_28506_2	UniRef100_E6SNZ6~K12573	92.3	711	55	0	4	714	7	717	0.0e+00	1304.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_28506_3	UniRef100_I9Q1S0~K07005	74.1	158	41	0	1	158	1	158	1.0e-67	261.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_35544_1	UniRef100_E6SPZ0~K00873	94.5	458	25	0	1	458	28	485	2.6e-246	855.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_35544_2	UniRef100_C7M9L1~K00588	44.0	207	115	1	3	209	8	213	8.0e-49	198.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_247_2	UniRef100_A0A089KNB8~K01198&K01209	31.1	492	280	21	27	487	10	473	1.3e-39	169.5
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_247_3	UniRef100_A0A0P0GKF6~K15923	70.2	1071	312	4	12	1080	8	1073	0.0e+00	1597.4
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49649_3	UniRef100_A0A0K1KXX7~K07658	39.6	230	128	3	2	222	3	230	9.9e-37	158.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49649_5	UniRef100_A0A0P0G8E4~K06142	88.1	201	23	1	1	200	1	201	1.5e-89	334.0
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49664_3	UniRef100_A0A0E3PP05~K00763	38.9	265	150	4	1	254	1	264	1.2e-42	178.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_63921_2	UniRef100_E6SQK9~K20866	79.0	205	43	0	1	205	1	205	1.5e-92	344.0
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_63921_3	UniRef100_A0A0P0G8Y8~K01537	89.8	842	86	0	1	842	53	894	0.0e+00	1457.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_63924_3	UniRef100_A0A290SA98~K15726	37.3	381	237	2	1	381	44	422	1.4e-70	271.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49669_2	UniRef100_A0A127AYQ9~K21573	35.7	1080	585	33	13	1040	4	1026	2.7e-161	574.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49669_3	UniRef100_A0A0P0GBJ8~K21572	69.2	539	152	5	1	528	1	536	9.6e-216	754.6
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49669_6	UniRef100_A0A0P0GI09~K01190	84.9	1050	159	0	1	1050	1	1050	0.0e+00	1939.1
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7445_2	UniRef100_B5YB77~K15921	35.2	474	247	19	26	453	48	507	9.0e-61	239.6
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7453_2	UniRef100_E6SR03~K05516	85.8	317	40	2	1	317	1	312	5.0e-151	538.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_35703_1	UniRef100_U5Q4K6~K03183	41.8	153	87	1	9	159	1	153	1.9e-29	134.0
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_35703_2	UniRef100_E6SV36~K00014	92.7	248	18	0	1	248	1	248	3.7e-133	479.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_35703_3	UniRef100_A0A0P0G426~K06889	78.7	315	67	0	1	315	1	315	1.3e-148	530.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_35703_4	UniRef100_A0A0P0GMY7~K06872	81.4	242	45	0	5	246	1	242	2.9e-114	416.4
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_56776_2	UniRef100_A0A175ACE0~K05297	56.0	50	22	0	3	52	2	51	2.0e-12	75.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_56776_3	UniRef100_A0A0P0GR35~K03324	93.6	565	36	0	1	565	1	565	1.1e-294	1016.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_56776_4	UniRef100_B9KAM4~K00876	40.3	370	208	5	21	384	29	391	1.6e-66	258.5
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_427_1	UniRef100_F0YI08~K00134	73.4	79	21	0	7	85	6	84	9.2e-26	120.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_427_2	UniRef100_E6SV71~K01284	81.9	685	124	0	1	685	1	685	0.0e+00	1172.1
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_28766_1	UniRef100_A0A140NMH2~K00262	60.7	84	32	1	1	84	17	99	1.9e-20	103.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_28766_3	UniRef100_E6SRR4~K16089	72.3	750	185	5	3	749	6	735	0.0e+00	1114.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_28848_1	UniRef100_I1YI16~K07689	31.3	208	141	2	6	212	6	212	1.9e-21	107.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7592_1	UniRef100_E6SR99~K07037	87.6	687	84	1	1	687	1	686	0.0e+00	1193.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7592_3	UniRef100_R6LHP4~K01104	86.6	149	20	0	6	154	33	181	1.6e-73	280.4
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7592_4	UniRef100_B3DWK1~K04066	40.8	534	283	10	14	527	110	630	4.6e-109	400.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_21835_1	UniRef100_E6SRJ9~K03702	91.4	685	58	1	1	685	1	684	0.0e+00	1232.6
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_21835_2	UniRef100_E6SRK0~K01912	93.5	432	28	0	1	432	1	432	1.1e-241	840.5
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_21835_4	UniRef100_A0A0P0GAI4~K05807	93.3	267	18	0	1	267	1	267	4.5e-137	492.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_57056_1	UniRef100_E6ST38~K00053	95.7	347	15	0	2	348	1	347	2.0e-190	669.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_57056_2	UniRef100_B0D4X2~K19783	31.1	591	312	19	112	621	127	703	9.9e-50	203.4
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49958_2	UniRef100_E6SQ13~K01243	83.3	234	39	0	1	234	1	234	1.2e-109	401.0
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49958_3	UniRef100_E6SQ14~K07173	93.2	162	11	0	1	162	1	162	2.9e-86	322.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49958_4	UniRef100_R4M9B3~K00666	49.3	294	146	3	5	295	8	301	1.3e-76	291.6
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_810_1	UniRef100_A0A0P0GIW9~K03657	87.2	678	86	1	2	679	3	679	0.0e+00	1186.4
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49992_1	UniRef100_A0A0N7IFG4~K00789	94.5	419	23	0	1	419	12	430	2.8e-226	789.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49992_2	UniRef100_A0A0P0FY07~K06966	83.1	195	33	0	2	196	1	195	7.2e-92	341.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49992_4	UniRef100_E6SNW4~K01719	95.6	250	11	0	1	250	1	250	3.3e-134	482.6
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_49992_5	UniRef100_E6SNW5~K03536	85.2	108	16	0	1	108	1	108	9.9e-43	177.6
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_36157_2	UniRef100_E6SUR0~K00948	96.8	312	10	0	1	312	1	312	7.0e-166	588.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_14711_1	UniRef100_E6SNY0~K09815	72.0	304	80	1	11	309	1	304	3.0e-124	449.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_14711_2	UniRef100_A0A0P0GQ72~K09817	85.0	254	33	1	1	254	1	249	6.9e-119	431.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7946_1	UniRef100_Q5LHW2~K02884	99.1	117	1	0	1	117	1	117	1.5e-57	226.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7946_2	UniRef100_A0A0N7IF60~K00845	94.8	326	17	0	1	326	1	326	8.6e-175	617.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7946_3	UniRef100_A0A0P0FVB4~K02003	95.0	238	12	0	1	238	1	238	4.2e-126	455.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7946_4	UniRef100_E6STT3~K02004	83.3	419	69	1	1	418	1	419	9.6e-203	711.1
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7946_5	UniRef100_E6STT4~K02004	88.9	413	46	0	1	413	1	413	1.7e-212	743.4
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7946_6	UniRef100_E6STT5~K02005	91.3	368	32	0	1	368	1	368	2.2e-179	633.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7946_7	UniRef100_E6STT6~K12340	85.2	433	63	1	3	434	10	442	2.2e-202	709.9
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7946_8	UniRef100_E6STU0~K00243	84.9	278	42	0	1	278	1	278	2.4e-136	490.0
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_7946_9	UniRef100_E6STU7~K00024	94.0	333	20	0	1	333	1	333	7.5e-182	641.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_1015_1	UniRef100_A0A1U7XXK2~K00895	52.9	272	126	1	4	273	31	302	3.4e-74	283.5
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_1015_2	UniRef100_A0A174D557~K18139	75.0	456	114	0	1	456	1	456	2.2e-192	676.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_1015_3	UniRef100_T0GCG4~K18138	39.4	589	339	8	5	579	12	596	7.1e-103	379.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_22153_3	UniRef100_E6STN2~K02069	92.8	263	19	0	1	263	1	263	5.9e-129	465.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_22153_5	UniRef100_E6STN3~K02068	79.2	207	43	0	1	207	1	207	5.5e-90	335.5
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_57444_2	UniRef100_A0A0N7IFV5~K03118	90.9	263	24	0	17	279	1	263	9.6e-133	478.0
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_57444_3	UniRef100_D4VLF0~K03116	95.8	72	3	0	3	74	1	72	1.7e-17	93.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_57444_4	UniRef100_B6YQB3~K01775	50.8	311	141	2	1	299	70	380	2.0e-80	304.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_1116_3	UniRef100_E6SQF3~K01224	73.2	392	103	1	3	394	5	394	3.0e-174	616.3
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_50177_4	UniRef100_A0A1L3GGF5~K11383	36.4	236	148	2	20	255	1	234	1.6e-35	154.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_36310_1	UniRef100_A0A076H3R8~K15633	41.6	341	184	5	1	330	34	370	8.7e-66	255.8
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_36310_3	UniRef100_L0RWC6~K02470	50.9	273	125	5	25	296	8	272	9.9e-69	265.4
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_14955_2	UniRef100_Q7MX03~K01070	63.5	244	89	0	29	272	6	249	2.1e-94	350.5
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_14955_3	UniRef100_A0A0P0G3B8~K03699	87.0	430	56	0	1	430	10	439	1.3e-202	710.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_15011_4	UniRef100_A0A0P0GFV2~K01735	90.1	353	35	0	1	353	1	353	2.4e-186	656.4
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_15043_2	UniRef100_A0A0P0GCU8~K07568	95.5	352	16	0	1	352	1	352	1.5e-193	680.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_15043_3	UniRef100_A0A0P0M190~K00950	74.3	148	38	0	1	148	5	152	3.0e-58	229.6
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_15043_4	UniRef100_A0A076IYN8~K21557	33.1	523	339	5	18	538	18	531	3.4e-75	287.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_1350_6	UniRef100_H6SQ71~K03701	44.9	510	274	4	5	508	17	525	1.4e-110	405.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_15093_1	UniRef100_D4IXW5~K04485	48.2	141	66	3	1	138	1	137	2.8e-30	136.7
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_15093_2	UniRef100_B6VS51~K01673	83.8	179	29	0	1	179	3	181	2.5e-83	313.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_15093_3	UniRef100_E6SSR0~K01424	87.5	345	43	0	1	345	1	345	1.8e-175	620.2
+bin_semibin_SASB_CSM7KOLE.1ΩCSM7KOLE_k117_15116_2	UniRef100_A0A0P0GBM8~K01209	87.9	514	62	0	1	514	1	514	1.7e-278	963.0
\ No newline at end of file
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkm2/checkm2.log	Thu Apr 10 15:02:10 2025 +0000
@@ -0,0 +1,11 @@
+[03/03/2025 11:20:03 AM] INFO: Running CheckM2 version 1.0.2
+[03/03/2025 11:20:03 AM] INFO: Custom database path provided for predict run. Checking database at Database/CheckM2_database/uniref100.KO.1.dmnd...
+[03/03/2025 11:20:10 AM] INFO: Running quality prediction workflow with 5 threads.
+[03/03/2025 11:20:12 AM] INFO: Calling genes in 50 bins with 5 threads:
+[03/03/2025 11:20:59 AM] WARNING: Skipping protein file batches/batch_0/checkm2/protein_files/bin_concoct_SASB_HSMA33OT.11.faa as it was empty.
+[03/03/2025 11:20:59 AM] INFO: Calculating metadata for 49 bins with 5 threads:
+[03/03/2025 11:20:59 AM] INFO: Annotating input genomes with DIAMOND using 5 threads
+[03/03/2025 11:23:40 AM] INFO: Processing DIAMOND output
+[03/03/2025 11:23:40 AM] INFO: Predicting completeness and contamination using ML models.
+[03/03/2025 11:23:44 AM] INFO: Parsing all results and constructing final output table.
+[03/03/2025 11:23:44 AM] INFO: CheckM2 finished successfully.
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkm2/quality_report.tsv	Thu Apr 10 15:02:10 2025 +0000
@@ -0,0 +1,50 @@
+Name	Completeness	Contamination	Completeness_Model_Used	Translation_Table_Used	Coding_Density	Contig_N50	Average_Gene_Length	Genome_Size	GC_Content	Total_Coding_Sequences	Total_Contigs	Max_Contig_Length	Additional_Notes
+bin_concoct_SASB_CSM7KOLE.0	22.51	0.0	Neural Network (Specific Model)	11	0.887	2144	267.22576530612247	708085	0.53	784	324	5294	None
+bin_concoct_SASB_CSM7KOLE.1	15.91	5.09	Neural Network (Specific Model)	11	0.845	4814	222.07713884992987	1119464	0.47	1426	273	50470	None
+bin_concoct_SASB_CSM7KOLE.20	6.38	0.0	Gradient Boost (General Model)	11	0.974	3001	300.0	16618	0.61	18	6	4049	None
+bin_concoct_SASB_CSM7KOLE.22	100.0	2.05	Neural Network (Specific Model)	11	0.87	22717	300.98043641835966	2755022	0.54	2658	187	146684	None
+bin_concoct_SASB_CSM7KOLE.24	6.38	0.0	Gradient Boost (General Model)	11	0.926	5194	268.5	5194	0.45	6	1	5194	None
+bin_concoct_SASB_CSM7KOLE.3	6.38	0.0	Gradient Boost (General Model)	11	0.818	4650	264.75	7724	0.36	8	3	4650	None
+bin_concoct_SASB_CSM7KOLE.30	6.38	0.0	Gradient Boost (General Model)	11	0.796	1887	501.0	1887	0.5	1	1	1887	None
+bin_concoct_SASB_HSMA33MG.1	33.58	0.68	Neural Network (Specific Model)	11	0.856	2959	250.53061224489795	987394	0.59	1127	345	13858	None
+bin_concoct_SASB_HSMA33MG.10	6.38	0.0	Gradient Boost (General Model)	11	0.998	2318	386.0	2318	0.36	2	1	2318	None
+bin_concoct_SASB_HSMA33MG.12	9.66	0.29	Neural Network (Specific Model)	11	0.887	1956	238.57806691449815	432765	0.41	538	204	12095	None
+bin_concoct_SASB_HSMA33MG.13	6.65	0.0	Gradient Boost (General Model)	11	0.936	1726	269.5	1726	0.45	2	1	1726	None
+bin_concoct_SASB_HSMA33MG.8	6.38	0.0	Gradient Boost (General Model)	11	0.794	1759	233.0	1759	0.53	2	1	1759	None
+bin_concoct_SASB_HSMA33MG.9	53.69	21.09	Neural Network (Specific Model)	11	0.901	2957	269.85174585002864	3130308	0.44	3494	1086	18806	None
+bin_concoct_SASB_HSMA33OT.0	4.43	0.0	Neural Network (Specific Model)	11	0.851	1985	214.93157894736842	143344	0.38	190	71	3816	None
+bin_concoct_SASB_HSMA33OT.10	6.38	0.0	Gradient Boost (General Model)	11	0.966	11244	210.76666666666668	19477	0.36	30	4	11244	None
+bin_concoct_SASB_HSMA33OT.14	6.38	0.0	Gradient Boost (General Model)	11	0.509	1707	290.0	1707	0.44	1	1	1707	None
+bin_concoct_SASB_HSMA33OT.16	9.03	0.06	Neural Network (Specific Model)	11	0.881	1824	231.57877813504822	244747	0.42	311	130	3723	None
+bin_concoct_SASB_HSMA33OT.18	6.38	0.0	Gradient Boost (General Model)	11	0.958	1602	256.0	1602	0.36	2	1	1602	None
+bin_concoct_SASB_HSMA33OT.2	6.38	0.0	Gradient Boost (General Model)	11	0.941	1704	345.0	3299	0.35	3	2	1704	None
+bin_concoct_SASB_HSMA33OT.3	5.64	0.0	Gradient Boost (General Model)	11	0.839	2532	203.5	4366	0.44	6	2	2532	None
+bin_concoct_SASB_HSMA33OT.4	6.38	0.0	Gradient Boost (General Model)	11	0.634	2866	202.0	2866	0.42	3	1	2866	None
+bin_concoct_SASB_HSMA33OT.6	6.42	0.0	Gradient Boost (General Model)	11	0.915	1816	233.42857142857142	10707	0.61	14	6	2097	None
+bin_concoct_SASB_MSM5LLDE.16	6.38	0.0	Gradient Boost (General Model)	11	0.998	1592	530.0	1592	0.6	1	1	1592	None
+bin_concoct_SASB_MSM5LLDE.19	6.38	0.0	Gradient Boost (General Model)	11	0.819	1941	68.75	1941	0.39	8	1	1941	None
+bin_concoct_SASB_MSM5LLDE.2	6.38	0.0	Gradient Boost (General Model)	11	0.876	1618	236.5	1618	0.54	2	1	1618	None
+bin_concoct_SASB_MSM5LLDE.20	49.54	0.72	Neural Network (Specific Model)	11	0.901	2559	261.2743158588856	2632930	0.42	3033	1029	33333	None
+bin_concoct_SASB_MSM5LLDE.21	99.55	8.64	Neural Network (Specific Model)	11	0.9	81127	346.90618336886996	4332951	0.46	3752	143	235469	None
+bin_concoct_SASB_MSM5LLDE.27	9.51	0.07	Neural Network (Specific Model)	11	0.877	1958	217.07469879518072	307709	0.57	415	150	5816	None
+bin_concoct_SASB_MSM5LLDE.28	6.38	0.0	Gradient Boost (General Model)	11	0.952	1638	260.0	1638	0.59	2	1	1638	None
+bin_concoct_SASB_MSM5LLDE.6	5.91	0.0	Gradient Boost (General Model)	11	0.91	1987	228.10714285714286	20991	0.61	28	11	2365	None
+bin_concoct_SASB_MSM5LLDE.7	5.03	0.0	Gradient Boost (General Model)	11	0.999	1689	282.0	1689	0.65	2	1	1689	None
+bin_metabat_SASB_CSM7KOLE.10	45.04	8.76	Neural Network (Specific Model)	11	0.903	2382	261.277639046538	3814277	0.41	4405	1544	17510	None
+bin_metabat_SASB_CSM7KOLE.2	18.36	0.04	Neural Network (Specific Model)	11	0.924	2177	272.32474226804123	514039	0.49	582	230	4454	None
+bin_metabat_SASB_CSM7KOLE.3	15.42	0.06	Neural Network (Specific Model)	11	0.944	2547	288.0351906158358	623088	0.49	682	253	7390	None
+bin_metabat_SASB_CSM7KOLE.7	5.83	0.18	Neural Network (Specific Model)	11	0.906	146684	275.6360153256705	237533	0.52	261	10	146684	None
+bin_metabat_SASB_MSM5LLDE.1	85.75	0.14	Neural Network (Specific Model)	11	0.897	81302	343.6424261670372	3612719	0.46	3149	65	235469	None
+bin_metabat_SASB_MSM5LLDE.2	96.34	0.33	Neural Network (Specific Model)	11	0.866	76315	307.9110091743119	2321808	0.57	2180	40	221393	None
+bin_semibin_SASB_CSM7KOLE.0	17.68	0.13	Neural Network (Specific Model)	11	0.895	3290	276.360396039604	467082	0.59	505	137	14331	None
+bin_semibin_SASB_CSM7KOLE.1	45.77	0.88	Gradient Boost (General Model)	11	0.901	4330	318.24455825864277	1653306	0.5	1562	386	16396	None
+bin_semibin_SASB_CSM7KOLE.10	10.46	0.46	Neural Network (Specific Model)	11	0.884	8223	264.5268817204301	749398	0.39	837	118	30972	None
+bin_semibin_SASB_CSM7KOLE.11	14.55	3.97	Neural Network (Specific Model)	11	0.89	19781	259.4004424778761	788274	0.5	904	74	146684	None
+bin_semibin_SASB_CSM7KOLE.14	92.78	0.09	Neural Network (Specific Model)	11	0.897	65685	352.9744467860906	4474676	0.42	3796	113	353143	None
+bin_semibin_SASB_CSM7KOLE.16	10.61	0.0	Neural Network (Specific Model)	11	0.881	3151	281.17182130584195	278023	0.52	291	84	5610	None
+bin_semibin_SASB_CSM7KOLE.3	10.48	1.74	Neural Network (Specific Model)	11	0.919	3218	322.7874125874126	752315	0.41	715	228	6603	None
+bin_semibin_SASB_HSMA33MG.1	37.55	7.85	Neural Network (Specific Model)	11	0.909	3945	314.83505866114564	1502934	0.43	1449	378	18770	None
+bin_semibin_SASB_HSMA33MG.2	9.86	0.19	Neural Network (Specific Model)	11	0.84	5391	209.15863141524105	478276	0.48	643	94	18806	None
+bin_semibin_SASB_MSM5LLDE.0	6.09	0.04	Neural Network (Specific Model)	11	0.889	3492	214.14640198511165	290530	0.54	403	76	32205	None
+bin_semibin_SASB_MSM5LLDE.1	29.89	0.02	Neural Network (Specific Model)	11	0.914	3803	319.14351851851853	1129847	0.42	1080	302	10395	None
+bin_semibin_SASB_MSM5LLDE.10	6.39	0.04	Neural Network (Specific Model)	11	0.838	6460	243.23076923076923	214350	0.48	247	38	17791	None
--- a/tooldistillator.xml	Thu Oct 17 08:00:15 2024 +0000
+++ b/tooldistillator.xml	Thu Apr 10 15:02:10 2025 +0000
@@ -118,6 +118,19 @@
     --threshold '$tool.select_tool.threshold'
     --read_len '$tool.select_tool.read_len'
     --level '$tool.select_tool.level'
+        #elif $tool.select_tool.tool_list == 'checkm2':
+            #if $tool.select_tool.diamond_results_path
+    --diamond_results_path '$tool.select_tool.diamond_results_path'
+    --diamond_results_hid '$tool.select_tool.diamond_results_path.hid'
+            #end if
+            #if $tool.select_tool.protein_zip_path
+    --protein_zip_path '$tool.select_tool.protein_zip_path'
+    --protein_zip_hid '$tool.select_tool.protein_zip_path.hid'
+            #end if
+            #if $tool.select_tool.checkm2_log_path
+    --checkm2_log_path '$tool.select_tool.checkm2_log_path'
+    --checkm2_log_hid '$tool.select_tool.checkm2_log_path.hid'
+            #end if
         #elif $tool.select_tool.tool_list == 'fastp':
             #if $tool.select_tool.trimmed_forward_R1_path
     --trimmed_forward_R1_path '$tool.select_tool.trimmed_forward_R1_path'
@@ -251,6 +264,7 @@
                         <option value="bandage">Bandage</option>
                         <option value="bracken">Bracken</option>
                         <option value="bwa">BWA</option>
+                        <option value="checkm2">CheckM2</option>
                         <option value="fastp">Fastp</option>
                         <option value="fastqc">Fastqc</option>
                         <option value="filtlong">Filtlong</option>
@@ -326,6 +340,14 @@
                         <expand macro="analysis_software_version"/>
                         <expand macro="reference_database_version"/>
                     </when>
+                    <when value="checkm2">
+                        <param name="input" type="data" format="txt,tabular" multiple="false" label="CheckM2 quality report file" help="Tabular file from CheckM2 output"/>
+                        <param argument="--diamond_results_path" type="data" format="txt,tabular" optional="true" multiple="false" label="CheckM2 Diamond results file" help="DIAMOND_RESULTS file for CheckM2"/>
+                        <param argument="--protein_zip_path" type="data" format="zip,tar,tar.gz" optional="true" multiple="false" label="Archive file with protein files from CheckM2" help="Protein sequence fasta files in an archive file for CheckM2"/>
+                        <param argument="--checkm2_log_path" type="data" format="txt" multiple="false" optional="true" label="CheckM2 log file" help="Log file from CheckM2"/>
+                        <expand macro="analysis_software_version"/>
+                        <expand macro="reference_database_version"/>
+                    </when>
                     <when value="fastp">
                         <param name="input" type="data" format="json" multiple="false" label="Fastp report file" help="Fastp result in json format"/>
                         <param argument="--trimmed_forward_R1_path" type="data" format="fastq,fastq.gz" optional="true" multiple="false" label="Fastp trimmed R1" help="trimmed file R1"/>
@@ -597,6 +619,19 @@
                 </repeat>
                 <repeat name="tools">
                     <conditional name="select_tool">
+                        <param name="tool_list" value="checkm2"/>
+                        <param name="input" value="checkm2/quality_report.tsv" ftype="tabular"/>
+                        <param name="diamond_results_path" value="checkm2/DIAMOND_RESULTS.tsv"/>
+                        <param name="checkm2_log_path" value="checkm2/checkm2.log"/>
+                        <conditional name="origin">
+                            <param name="origin" value="true"/>
+                            <param name="analysis_software_version" value="1.0.2"/>
+                        </conditional>
+                        <param name="reference_database_version" value="Uniref"/>
+                    </conditional>
+                </repeat>
+                <repeat name="tools">
+                    <conditional name="select_tool">
                         <param name="tool_list" value="fastp"/>
                         <param name="input" value="fastp/fastp_report.json" ftype="json"/>
                         <param name="trimmed_forward_R1_path" value="fastp/trimmed_R1.fastq.gz"/>
@@ -771,27 +806,28 @@
                     </conditional>
                 </repeat>
             </section>
-            <output_collection name="output_json" type="list" count="20">
+            <output_collection name="output_json" type="list" count="21">
                 <expand macro="element_assert" name="abricate_0_output" text="Enterococcus faecalis V583"/>
                 <expand macro="element_assert" name="amrfinderplus_1_output" text="mercury resistance transcriptional regulator MerR"/>
                 <expand macro="element_assert" name="bakta_2_output" text="hypothetical protein"/>
                 <expand macro="element_assert" name="bandage_3_output" text="3042326"/>
                 <expand macro="element_assert" name="bracken_4_output" text="Staphylococcus_aureus"/>
                 <expand macro="element_assert" name="bwa_5_output" text="bwa_report"/>
-                <expand macro="element_assert" name="fastp_6_output" text="705053822"/>
-                <expand macro="element_assert" name="fastqc_7_output" text="Sequences flagged as poor quality"/>
-                <expand macro="element_assert" name="filtlong_8_output" text="filtlong_report"/>
-                <expand macro="element_assert" name="flye_9_output" text="contig_2"/>
-                <expand macro="element_assert" name="integronfinder2_10_output" text="2353.0"/>
-                <expand macro="element_assert" name="isescan_11_output" text="IS200/IS605"/>
-                <expand macro="element_assert" name="kraken2_12_output" text="Enterococcus_faecalis"/>
-                <expand macro="element_assert" name="plasmidfinder_13_output" text="repUS40_1_repB"/>
-                <expand macro="element_assert" name="polypolish_14_output" text="320811"/>
-                <expand macro="element_assert" name="quast_15_output" text="2944723"/>
-                <expand macro="element_assert" name="recentrifuge_16_output" text="6.4917947578"/>
-                <expand macro="element_assert" name="refseqmasher_17_output" text="GCF_000519925.1"/>
-                <expand macro="element_assert" name="shovill_18_output" text="436224"/>
-                <expand macro="element_assert" name="tabular_file_19_output" text="NP_814691"/>
+                <expand macro="element_assert" name="checkm2_6_output" text="UniRef100_B5R745"/>
+                <expand macro="element_assert" name="fastp_7_output" text="705053822"/>
+                <expand macro="element_assert" name="fastqc_8_output" text="Sequences flagged as poor quality"/>
+                <expand macro="element_assert" name="filtlong_9_output" text="filtlong_report"/>
+                <expand macro="element_assert" name="flye_10_output" text="contig_2"/>
+                <expand macro="element_assert" name="integronfinder2_11_output" text="2353.0"/>
+                <expand macro="element_assert" name="isescan_12_output" text="IS200/IS605"/>
+                <expand macro="element_assert" name="kraken2_13_output" text="Enterococcus_faecalis"/>
+                <expand macro="element_assert" name="plasmidfinder_14_output" text="repUS40_1_repB"/>
+                <expand macro="element_assert" name="polypolish_15_output" text="320811"/>
+                <expand macro="element_assert" name="quast_16_output" text="2944723"/>
+                <expand macro="element_assert" name="recentrifuge_17_output" text="6.4917947578"/>
+                <expand macro="element_assert" name="refseqmasher_18_output" text="GCF_000519925.1"/>
+                <expand macro="element_assert" name="shovill_19_output" text="436224"/>
+                <expand macro="element_assert" name="tabular_file_20_output" text="NP_814691"/>
             </output_collection>
         </test>
     </tests>
@@ -801,9 +837,10 @@
 ToolDistillator is a tool to extract information from output files of specific tools, expose it as JSON files, and aggregate over several tools.
 
 This tool here is extracting information from output files of specific tools and exposing it as JSON files
+
 ** Tool input**
 
-ToolDistillator can use several input type from at least 21 different tools and 1 generic tool for tabular file:
+ToolDistillator can use several input type from at least 22 different tools and 1 generic tool for tabular file:
 
 +----------------+----------------+-------------------+------------------------------------------------------------+
 | Tools          | Version        | Default input file| Optional files                                             |
@@ -820,6 +857,8 @@
 +----------------+----------------+-------------------+------------------------------------------------------------+
 | BWA            | 2.2.1          |  input1.bam       | input2.bam                                                 |
 +----------------+----------------+-------------------+------------------------------------------------------------+
+| CheckM2        |1.0.2           | quality_report.tsv| DIAMOND_RESULTS.tsv, protein_files.zip, checkm2.log        |
++----------------+----------------+-------------------+------------------------------------------------------------+
 | Fastp          | 0.23.2         |  output.json      |                                                            |
 +----------------+----------------+-------------------+------------------------------------------------------------+
 | Fastqc         | 0.12.1         | report.txt        | report.html                                                |
@@ -850,7 +889,7 @@
 +----------------+----------------+-------------------+------------------------------------------------------------+
 | Staramr        | 0.9.1          |  resfinder.tsv    | mlst.tsv, pointfinder.tsv, plasmidfinder.tsv, settings.tsv |
 +----------------+----------------+-------------------+------------------------------------------------------------+
-| tabular_file   |  0             |  output.tsv       | no optional files                                          |
+| tabular_file   |  0             |  output.tsv       |                                                            |
 +----------------+----------------+-------------------+------------------------------------------------------------+
 
 ** Options **