diff mafft.xml @ 14:6f28e90db932 draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/mafft commit 1570f3a28232b4b88385cdfbb68f79d80ff1dabb
author bgruening
date Tue, 31 Oct 2023 15:48:53 +0000
parents 4de39704d423
children bf28a8cff401
line wrap: on
line diff
--- a/mafft.xml	Fri Sep 30 19:24:47 2022 +0000
+++ b/mafft.xml	Tue Oct 31 15:48:53 2023 +0000
@@ -1,9 +1,10 @@
 <?xml version="1.0" encoding="UTF-8"?>
-<tool id="rbc_mafft" name="MAFFT" version="@TOOL_VERSION@+galaxy@VERSION@">
-  <description>Multiple alignment program for amino acid or nucleotide sequences</description>
+<tool id="rbc_mafft" name="MAFFT" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
+<description>Multiple alignment program for amino acid or nucleotide sequences</description>
   <macros>
     <import>macros.xml</import>
   </macros>
+  <expand macro="biotools"/>
   <expand macro="requirements" />
   <stdio>
     <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" />
@@ -229,32 +230,51 @@
       <param name="outputFormat" value="--clustalout"/>
       <output name="outputAlignment" ftype="clustal" file="mafft_nwns_result.aln" lines_diff="2" />
     </test>
+    <!-- WARNING: the results of the following test depends on #threads.
+    The result seems deterministic for single threaded execution, i.e. GALAXY_SLOTS=1 planemo test
+    However, GH CI/CD uses 2 threads and results vary -->
     <test expect_num_outputs="1" >
       <param name="inputSequences" value="sample.fa"/>
       <param name="flavourType" value="custom"/>
-      <param name="matrix_condition" value="BLOSUM"/>
+      <conditional name="matrix_condition">
+        <param name="matrix" value="BLOSUM"/>
+      </conditional>
       <param name="BLOSUM" value="62"/>
       <param name="distance_method" value="--fastapair"/>
       <param name="weighti" value="2.7"/>
       <param name="iterations" value="1000"/>
       <param name="outputFormat" value="--clustalout"/>
-      <output name="outputAlignment" ftype="clustal" file="mafft_custom_result.aln" lines_diff="2" />
+      <output name="outputAlignment" ftype="clustal" file="mafft_custom_result.aln" compare="sim_size">
+        <assert_contents>
+          <has_n_lines n="458" delta="0"/>
+          <has_text text="CLUSTAL format alignment by MAFFT F-INS-i"/>
+          <has_text text="NPIVYGISHPKY"/>
+          <has_text text="1=="/>
+          <has_text text="36=="/>
+          <has_line line="8=opsin,        ------------------------------------------------------------"/>
+        </assert_contents>
+      </output>
     </test>
   </tests>
   <help>    <![CDATA[
       **What it does**
+
       MAFFT is a multiple sequence alignment program for unix-like operating systems.
       It offers a range of multiple alignment methods, L-INS-i (accurate; for alignment of <∼200 sequences),
       FFT-NS-2 (fast; for alignment of <∼30,000 sequences), etc.
-      From the MAFFT man page, an overview of the different predefined flavours of the tool.
+      From the MAFFT man page, an overview of the different predefined flavours of the tool is as follows:
+
       **Accuracy-oriented methods:**
+
       - L-INS-i (probably most accurate; recommended for <200 sequences; iterative refinement method incorporating local pairwise alignment information):
       - mafft --localpair --maxiterate 1000 input [> output]
       - G-INS-i (suitable for sequences of similar lengths; recommended for <200 sequences; iterative refinement method incorporating global pairwise alignment information):
       - mafft --globalpair --maxiterate 1000 input [> output]
       - E-INS-i (suitable for sequences containing large unalignable regions; recommended for <200 sequences):
       - mafft --ep 0 --genafpair --maxiterate 1000 input [> output]. For E-INS-i, the --ep 0 option is recommended to allow large gaps.
+
       **Speed-oriented methods:**
+
       - FFT-NS-i (iterative refinement method; two cycles only):
       - mafft --retree 2 --maxiterate 2 input [> output]
       - FFT-NS-i (iterative refinement method; max. 1000 iterations):
@@ -271,23 +291,14 @@
       - mafft --retree 1 --maxiterate 0 --nofft --parttree input [> output]
 
       **Options:**
-      --auto
-      Automatically selects an appropriate strategy from L-INS-i, FFT-NS-i and FFT-NS-2, according to data size. Default: off (always FFT-NS-2)
-      --adjustdirection
-      Generate reverse complement sequences, as necessary, and align them together with the remaining sequences. In the case of protein alignment, these options are just ignored.
-      --op
-      Gap opening penalty, default: 1.53
-      --ep
-      Offset (works like gap extension penalty), default: 0.0
-      --maxiterate
-      Maximum number of iterative refinement, default: 0
-      --clustalout
-      Output: clustal format, default: fasta
-      --thread
-      Number of threads (if unsure, --thread -1)
-      --retree number
-      Guide tree is built number times in the progressive stage.
-      Valid with 6mer distance.  Default: 2
+
+      - --auto Automatically selects an appropriate strategy from L-INS-i, FFT-NS-i and FFT-NS-2, according to data size. Default: off (always FFT-NS-2)
+      - --adjustdirection Generate reverse complement sequences, as necessary, and align them together with the remaining sequences. In the case of protein alignment, these options are just ignored.
+      - --op Gap opening penalty, default: 1.53
+      - --ep Offset (works like gap extension penalty), default: 0.0
+      - --maxiterate Maximum number of iterative refinement, default: 0
+      - --clustalout Output: clustal format, default: fasta
+      - --retree number Guide tree is built number times in the progressive stage. Valid with 6mer distance. Default: 2
       ]]>
     </help>
   <expand macro="citations" />