comparison protein_blast_grouping.xml @ 0:7abe5f471364 draft

planemo upload commit 7ebbd0df0aea9e58c4df58b61d6da385ee0ebb49
author cpt
date Wed, 24 Jul 2024 01:37:37 +0000
parents
children f2a7dffab581
comparison
equal deleted inserted replaced
-1:000000000000 0:7abe5f471364
1 <tool id="edu.tamu.cpt.blast.protein_grouping" name="Protein Blast Grouping" version="0.0.1">
2 <description>Based on a BLASTp result</description>
3 <macros> <!-- Imports shared macro definitions from macros.xml (that file is not shown here). -->
4 <import>macros.xml</import>
5 </macros>
6 <expand macro="requirements"/> <!-- Expands the macro named "requirements"; presumably defined in macros.xml and declaring the tool's dependencies (TODO confirm). -->
7 <command detect_errors="aggressive">
8 <![CDATA[
9 '$__tool_directory__/protein_blast_grouping.py'
10 '${blast_in.blast}'
11 --hits '$hits'
12 --sort '$sort.sortType'
13 > '$grouping_output'
14 ]]>
15 </command> <!-- Runs protein_blast_grouping.py from the tool directory with the selected BLAST dataset as the positional argument plus the hits and sort options, and redirects stdout into the grouping_output dataset. The script is invoked without an interpreter prefix, so it presumably must be executable (verify). NOTE(review): detect_errors="aggressive" should fail the job on a non-zero exit code or error-like text in the output streams; confirm against the Galaxy tool schema. -->
16 <inputs>
17 <conditional name="blast_in"> <!-- Input-format selector; TSV is the only option offered, so the single when-branch below always applies. -->
18 <param name="blastType" type="select" label="BLASTp Input Type">
19 <option value="TSV">Blast Tabular</option>
20 </param>
21 <when value="TSV">
22 <param label="BLASTp Results" name="blast" type="data" format="tsv,tabular"/> <!-- Referenced by the command as blast_in.blast. -->
23 </when>
24 </conditional>
25 <param label="Number of results to return" name="hits" type="integer" value="5" min="1" max="30"/> <!-- Handed to the script as its hits option; defaults to 5 and is bounded to 1..30. -->
26 <conditional name="sort"> <!-- Ranking criterion handed to the script as its sort option; both when-branches are empty because neither choice adds parameters. -->
27 <param name="sortType" type="select" label="Sort by">
28 <option value="unique_queries" selected="true">Unique Queries</option>
29 <option value="unique_hits">Unique Hits</option>
30 </param>
31 <when value="unique_queries"/>
32 <when value="unique_hits"/>
33 </conditional>
34 </inputs>
35 <outputs>
36 <data name="grouping_output" format="tabular" label="Top BlastP Hits"/> <!-- Tabular dataset that receives the script's stdout through the command's redirect. -->
37 </outputs>
38 <tests>
39 <test> <!-- Single regression test. The sort conditional is not set here, so sortType is presumably left at its default (unique_queries is the option marked selected); verify. -->
40 <conditional name="blast_in">
41 <param name="blastType" value="TSV"/>
42 <param name="blast" value="infile.txt"/>
43 </conditional>
44 <param name="hits" value="20"/> <!-- Overrides the form default of 5. -->
45 <output name="grouping_output" file="outfile.txt" lines_diff="1"/> <!-- Output is compared against outfile.txt; lines_diff="1" tolerates a one-line difference. -->
46 </test>
47 </tests>
48 <help>
49 **What it does**

50 * Reads a tab-delimited BLAST output file.
51 * Extracts organism names from the subject titles (text in square brackets).
52 * Counts unique query proteins that matched each organism and unique hit proteins from each organism.
53 * Sorts and displays results based on either unique queries or unique hits.
54 * The output is a formatted table showing the top N organisms with the most matches.
55 </help>
56 <expand macro="citations-2020"/>
57 </tool>