Mercurial > repos > cpt > cpt_lipory
comparison lipory.xml @ 4:b79df4966ebb draft
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
author | cpt |
---|---|
date | Mon, 05 Jun 2023 02:45:43 +0000 |
parents | |
children | 2654bcd9b14d |
comparison
equal
deleted
inserted
replaced
3:68e1e56e338a | 4:b79df4966ebb |
---|---|
1 <tool id="edu.tamu.cpt.fasta.lipory" name="Identify Lipoboxes" version="19.1.0.0"> <!-- Galaxy wrapper: runs lipory.py on a GFF3 of ORF calls plus a genome FASTA and writes a GFF3 of lipobox hits --> | |
2 <description> in protein sequences</description> | |
3 <macros> | |
4 <import>macros.xml</import> | |
5 <import>cpt-macros.xml</import> | |
6 </macros> | |
7 <expand macro="requirements"> <!-- macro presumably defined in one of the imported macro files (not visible here); the regex package is added on top of it --> | |
8 <requirement type="package" version="2022.1.18">regex</requirement> | |
9 </expand> | |
10 <!-- The interpreter attribute is deprecated in Galaxy; call python explicitly on the script in the tool directory. Standard output is redirected into the single output dataset. --> <command detect_errors="aggressive"><![CDATA[python '$__tool_directory__/lipory.py' | |
11 '$positional_1' | |
12 '$positional_2' | |
13 | |
14 --lipobox_mindist '$lipobox_mindist' | |
15 --lipobox_maxdist '$lipobox_maxdist' | |
16 | |
17 > '$default']]></command> | |
18 <inputs> <!-- the two datasets are passed positionally, in this order; the two distances are passed as named options --> | |
19 <param label="Naive orf calls" name="positional_1" type="data" format="gff3"/> | |
20 <param label="Genome" name="positional_2" type="data" format="fasta"/> | |
21 <param label="Minimum distance in codons to start of lipobox" name="lipobox_mindist" type="integer" value="10"/> | |
22 <param label="Maximum distance in codons to start of lipobox" name="lipobox_maxdist" type="integer" value="40"/> | |
23 </inputs> | |
24 <outputs> | |
25 <data format="gff3" name="default" label="Lipoboxes from ${on_string}"/> | |
26 </outputs> | |
27 <tests> | |
28 <test> <!-- uses a maximum distance of 60 rather than the default of 40 --> | |
29 <param name="positional_1" value="T7_LiporyIn.gff3"/> | |
30 <param name="positional_2" value="T7_LiporyIn.fasta"/> | |
31 <param name="lipobox_mindist" value="10"/> | |
32 <param name="lipobox_maxdist" value="60"/> | |
33 <output name="default" value="T7_LiporyOut.gff3"/> | |
34 </test> | |
35 </tests> | |
36 <help><![CDATA[ | |
37 **What it does** | |
38 | |
39 Identifies possible LipoBoxes from an input GFF3 and FASTA. | |
40 | |
41 **How it works** | |
42 | |
43 Searches in the first 10-40 amino acids of an input protein sequence using regular expressions | |
44 for a 4-amino acid motif based on the consensus sequences described in (**Babu** et al. 2006. *J | |
45 Bacteriol.* 188(8):2761-2773 and **Kongari** *et al.* 2018 *BMC Bioinformatics*. 19:326). The | |
46 amino acids allowed here are relaxed to allow for the diversity of amino acids known to occur in lipoboxes. | |
47 | |
48 Position 1: ILMFTV or only A | |
49 | |
50 Position 2: any residue except REKD or only W | |
51 | |
52 Position 3: GAS | |
53 | |
54 Position 4: C | |
55 | |
56 ]]></help> | |
57 <expand macro="citations-2020"/> | |
58 </tool> | |