Mercurial > repos > cpt > cpt_putative_osp
annotate generate-putative-osp.xml @ 4:8f6c09b6a43d draft default tip
planemo upload commit 471832a126aa25d903becae9a074a6b7b1ff7092-dirty
author | cpt |
---|---|
date | Fri, 20 Sep 2024 04:02:40 +0000 |
parents | 859e18a9814a |
children |
rev | line source |
---|---|
1
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
1 <tool id="edu.tamu.cpt2.spanin.generate-putative-osp" name="OSP candidates" version="1.0"> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
2 <description>constructs a putative list of potential o-spanin from an input genomic FASTA</description> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
3 <macros> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
4 <import>macros.xml</import> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
5 </macros> |
3
859e18a9814a
planemo upload commit 09a88823322bf86d7f05f008f9dabdb60a572d3a
cpt
parents:
2
diff
changeset
|
6 <requirements> |
859e18a9814a
planemo upload commit 09a88823322bf86d7f05f008f9dabdb60a572d3a
cpt
parents:
2
diff
changeset
|
7 <requirement type="package" version="3.9">python</requirement> |
859e18a9814a
planemo upload commit 09a88823322bf86d7f05f008f9dabdb60a572d3a
cpt
parents:
2
diff
changeset
|
8 <requirement type="package" version="1.84">biopython</requirement> |
859e18a9814a
planemo upload commit 09a88823322bf86d7f05f008f9dabdb60a572d3a
cpt
parents:
2
diff
changeset
|
9 <requirement type="package" version="2024.9.11">regex</requirement> |
859e18a9814a
planemo upload commit 09a88823322bf86d7f05f008f9dabdb60a572d3a
cpt
parents:
2
diff
changeset
|
10 </requirements> |
1
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
11 <command detect_errors="aggressive"><![CDATA[ |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
12 '$__tool_directory__/generate-putative-osp.py' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
13 '$fasta_file' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
14 --strand '$strand' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
15 --switch '$switch' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
16 --osp_on '$osp_on' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
17 --osp_op '$osp_op' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
18 --osp_ob '$osp_ob' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
19 --osp_og '$osp_og' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
20 --osp_min_len '$osp_min_len' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
21 --putative_osp '$putative_osp' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
22 --summary_osp_txt '$summary_osp' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
23 --putative_osp_gff '$putative_osp_gff' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
24 --min_lipo_after '$lipo_min' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
25 --max_lipo_after '$lipo_max' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
26 --osp_max '$osp_max' |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
27 ]]></command> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
28 <inputs> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
29 <param type="select" label="Strand Choice" name="strand"> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
30 <option value="both">both</option> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
31 <option value="forward">+</option> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
32 <option value="reverse">-</option> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
33 </param> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
34 <param label="Single Genome FASTA" name="fasta_file" type="data" format="fasta"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
35 <param label="o-spanin minimal length" name="osp_min_len" type="integer" value="45"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
36 <param label="o-spanin maximum length" name="osp_max" type="integer" value="200"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
37 <param label="Range Selection; default is all; for a specific range to check for a spanin input integers separated by a colon (eg. 1234:4321)" type="text" name="switch" value="all"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
38 <param label="Lipobox minimal distance from start codon" name="osp_min_dist" type="integer" value="10"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
39 <param label="Lipobox maximum distance from start codon" name="osp_max_dist" type="integer" value="60" help="Searches for a Lipobox between Lipoboxmin and Lipoboxmax ie [Lipoboxmin,Lipoboxmax]"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
40 <param label="Minimum amount of residues after lipobox is found" name="lipo_min" type="integer" value="25"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
41 <param label="Maximum amount of residues after lipobox is found" name="lipo_max" type="integer" value="170"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
42 </inputs> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
43 <outputs> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
44 <data format="fasta" name="osp_on" label="NucSequences.fa" hidden="true"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
45 <data format="fasta" name="osp_op" label="ProtSequences.fa" hidden="true"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
46 <data format="bed" name="osp_ob" label="BED_Output.bed" hidden="true"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
47 <data format="gff3" name="osp_og" label="GFF_Output.gff" hidden="true"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
48 <data format="fasta" name="putative_osp" label="putative_osp.fa"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
49 <data format="txt" name="summary_osp" label="summary_osp.txt"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
50 <data format="gff3" name="putative_osp_gff" label="putative_osp.gff3"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
51 </outputs> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
52 <help><![CDATA[ |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
53 |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
54 **What it does** |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
55 Searches a genome for candidate o-spanins (OSPs), phage proteins involved in outer membrane disruption during Gram-negative bacterial host cell lysis. |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
56 |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
57 |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
58 **METHODOLOGY** |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
59 |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
60 Locates ALL potential start sequences, based on ATG / TTG / GTG (M / L / V). This list is pared down to those within the user-set min/max lengths. That filtered list generates a set of files with the ORFs in FASTA (nt and aa), BED, and GFF3 file formats. |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
61 |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
62 For each sequence in the protein FASTA, the tool then searches within the user-specified range (min/max distance from start codon) for a match to a regular expression (RegEx) that identifies a potential lipobox. The following patterns are accepted as a potential lipobox: |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
63 |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
64 * [ILMFTV][^REKD][GAS]C |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
65 * AW[AGS]C |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
66 |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
67 Finally, the protein list is filtered for size with user-set periplasmic length parameters, calculated as the number of residues after the putative lipobox. |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
68 |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
69 **INPUT** --> Genomic FASTA |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
70 *NOTE: This tool only takes a SINGLE genomic fasta. It does not work with multiFASTAs.* |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
71 |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
72 **OUTPUT** --> putative_osp.fa (FASTA) file, putative_osp.gff3, and a basic summary statistics file, summary_osp.txt |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
73 Protein sequences which passed the above filters are returned as the candidate OSPs. |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
74 ]]></help> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
75 <expand macro="citations-crr"/> |
05b97a4dce94
planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
cpt
parents:
diff
changeset
|
76 </tool> |