comparison tools/ncbi_blast_plus/ncbi_segmasker_wrapper.xml @ 13:623f727cdff1 draft

Uploaded v0.1.00, uses BLAST+ 2.2.29, allows custom column selection for tabular output - including taxonomy fields.
author peterjc
date Fri, 14 Mar 2014 07:40:46 -0400
parents
children 2fe07f50a41e
comparison
equal deleted inserted replaced
12:6560192c5098 13:623f727cdff1
1 <tool id="ncbi_segmasker_wrapper" name="NCBI BLAST+ segmasker" version="0.1.00">
2 <description>low-complexity regions in protein sequences</description>
3 <macros>
4 <token name="@BINARY@">segmasker</token>
5 <import>ncbi_macros.xml</import>
6 </macros>
7 <expand macro="requirements" />
8 <command>
9 ## The command is a Cheetah template which allows some Python based syntax.
10 ## Lines starting hash hash are comments. Galaxy will turn newlines into spaces
11 segmasker
12 #if $db_opts.db_opts_selector == "db":
13 -in "${db_opts.database.fields.path}" -infmt blastdb
14 #elif $db_opts.db_opts_selector == "histdb":
15 -in "${os.path.join($db_opts.histdb.extra_files_path, 'blastdb')}" -infmt blastdb
16 #else:
17 -in "$subject" -infmt fasta
18 #end if
19 -out "$outfile"
20 -window $window
21 -locut $locut
22 -hicut $hicut
23 -outfmt $outformat
24 </command>
25 <expand macro="stdio" />
26 <inputs>
27 <expand macro="input_conditional_protein_db" />
28 <param name="window" type="integer" value="12" label="SEG window length" help="(-window)" />
29 <param name="locut" type="float" value="2.2" label="SEG low cutoff" help="(-locut)" />
30 <param name="hicut" type="float" value="2.5" label="SEG high cutoff" help="(-hicut)" />
31 <param name="outformat" type="select" label="Output format">
32 <!-- seqloc_* formats are not very useful
33 and what BLAST+ calls 'interval' is not what Galaxy calls interval format
34 -->
35 <option value="fasta">FASTA</option>
36 <option value="maskinfo_asn1_bin">maskinfo ASN.1 binary</option>
37 <option value="maskinfo_asn1_text" selected="true">maskinfo ASN.1 text</option>
38 <option value="maskinfo_xml">maskinfo_xml</option>
39 </param>
40 </inputs>
41 <outputs>
42 <data name="outfile" format="maskinfo-asn1" label="SEG Masked File">
43 <change_format>
44 <when input="outformat" value="fasta" format="fasta" />
45 <when input="outformat" value="maskinfo_asn1_bin" format="maskinfo-asn1-binary" />
46 <!--
47 <when input="outformat" value="maskinfo_asn1_text" format="maskinfo-asn1" />
48 -->
49 <when input="outformat" value="maskinfo_xml" format="xml" />
50 </change_format>
51 </data>
52 </outputs>
53 <tests>
54 <test>
55 <param name="db_opts_selector" value="file" />
56 <param name="subject" value="four_human_proteins.fasta" ftype="fasta" />
57 <param name="window" value="12" />
58 <param name="locut" value="2.2" />
59 <param name="hicut" value="2.5" />
60 <param name="outformat" value="fasta" />
61 <output name="outfile" file="segmasker_four_human.fasta" />
62 </test>
63 <test>
64 <param name="db_opts_selector" value="file" />
65 <param name="subject" value="four_human_proteins.fasta" ftype="fasta" />
66 <param name="window" value="12" />
67 <param name="locut" value="2.2" />
68 <param name="hicut" value="2.5" />
69 <param name="outformat" value="maskinfo_asn1_bin" />
70 <output name="outfile" file="segmasker_four_human.maskinfo-asn1-binary" />
71 </test>
72 <test>
73 <param name="db_opts_selector" value="file" />
74 <param name="subject" value="four_human_proteins.fasta" ftype="fasta" />
75 <param name="window" value="12" />
76 <param name="locut" value="2.2" />
77 <param name="hicut" value="2.5" />
78 <param name="outformat" value="maskinfo_asn1_text" />
79 <output name="outfile" file="segmasker_four_human.maskinfo-asn1" />
80 </test>
81 </tests>
82 <help>
83 **What it does**
84
85 This tool identifies and masks out low complexity regions of a protein database (or proteins in FASTA format) by using the SEG_ algorithm.
86
87 If you select *maskinfo ASN.1* (binary or text) as output format, the output file can be used as masking data for NCBI BLAST+ makeblastdb tool.
88
89 More information about segmasker can be found in the `BLAST Command Line Applications User Manual`_.
90
91 .. _BLAST Command Line Applications User Manual: http://www.ncbi.nlm.nih.gov/books/NBK1763/
92 .. _SEG: http://www.ncbi.nlm.nih.gov/pubmed/8743706
93
94 **References**
95
96 If you use this Galaxy tool in work leading to a scientific publication please
97 cite the following papers (a more specific paper covering this wrapper is planned):
98
99 @REFERENCES@
100 </help>
101 </tool>