comparison prot_features.xml @ 0:e3b52db3d583 draft

planemo upload commit abb24d36c776520e73220d11386252d848173697-dirty
author proteore
date Sun, 26 Nov 2017 19:45:52 -0500
parents
children bfc679370c64
comparison
equal deleted inserted replaced
-1:000000000000 0:e3b52db3d583
1 <tool id="prot_features" name="Protein Features (neXtProt)" version="0.1.0">
2 <description>
3 obtains different features of your protein list from neXtProt.
4 </description>
5 <requirements> <!-- NOTE(review): no requirement is declared although the command invokes Rscript; confirm how R is provisioned -->
6 </requirements>
7 <stdio>
8 <exit_code range="1:" /> <!-- rule covering every exit code from 1 upwards -->
9 </stdio>
10 <command><![CDATA[
11 ## Runs get_data_nextprot.R for the selected input mode; each option must be its own shell word (space-separated).
12 #if $inputtype.filetype == "copy_paste":
13 Rscript --vanilla $__tool_directory__/get_data_nextprot.R --inputtype copypaste --input '$inputtype.genelist' --nextprot $__tool_directory__/result_nextprot.txt --column c1 --argsP1 '$Nextprot_params.P1' --argsP2 '$Nextprot_params.P2' --argsP3 '$Nextprot_params.P3' --type '$idtype' --output '$output' --header None
14 #end if
15
16 #if $inputtype.filetype == "file_all":
17
18 Rscript --vanilla $__tool_directory__/get_data_nextprot.R --inputtype tabfile --input '$inputtype.genelist' --nextprot $__tool_directory__/result_nextprot.txt --column '$inputtype.column' --argsP1 '$Nextprot_params.P1' --argsP2 '$Nextprot_params.P2' --argsP3 '$Nextprot_params.P3' --type '$idtype' --output '$output' --header '$inputtype.header'
19
20 #end if
21
22
23 ]]></command>
24
25 <inputs>
26 <conditional name="inputtype"> <!-- input mode switch; the command branches on $inputtype.filetype -->
27 <param name="filetype" type="select" label="Select your type of input file">
28 <option value="file_all">Input file containing your identifiers</option>
29 <option value="copy_paste">Copy/paste your list of IDs</option>
30 </param>
31 <when value="copy_paste"> <!-- in this mode the command passes fixed values: column c1 and header None -->
32 <param name="genelist" type="text" label="Enter a list of identifiers"/>
33 </when>
34 <when value="file_all"> <!-- in this mode column and header are forwarded to the script as given here -->
35 <param name="genelist" type="data" format="txt,tabular" label="Choose a multiple-columns file" help="This file must imperatively have 1 column filled with IDs consistent with the database that will be used. Please use the MappingIDs component if this is not the case."/>
36 <param name="column" type="text" label="Please specify the column where you would like to apply the comparison (e.g : Enter c1)" value="c1"/>
37 <param name="header" type="select" label="Does your file have a header?" multiple="false" optional="false">
38 <option value="TRUE" selected="true">Yes</option>
39 <option value="FALSE" selected="false">No</option>
40 </param>
41 </when>
42 </conditional>
43 <param name="idtype" type="select" label="Type of your input ids" multiple="false" optional="false"> <!-- forwarded to the script as the type option -->
44 <option value="nextprot" selected="false">Nextprot IDs</option>
45 <option value="uniprot" selected="true">Uniprot IDs</option>
46 </param>
47
48 <section name="Nextprot_params" title="Choose the type of information (compulsory step)" expanded="True"> <!-- P1, P2 and P3 are forwarded as argsP1, argsP2 and argsP3 -->
49 <param name="P1" type="select" label="Physico-Chemical Features" multiple="true" help="Choose the information you want to add to your data from Nextprot" display="checkboxes" optional="true">
50 <option value="MW" selected="false">Molecular Weight</option>
51 <option value="SeqLength" selected="false">Sequence Length</option>
52 <option value="IsoPoint" selected="false">Isoelectric point</option>
53 <option value="TMDomains" selected="false">Number of transmembrane domains</option>
54 <option value="ProteinExistence" selected="false">Protein Existence (PE level)</option>
55 </param>
56
57 <param name="P2" type="select" label="Localization" multiple="true" help="Choose the information you want to add to your data from Nextprot" display="checkboxes" optional="true">
58 <option value="Chr" selected="false">Chromosome</option>
59 <option value="SubcellLocations" selected="false">Subcellular Location</option>
60 </param>
61
62 <param name="P3" type="select" label="Diseases information">
63 <option value="Diseases">Yes</option>
64 <option value="None">No</option>
65 </param>
66 </section>
67
68 </inputs>
69
70
71 <outputs>
72 <data name="output" format="tsv" label="Add information from neXtProt"/>
73 <!-- Static label: this tool defines no input named database_type, so the label must not interpolate it. -->
74
75 </outputs>
76
77
78 <tests>
79 <test> <!-- file-input mode, neXtProt IDs, every feature selected -->
80 <conditional name="inputtype">
81 <param name="filetype" value="file_all"/>
82 <param name="genelist" value="mitochondrion_enzymes_Nextprot.txt"/>
83 <param name="column" value="c1"/>
84 <param name="header" value="TRUE"/>
85 </conditional>
86
87 <param name="idtype" value="nextprot"/>
88
89 <section name="Nextprot_params">
90 <param name="P1" value="MW,SeqLength,IsoPoint,TMDomains,ProteinExistence"/>
91 <param name="P2" value="Chr,SubcellLocations"/>
92 <param name="P3" value="Diseases"/>
93 </section>
94
95 <output name="output" file="output_get_data.tsv"/>
96 </test>
97 </tests>
98
99 <help><![CDATA[
100
101 This tool filters an input **tabular** file according to different databases.
102
103 **Input**
104
105 Input can be a file containing multiple fields but with **at least one column of neXtProt or UniProt IDs** or a list of neXtProt or UniProt IDs. If your input file contains other kinds of IDs, please refer to the MappingIDs component to create a column of neXtProt or UniProt IDs.
106
107 **Databases**
108
109 The input file will be filtered using information from different sources :
110
111 - HPA normal tissue : will filter the input according to the data contained in the Human Protein Atlas webservice. Pertinent information, such as tissue location, will be added for each gene to your input file.
112
113 - HPA cancer tissue : will filter the input according to the data contained in the Human Protein Atlas webservice for cancer. Pertinent information, such as tumor type, will be added for each gene to your input file.
114
115 **Parameters**
116
117 For HPA normal tissue :
118
119 - tissue category : categories based on RNA-Seq data to estimate the transcript abundance of each protein-coding gene in tissues. For more information, please refer to http://www.proteinatlas.org/about/assays+annotation#rna .
120
121 - level of detection IF : level of detection of the protein associated to the coding gene tissues based on immunofluorescence. For more information, please refer to http://www.proteinatlas.org/about/assays+annotation#if .
122
123 - level of detection IH : level of detection of the protein associated to the coding gene tissues based on immunohistochemistry. For more information, please refer to http://www.proteinatlas.org/about/assays+annotation#ih .
124
125 For HPA cancer tissue :
126
127 - tumors : which tumors are associated with your protein-coding genes according to the Human Protein Atlas.
128
129
130 **Outputs**
131
132 The output will be a tabular file. The initial columns will be kept, but lines can be deleted due to the filtering process. Additional columns will be added according to which data you chose to filter your input with.
133
134
135 **Data sources**
136
137 The data for HPA normal tissue was retrieved from the Human Protein Atlas downloadable data repository (http://www.proteinatlas.org/download/proteinatlas.tab.gz).
138
139 The data for HPA cancer was retrieved from the Human Protein Atlas downloadable data repository (http://www.proteinatlas.org/download/cancer.csv.zip).
140 ]]></help>
141
142 <citations>
143 </citations>
144
145 </tool>