comparison compute_kegg_pathways.xml @ 0:42d0805353b6 draft

planemo upload commit 0ce4c81e6d2f7af8c9b52f6c07e83b0319c2adb1-dirty
author proteore
date Wed, 19 Sep 2018 05:38:52 -0400
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:42d0805353b6
1 <tool id="compute_kegg_pathways" name="KEGG pathways coverage" version="2018.09.18">
2 <requirements>
3 <requirement type="package" version="1.18.0">bioconductor-keggrest</requirement>
4 </requirements>
5 <command detect_errors="exit_code"><![CDATA[
6 Rscript $__tool_directory__/compute_kegg_pathways.R
7
8 #if $input.ids == "text"
9 --id_list="$input.txt"
10 #else
11 --input="$input.file"
12 --id_column="$input.ncol"
13 --header="$input.header"
14 #end if
15
16 --id_type="$ref_ids.id_type"
17 --output="$output1"
18 --nb_pathways="$nb_pathways"
19 --ref="$__tool_directory__/$ref_ids.ref_file"
20
21 ]]></command>
22 <inputs>
23 <conditional name="input" >
24 <param name="ids" type="select" label="Provide your identifiers (Uniprot or Entrez gene)" help="Copy/paste or ID list from a file (e.g. table)" >
25 <option value="text">Copy/paste your identifiers</option>
26 <option value="file" selected="true">Input file containing your identifiers</option>
27 </param>
28 <when value="text" >
29 <param name="txt" type="text" label="Copy/paste your identifiers" help='IDs must be separated by "," into the form field, for example: P31946,P62258' >
30 <sanitizer invalid_char=''>
31 <valid initial="string.printable">
32 <remove value="&apos;"/>
33 </valid>
34 <mapping initial="none">
35 <add source="&apos;" target="__sq__"/>
36 </mapping>
37 </sanitizer>
38 </param>
39 </when>
40 <when value="file" >
41 <param name="file" type="data" format="txt,tabular" label="Select a file that contains your list of IDs" help="" />
42 <param name="header" type="boolean" checked="true" truevalue="true" falsevalue="false" label="Does your input file contain header?" />
43 <param name="ncol" type="text" value="c1" label="The column number of IDs to map" help='For example, fill in "c1" if it is the first column, "c2" if it is the second column and so on' />
44 </when>
45 </conditional>
46 <conditional name="ref_ids">
47 <param name="id_type" type="select" label="select your identifiers type :">
48 <option value="uniprot">Uniprot Accession number</option>
49 <option value="geneID">Entrez gene ID</option>
50 </param>
51 <when value="uniprot">
52 <param name="ref_file" type="select" label="Select species" >
53 <options from_data_table="uniprot_kegg_list"/>
54 <option>Human (Homo sapiens)</option>
55 <option>Mouse (Mus musculus)</option>
56 </param>
57 </when>
58 <when value="geneID">
59 <param name="ref_file" type="select" label="Select species" >
60 <options from_data_table="entrez_kegg_list"/>
61 <option>Human (Homo sapiens)</option>
62 <option>Mouse (Mus musculus)</option>
63 </param>
64 </when>
65 </conditional>
66 <param type="integer" name="nb_pathways" label="Set the number of pathways to be displayed in the output" value="10" help="pathways are sorted by percent of mapping gene by pathway in descending order"/>
67 </inputs>
68 <outputs>
69 <data name="output1" format="tsv" />
70 </outputs>
71 <help><![CDATA[
72
73 This tool computes the number of proteins from your list divided by the total number of protein of each KEGG pathway.
74
75 it allows you to identify the signaling pathways that are the most covered by your proteomics dataset.
76
77 By default the number of pathway to be displayed is set to 10 and sorted in descending order.
78
79 At the moment two species are supported: Human (Homo sapiens) and Mouse (Mus musculus)
80
81 **Input:**
82
83 Input can be either a list of Uniprot accession number or Entrez gene IDs (copy/paste mode) or a file containing multiple columns but with at least one column Uniprot accession number or Entrez gene IDs. If your input file contains other type of IDs, please use the ID_Converter tool.
84
85 **Output:**
86
87 The output is a tabular file (.tsv) with the following columns:
88
89 * **Pathway_ID:** KEGG pathway identifier (e.g. hsa04970)
90 * **Description:** name of the pathway as in KEGG
91 * **Ratio IDs mapped/total IDs (%):** percentage of pathway coverage
92 * **nb genes mapped in the pathway:** number of genes/proteins of your list mapped on the KEGG pathway
93 * **nb total genes present in the pathway:** total number of genes/proteins present in the KEGG pathway
94
95 -----
96
97 .. class:: infomark
98
99 **Database:**
100
101 Pathways and associated Uniprot Accession Number or Gene IDs are collected from KEGGREST package
102
103 User manual / Documentation: KEGGREST Bioconductor package https://bioconductor.org/packages/3.1/bioc/html/KEGGREST.html
104
105
106 -----
107
108 .. class:: infomark
109
110 **Galaxy integration**
111
112 David Christiany, Florence Combes, Yves Vandenbrouck CEA, INSERM, CNRS, Grenoble-Alpes University, BIG Institute, FR
113
114 Sandra Dérozier, Olivier Rué, Valentin Loux INRA, Paris-Saclay University, MAIAGE Unit, Migale Bioinformatics platform
115
116 This work has been partially funded through the French National Agency for Research (ANR) IFB project.
117
118 Contact support@proteore.org for any questions or concerns about the Galaxy implementation of this tool.
119
120 -----
121
122 compute_KEGG_pathways R script
123
124 | Arguments:
125 | --**help** Print this test
126 | --**input** tab file
127 | --**id_list** id list ',' separated
128 | --**id_type** type of input ids (uniprot_AC or geneID)
129 | --**id_column** number og column containg ids of interest
130 | --**org** organism : Hs , Mm, ...
131 | --**nb_pathways** number of pathways to return
132 | --**header** boolean
133 | --**output** output path
134 | --**ref** ref file (l.hsa.gene.RData, l.hsa.up.RData)
135 |
136 | Example:
137 | Rscript compute_KEGG_pathways.R --input='P31946,P62258' --id_type='uniprot' --id_column 'c1' --header TRUE
138 |
139
140 ]]></help>
141 <citations>
142 <citation type="bibtex">
143 @misc{githubKEGGREST,
144 title = {KEGGREST: Client-side REST access to KEGG},
145 author = {Dan Tenenbaum},
146 year = {2018},
147 note = {R package version 1.18.1},
148 publisher = {GitHub},
149 journal = {GitHub repository},
150 url = {https://github.com/Bioconductor/KEGGREST},
151 }</citation>
152 </citations>
153 </tool>