annotate rank_pathways.xml @ 28:184d14e4270d

Update to Miller Lab devshed revision 4ede22dd5500
author Richard Burhans <burhans@bx.psu.edu>
date Wed, 17 Jul 2013 12:46:46 -0400
parents 8997f2ca8c7a
children a631c2f6d913
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
27
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
1 <tool id="gd_calc_freq" name="Rank Pathways" version="1.2.0">
22
95a05c1ef5d5 update to devshed revision aaece207bd01
Richard Burhans <burhans@bx.psu.edu>
parents: 21
diff changeset
2 <description>: Assess the impact of a gene set on KEGG pathways</description>
14
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
3
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
4 <command interpreter="python">
27
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
5 #if $rank_by.choice == 'pct'
22
95a05c1ef5d5 update to devshed revision aaece207bd01
Richard Burhans <burhans@bx.psu.edu>
parents: 21
diff changeset
6 rank_pathways_pct.py
27
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
7 --input '$rank_by.input1'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
8 --columnENSEMBLT '$rank_by.t_col1'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
9 --inBckgrndfile '$rank_by.input2'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
10 --columnENSEMBLTBckgrnd '$rank_by.t_col2'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
11 --columnKEGGBckgrnd '$rank_by.k_col2'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
12 --statsTest '$rank_by.stat'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
13 --output '$output'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
14 #else if $rank_by.choice == 'paths'
14
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
15 calclenchange.py
27
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
16 '--loc_file=${GALAXY_DATA_INDEX_DIR}/gd.rank.loc'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
17 '--species=${rank_by.input.metadata.dbkey}'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
18 '--input=${rank_by.input}'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
19 '--output=${output}'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
20 '--posKEGGclmn=${rank_by.kpath}'
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
21 '--KEGGgeneposcolmn=${rank_by.kgene}'
14
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
22 #end if
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
23 </command>
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
24
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
25 <inputs>
27
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
26 <conditional name="rank_by">
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
27 <param name="choice" type="select" label="Rank by">
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
28 <option value="pct" selected="true">percentage of genes affected</option>
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
29 <option value="paths">change in length and number of paths</option>
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
30 </param>
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
31 <when value="pct">
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
32 <!-- using fields similar to the Rank Terms tool -->
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
33 <param name="input1" type="data" format="tabular" label="Query dataset" />
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
34 <param name="t_col1" type="data_column" data_ref="input1" label="Column with ENSEMBL transcript codes" />
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
35 <param name="input2" type="data" format="tabular" label="Background dataset" />
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
36 <param name="t_col2" type="data_column" data_ref="input2" label="Column with ENSEMBL transcript codes" />
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
37 <param name="k_col2" type="data_column" data_ref="input2" label="Column with KEGG pathways" />
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
38 <param name="stat" type="select" label="Statistic for determining enrichment/depletion">
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
39 <option value="fisher" selected="true">two-tailed Fisher's exact test</option>
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
40 <option value="hypergeometric">hypergeometric test</option>
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
41 <option value="binomial">binomial probability</option>
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
42 </param>
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
43 </when>
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
44 <when value="paths">
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
45 <param name="input" type="data" format="tabular" label="Dataset" />
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
46 <param name="kgene" type="data_column" data_ref="input" label="Column with KEGG gene ID" />
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
47 <param name="kpath" type="data_column" data_ref="input" numerical="false" label="Column with KEGG pathways" />
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
48 </when>
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
49 </conditional>
14
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
50 </inputs>
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
51
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
52 <outputs>
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
53 <data name="output" format="tabular" />
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
54 </outputs>
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
55
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
56 <tests>
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
57 <test>
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
58 </test>
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
59 </tests>
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
60
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
61 <help>
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
62
21
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
63 **Dataset formats**
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
64
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
65 The query dataset has a column containing ENSEMBL transcript codes for
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
66 the gene set of interest, while the background dataset has one column
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
67 with ENSEMBL transcript codes and another with KEGG pathways, for some larger
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
68 universe of genes.
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
69
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
70 All of the input and output datasets are in tabular_ format. The input
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
71 dataset (i.e. query) to rank by "percentage of genes affected" has a
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
72 column containing ENSEMBL transcript codes for the gene set of interest,
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
73 while the background dataset has one column with ENSEMBL transcript
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
74 codes and another with KEGG pathways, for some larger universe of genes.
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
75 The input dataset to rank by "change in length and number of paths"
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
76 must have columns with KEGG gene ID and pathways. The output datasets
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
77 are described below. (`Dataset missing?`_)
21
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
78
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
79 .. _tabular: ./static/formatHelp.html#tab
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
80 .. _Dataset missing?: ./static/formatHelp.html
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
81
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
82 -----
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
83
14
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
84 **What it does**
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
85
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
86 Given a query set of genes from a larger background dataset, this tool
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
87 evaluates the over- or under-representation of KEGG pathways in the query
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
88 set, using the specified statistical test. Alternatively, the tool ranks
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
89 the pathways based on the change in length and number of paths connecting
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
90 sources and sinks. This change is calculated between graphs representing
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
91 pathways with and without excluding the nodes that represent the genes
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
92 in an input list. Sources are all the nodes representing the initial
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
93 reactants/products in the pathway. Sinks are all the nodes representing
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
94 the final reactants/products in the pathway.
14
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
95
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
96 If pathways are ranked by percentage of genes affected, the output
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
97 contains a row for each KEGG pathway, with the following columns:
14
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
98
27
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
99 1. count: the number of genes in the query set that are in this pathway
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
100 2. representation: the percentage of this pathway's genes (from the background dataset) that appear in the query set
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
101 3. ranking of this pathway, based on its representation ("1" is highest)
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
102 4. probability of depletion of this pathway in the query dataset
8997f2ca8c7a Update to Miller Lab devshed revision bae0d3306d3b
Richard Burhans <burhans@bx.psu.edu>
parents: 22
diff changeset
103 5. probability of enrichment of this pathway in the query dataset
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
104 6. name of the pathway
14
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
105
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
106 If pathways are ranked by change in length and number of paths, the
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
107 output is a tabular dataset with the following columns:
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
108
21
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
109 1. change in the mean length of paths between sources and sinks
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
110 2. mean length of paths between sources and sinks in the pathway including the genes in the input dataset. If the pathway does not have sources/sinks, the length is assumed to be infinite (I)
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
111 3. mean length of paths between sources and sinks in the pathway excluding the genes in the input dataset. If the pathway does not have sources/sinks, the length is assumed to be infinite (I)
21
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
112 4. rank of the change in the mean length of paths between sources and sinks (from high change to low change)
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
113 5. change in the number of paths between sources and sinks
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
114 6. number of paths between sources and sinks in the pathway including the genes in the input dataset. If the pathway does not have sources/sinks, it is assumed to be a circuit (C)
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
115 7. number of paths between sources and sinks in the pathway excluding the genes in the input dataset. If the pathway does not have sources/sinks, it is assumed to be a circuit (C)
21
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
116 8. rank of the change in the number of paths between sources and sinks (from high change to low change)
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
117 9. name of the pathway
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
118
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
119 -----
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
120
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
121 **Examples**
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
122
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
123 Rank by percentage of genes affected:
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
124
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
125 - input background dataset (column 5 for ENSEMBL transcript, column 12 for KEGG pathways, two-tailed Fisher's exact test for statistic)::
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
126
21
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
127 Contig39_chr1_3261104_3261850 414 chr1 3261546 ENSCAFT00000000001 ENSCAFP00000000001 S 667 F 476153 probably damaging cfa00230=Purine metabolism.cfa00500=Starch and sucrose metabolism.cfa00740=Riboflavin metabolism.cfa00760=Nicotinate and nicotinamide metabolism.cfa00770=Pantothenate and CoA biosynthesis.cfa01100=Metabolic pathways
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
128 Contig62_chr1_19011969_19012646 265 chr1 19012240 ENSCAFT00000000144 ENSCAFP00000000125 * 161 R 483960 probably damaging N
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
129 etc.
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
130
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
131 - input query dataset (column 5 for ENSEMBL transcript)::
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
132
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
133 Contig12_chr20_101969_112646 265 chr20 9822141 ENSCAFT00000001234 ENSCAFP00000021123 T 101 R 476153 probably damaging
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
134 Contig39_chr1_3261104_3261850 414 chr1 3261546 ENSCAFT00000000001 ENSCAFP00000000001 S 667 F 476153 probably damaging
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
135 etc.
21
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
136
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
137 - output::
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
138
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
139 3 0.20 1 1.0 0.0065 cfa03450=Non-homologous end-joining
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
140 1 0.067 2 1.0 0.019 cfa00750=Vitamin B6 metabolism
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
141 2 0.062 3 1.0 0.021 cfa00290=Valine, leucine and isoleucine biosynthesis
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
142 1 0.037 4 1.0 0.035 cfa00770=Pantothenate and CoA biosynthesis
21
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
143 etc.
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
144
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
145 Rank by change in length and number of paths:
21
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
146
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
147 - input (column 10 for KEGG gene ID, column 12 for KEGG pathways)::
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
148
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
149 Contig39_chr1_3261104_3261850 414 chr1 3261546 ENSCAFT00000000001 ENSCAFP00000000001 S 667 F 476153 probably damaging cfa00230=Purine metabolism.cfa00500=Starch and sucrose metabolism.cfa00740=Riboflavin metabolism.cfa00760=Nicotinate and nicotinamide metabolism.cfa00770=Pantothenate and CoA biosynthesis.cfa01100=Metabolic pathways
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
150 Contig62_chr1_19011969_19012646 265 chr1 19012240 ENSCAFT00000000144 ENSCAFP00000000125 * 161 R 483960 probably damaging N
21
d6b961721037 Miller Lab Devshed version 4c04e35b18f6
Richard Burhans <burhans@bx.psu.edu>
parents: 14
diff changeset
151 etc.
14
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
152
28
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
153 - output::
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
154
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
155 3.64 8.44 4.8 2 4 9 5 1 cfa00260=Glycine, serine and threonine metabolism
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
156 7.6 9.6 2 1 3 5 2 2 cfa00240=Pyrimidine metabolism
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
157 0.05 2.67 2.62 6 1 30 29 3 cfa00982=Drug metabolism - cytochrome P450
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
158 -0.08 8.33 8.41 84 1 30 29 3 cfa00564=Glycerophospholipid metabolism
184d14e4270d Update to Miller Lab devshed revision 4ede22dd5500
Richard Burhans <burhans@bx.psu.edu>
parents: 27
diff changeset
159 etc.
14
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
160 </help>
8ae67e9fb6ff Uploaded Miller Lab Devshed version a51c894f5bed again [possible toolshed.g2 bug]
miller-lab
parents:
diff changeset
161 </tool>