Mercurial > repos > malex > secimtools
annotate run_order_regression.xml @ 1:2e7d47c0b027 draft
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
author | malex |
---|---|
date | Mon, 08 Mar 2021 22:04:06 +0000 |
parents | |
children |
rev | line source |
---|---|
1
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
1 <tool id="secimtools_run_order_regression" name="Run Order Regression (ROR)" version="@WRAPPER_VERSION@"> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
2 <description>using the order samples were run.</description> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
3 <macros> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
4 <import>macros.xml</import> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
5 </macros> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
6 <expand macro="requirements" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
7 <command detect_errors="exit_code"><![CDATA[ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
8 run_order_regression.py |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
9 --input '$input' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
10 --design '$design' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
11 --ID '$uniqID' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
12 --group '$group' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
13 --order '$order' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
14 --fig '$order_plots' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
15 --table '$order_summary' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
16 --flags '$flags' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
17 ]]></command> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
18 <inputs> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
19 <param name="input" type="data" format="tabular" label="Wide Dataset" help="Input your tab-separated wide format dataset. If file is not tab separated see TIP below."/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
20 <param name="design" type="data" format="tabular" label="Design File" help="Input your design file(tab-separated). Note you need a 'sampleID' column. If not tab separated see TIP below."/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
21 <param name="uniqID" type="text" size="30" value="" label="Unique Feature ID" help="Name of the column in your wide dataset that has unique identifiers."/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
22 <param name="group" type="text" size="30" value="" label="Group/Treatment" help="Name of the column in your design file that contains group classifications."/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
23 <param name="order" type="text" size="30" value="" label="Run Order ID" help="The name of the column in your design file that contains the order the samples were run."/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
24 </inputs> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
25 <outputs> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
26 <data name="order_plots" format="pdf" label="${tool.name} on ${on_string}: Plots" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
27 <data name="order_summary" format="tabular" label="${tool.name} on ${on_string}: Summary"/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
28 <data name="flags" format="tabular" label="${tool.name} on ${on_string}: Flags"/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
29 </outputs> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
30 <tests> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
31 <test> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
32 <param name="input" value="ST000006_data.tsv"/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
33 <param name="design" value="ST000006_design.tsv"/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
34 <param name="uniqID" value="Retention_Index" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
35 <param name="group" value="White_wine_type_and_source" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
36 <param name="order" value="run_Order_fake_variable" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
37 <output name="order_plots" file="ST000006_run_order_regression_figure.pdf" compare="sim_size" delta="10000" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
38 <output name="order_summary" file="ST000006_run_order_regression_table.tsv" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
39 <output name="flags" file="ST000006_run_order_regression_flags.tsv" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
40 </test> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
41 </tests> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
42 <help><![CDATA[ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
43 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
44 @TIP_AND_WARNING@ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
45 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
46 **Tool Description** |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
47 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
48 **NOTE:** The tool is intended to evaluate the impact of sample run order on feature (row) values. Not applicable in the absence of known run order. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
49 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
50 It uses linear regression to identify features whose regression slope differs significantly from zero at nominal levels of significance. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
51 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
52 The tool fits a simple linear regression by feature (row) using values for each feature as a response and sample run order as a linear predictor. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
53 The goal is to identify linear trends over run order and determine whether those trends are statistically significant. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
54 The tool generates flags if the slope is statistically significant for two different levels of statistical significance (alpha = 0.05 and alpha = 0.01). |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
55 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
56 **NOTE:** Groups with one element are excluded from the analysis. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
57 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
58 -------------------------------------------------------------------------------- |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
59 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
60 **Input** |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
61 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
62 - Two input datasets are required. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
63 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
64 @WIDE@ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
65 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
66 **NOTE:** The sample IDs must match the sample IDs in the Design File (below). Extra columns will automatically be ignored. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
67 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
68 @METADATA@ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
69 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
70 @UNIQID@ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
71 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
72 @GROUP@ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
73 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
74 - **NOTE:** Groups with one element will be excluded. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
75 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
76 @RUNORDER@ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
77 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
78 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
79 ----------------------------------------------------------------------------------- |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
80 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
81 **Output** |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
82 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
83 This tool outputs three different files: |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
84 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
85 (1) a TSV file of regression summaries including the values of the regression slope, corresponding p-value and r-squared value. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
86 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
87 (2) a TSV file with the corresponding flags for two levels of statistical significance (alpha = 0.05 and alpha = 0.01). |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
88 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
89 (3) a PDF file with fitted regression plots for each feature. The values of the feature are displayed on the plot together with the regression line, bands, slopes, and corresponding p and r-squared values. The values are colored according to group classification. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
90 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
91 ]]></help> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
92 <expand macro="citations"/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
93 </tool> |