Mercurial > repos > malex > secimtools
annotate subset_data.xml @ 1:2e7d47c0b027 draft
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
author | malex |
---|---|
date | Mon, 08 Mar 2021 22:04:06 +0000 |
parents | |
children | caba07f41453 |
rev | line source |
---|---|
1
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
1 <tool id="secimtools_subset_data" name="Subset Wide Data and Design File" version="@WRAPPER_VERSION@"> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
2 <description>- Based on groups.</description> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
3 <requirements> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
4 <requirement type="python-module">os</requirement> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
5 <requirement type="python-module">pandas</requirement> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
6 <requirement type="python-module">interface</requirement> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
7 </requirements> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
8 <command detect_errors="exit_code"><![CDATA[ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
9 subset_data.py |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
10 --input '$input' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
11 --design '$design' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
12 --uniqID '$uniqID' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
13 #if $group |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
14 --group '$group' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
15 #end if |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
16 --drops '$toDrop' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
17 --out '$out' |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
18 ]]></command> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
19 <inputs> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
20 <param name="input" type="data" format="tabular" label="Wide Dataset" help="Input your tab-separated wide format dataset. If not tab separated see TIP below."/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
21 <param name="design" type="data" format="tabular" label="Design File" help="Input your design file (tab-separated). Note you need a 'sampleID' column. If not tab separated see TIP below."/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
22 <param name="uniqID" type="text" size="30" value="" label="Unique Feature ID" help="Name of the column in your wide dataset that has unique identifiers."/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
23 <param name="group" type="text" size="30" value="" optional="true" label="Group/Treatment [Optional]" help="Name of the column in your design file that contains group classifications. If not provided, the drop will be performed by 'sampleID'."/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
24 <param name="toDrop" type="text" size="30" optional="false" label="Group(s)/Sample(s) to drop" help="Name of the Group(s)/Sample(s), comma separated, that will be removed from your wide dataset."/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
25 </inputs> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
26 <outputs> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
27 <data format="tabular" name="out" label="${tool.name} on ${on_string}: Value"/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
28 </outputs> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
29 <macros> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
30 <import>macros.xml</import> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
31 </macros> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
32 <tests> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
33 <test> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
34 <param name="input" value="ST000006_data.tsv"/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
35 <param name="design" value="ST000006_design_names_underscore.tsv"/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
36 <param name="uniqID" value="Retention_Index" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
37 <param name="group" value="White_wine_type_and_source" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
38 <param name="toDrop" value="Chardonnay_ Napa_ CA 2003,Riesling_ CA 2004" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
39 <output name="out" file="ST000006_subset_data_output.tsv" /> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
40 </test> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
41 </tests> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
42 <help><![CDATA[ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
43 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
44 @TIP_AND_WARNING@ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
45 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
46 **Tool Description** |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
47 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
48 The tool creates a new wide format dataset and design dataset based on the existing wide and design datasets, from which the groups (or samples) specified by the user have been removed. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
49 The user chooses which group(s) or sample(s) to drop from the new datasets. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
50 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
51 -------------------------------------------------------------------------------- |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
52 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
53 **Input** |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
54 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
55 - Two input datasets are required. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
56 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
57 @WIDE@ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
58 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
59 **NOTE:** The sample IDs must match the sample IDs in the Design File |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
60 (below). Extra columns will automatically be ignored. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
61 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
62 @METADATA@ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
63 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
64 @UNIQID@ |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
65 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
66 **Group/Treatment [Optional]** |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
67 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
68 - Name of the column in your Design File that contains group classifications. If none is provided, the drop will be performed by 'sampleID'. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
69 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
70 **Group(s)/Sample(s) to drop** |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
71 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
72 - Name of the Group(s)/Sample(s), comma separated, that will be removed from your wide dataset. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
73 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
74 -------------------------------------------------------------------------------- |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
75 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
76 **Output** |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
77 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
78 This tool will output two TSV files: a TSV file containing the subset of the original wide format dataset and a TSV file containing the subset of the original design dataset. Both datasets will contain only the samples that remain after the user-specified group(s)/sample(s) have been dropped. |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
79 |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
80 ]]></help> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
81 <expand macro="citations"/> |
2e7d47c0b027
"planemo upload for repository https://malex@toolshed.g2.bx.psu.edu/repos/malex/secimtools"
malex
parents:
diff
changeset
|
82 </tool> |