Mercurial > repos > miller-lab > genome_diversity
diff specify.xml @ 13:fdb4240fb565
Uploaded Miller Lab Devshed version a51c894f5bed
author | miller-lab |
---|---|
date | Fri, 28 Sep 2012 11:34:31 -0400 |
parents | |
children | 248b06e86022 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/specify.xml Fri Sep 28 11:34:31 2012 -0400 @@ -0,0 +1,87 @@ +<tool id="gd_specify" name="Specify Individuals" version="1.0.0"> + <description>: Define a collection of individuals from a gd_snp dataset</description> + + <command interpreter="bash"> + echo.bash "$input" "$output" + #for $individual in str($individuals).split(',') + #set $individual_idx = $input.dataset.metadata.individual_names.index($individual) + #set $individual_col = str( $input.dataset.metadata.individual_columns[$individual_idx] ) + #set $arg = '\t'.join([$individual_col, $individual, '']) + "$arg" + #end for + </command> + + <inputs> + <param name="input" type="data" format="gd_snp" label="SNP dataset"/> + <param name="individuals" type="select" display="checkboxes" multiple="true" label="Individuals to include"> + <options> + <filter type="data_meta" ref="input" key="individual_names" /> + </options> + <validator type="no_options" message="You must select at least one individual."/> + </param> + <param name="outname" type="text" size="20" label="Label for this collection"> + <validator type="empty_field" message="You must enter a label."/> + #used to be "Individuals from ${input.hid}" + </param> + </inputs> + + <outputs> + <data name="output" format="gd_indivs" label="${outname}" /> + </outputs> + + <tests> + <test> + <param name="input" value="test_in/sample.gd_snp" ftype="gd_snp" /> + <param name="individuals" value="PB1,PB2" /> + <output name="output" file="test_in/a.gd_indivs" /> + </test> + </tests> + + <help> + +**Dataset formats** + +The input dataset is in gd_snp_ format; +the output is in gd_indivs_ format. (`Dataset missing?`_) + +.. _gd_snp: ./static/formatHelp.html#gd_snp +.. _gd_indivs: ./static/formatHelp.html#gd_indivs +.. _Dataset missing?: ./static/formatHelp.html + +----- + +**What it does** + +This tool makes a list of selected entities (the sets of four columns +representing individuals or groups) from a gd_snp dataset. It does not copy +the SNP data; it just records which entities should be considered as belonging +to some collection or population. The label you specify is used to name the +output dataset in your history. This list can then be used to instruct other +tools to work on just part of the original gd_snp dataset. + +----- + +**Example** + +- input:: + + Contig161_chr1_4641264_4641879 115 C T 73.5 chr1 4641382 C 6 0 2 45 8 0 2 51 15 0 2 72 5 0 2 42 6 0 2 45 10 0 2 57 Y 54 0.323 0 + Contig48_chr1_10150253_10151311 11 A G 94.3 chr1 10150264 A 1 0 2 30 1 0 2 30 1 0 2 30 3 0 2 36 1 0 2 30 1 0 2 30 Y 22 +99. 0 + Contig20_chr1_21313469_21313570 66 C T 54.0 chr1 21313534 C 4 0 2 39 4 0 2 39 5 0 2 42 4 0 2 39 4 0 2 39 5 0 2 42 N 1 +99. 0 + etc. + +- input metadata:: + + #{"column_names":["scaf","pos","A","B","qual","ref","rpos","rnuc", + #"1A","1B","1G","1Q","2A","2B","2G","2Q","3A","3B","3G","3Q","4A","4B","4G","4Q","5A","5B","5G","5Q","6A","6B","6G","6Q", + #"pair","dist","prim","rflp"],"dbkey":"canFam2","individuals":[["PB1",9],["PB2",13],["PB3",17],["PB4",21],["PB6",25],["PB8",29]], + #"pos":2,"rPos":7,"ref":6,"scaffold":1,"species":"bear"} + +- output when individuals PB1, PB2, and PB3 are selected:: + + 9 PB1 + 13 PB2 + 17 PB3 + + </help> +</tool>