Mercurial > repos > greg > affy2vcf
changeset 0:a1e53778a82b draft
Uploaded
author | greg |
---|---|
date | Fri, 12 Oct 2018 09:46:32 -0400 |
parents | |
children | a2f0931898be |
files | .shed.yml affy2vcf.xml all_fasta.loc.sample tool_data_table_conf.xml.sample |
diffstat | 4 files changed, 152 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/.shed.yml Fri Oct 12 09:46:32 2018 -0400 @@ -0,0 +1,11 @@ +name: affy2vcf +owner: greg +description: | + Contains a tool that converts Affymetrix genotype calls and intensity files to VCF format. +homepage_url: https://github.com/freeseek/gtc2vcf +long_description: | + Contains a tool that converts Affymetrix genotype calls and intensity files to VCF format. +remote_repository_url: https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/convert_formats/affy2vcf +type: unrestricted +categories: + - Convert Formats
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/affy2vcf.xml Fri Oct 12 09:46:32 2018 -0400 @@ -0,0 +1,116 @@ +<tool id="affr2vcf" name="Convert Affymetrix" version="1.9"> + <description>genotype calls and intensities to VCF</description> + <requirements> + <requirement type="package" version="1.9">bcftools-gtc2vcf-plugin</requirement> + </requirements> + <command detect_errors="exit_code"><![CDATA[ +#set text_outputs_dir = 'text_outputs' +export BCFTOOLS_PLUGINS=\$(dirname `which bcftools`)/../libexec/bcftools && +mkdir $text_outputs_dir && +bcftools +\$BCFTOOLS_PLUGINS/affy2vcf.so +#if str($reference_genome_source_cond.reference_genome_source) == "history": + --fasta-ref '$reference_genome_source_cond.history_item' +#else: + --fasta-ref '$reference_genome_source_cond.locally_cached_item' +#end if +--annot '$annot' +--snp-posteriors '$snp_posteriors' +--summary '$summary' +--report '$report' +--calls '$calls' +--confidences '$confidences' +#if str($output_gender_estimate_cond.output_gender_estimate) == "yes" + --sex '$gender_estimate' +#end if +#if str($append_version) == "no": + --no-version +#end if +--output '$output' +--output-type $output_type +--threads \${GALAXY_SLOTS:-4} + ]]></command> + <inputs> + <conditional name="reference_genome_source_cond"> + <param name="reference_genome_source" type="select" label="Will you select a reference reference genome from your history or use a locally cached genome index?"> + <option value="history" selected="true">Use a reference genome from my history</option> + <option value="cached">Use a locally cached genome index</option> + </param> + <when value="history"> + <param name="history_item" type="data" format="fasta" label="Select reference genome" /> + </when> + <when value="cached"> + <param name="locally_cached_item" type="select" format="fasta" label="Fasta reference sequence"> + <options from_data_table="all_fasta"> + <column name="name" index="1"/> + <column name="value" index="2"/> + <column name="path" index="2"/> + <filter type="sort_by" column="1"/> + <validator type="no_options" message="No cached Fasta genome references are available." /> + </options> + </param> + </when> + </conditional> + <param name="annot" type="data" format="csv" label="Probeset annotation file" /> + <param name="summary" type="data" format="txt" label="Apt-probeset genotype summary file" /> + <param name="snp_posteriors" type="data" format="txt" label="Apt-probeset genotype snp-posteriors file" /> + <param name="report" type="data" format="txt" label="Apt-probeset genotype report file" /> + <param name="confidences" type="data" format="txt" label="Apt-probeset genotype confidences file" /> + <param name="calls" type="data" format="txt" label="Apt-probeset genotype calls file" /> + <conditional name="output_gender_estimate_cond"> + <param name="output_gender_estimate" type="select" force_select="true" label="Output apt-probeset-genotype gender estimate?"> + <option value="no" selected="true">No</option> + <option value="yes">Yes</option> + </param> + <when value="no"/> + <when value="yes"/> + </conditional> + <param name="append_version" type="select" force_select="true" label="Append version and command line to the header?"> + <option value="no" selected="true">No</option> + <option value="yes">Yes</option> + </param> + <param name="output_type" type="select" force_select="true" label="Select format for output?"> + <option value="v" selected="true">Uncompressed VCF</option> + <option value="z">Compressed VCF</option> + <option value="u" selected="true">Uncompressed BCF</option> + <option value="b">Compressed BCF</option> + </param> + </inputs> + <outputs> + <data name="output" format="vcf" /> + <data name="output_gender_estimate" format="txt" label="${tool.name} (gender estimate) on ${on_string}"> + <filter>output_gender_estimate_cond['output_gender_estimate'] == "yes"</filter> + </data> + </outputs> + <tests> + <test> + <param name="reference_genome_source" value="history"/> + <param name="history_item" value="GCF_000222465.1_Adig_1.1_genomic.fna" ftype="fasta"/> + <param name="annot" value="annot.csv" ftype="csv"/> + <param name="summary" value="summary.txt" ftype="txt"/> + <param name="snp_posteriors" value="snp_posteriors.txt" ftype="txt"/> + <param name="report" value="report.txt" ftype="txt"/> + <param name="confidences" value="confidences.txt" ftype="txt"/> + <param name="calls" value="calls.txt" ftype="txt"/> + <output name="output" value="output.vcf" ftype="vcf"/> + </test> + </tests> + <help> +This tool converts Affymetrix genotype calls and intensity files to VCF format. + +----- + +**Required options** + +**Other options** + </help> + <citations> + <citation type="bibtex"> + @misc{None, + journal = {None}, + author = {Genovese, Giulio}, + title = {None}, + year = {None}, + url = {https://github.com/freeseek/gtc2vcf},} + </citation> + </citations> +</tool>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/all_fasta.loc.sample Fri Oct 12 09:46:32 2018 -0400 @@ -0,0 +1,18 @@ +#This file lists the locations and dbkeys of all the fasta files +#under the "genome" directory (a directory that contains a directory +#for each build). The script extract_fasta.py will generate the file +#all_fasta.loc. This file has the format (white space characters are +#TAB characters): +# +#<unique_build_id> <dbkey> <display_name> <file_path> +# +#So, all_fasta.loc could look something like this: +# +#apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa +#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa +#hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa +# +#Your all_fasta.loc file should contain an entry for each individual +#fasta file. So there will be multiple fasta files for each build, +#such as with hg19 above. +#
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool_data_table_conf.xml.sample Fri Oct 12 09:46:32 2018 -0400 @@ -0,0 +1,7 @@ +<tables> + <!-- Locations of all fasta files under genome directory --> + <table name="all_fasta" comment_char="#" allow_duplicate_entries="False"> + <columns>value, dbkey, name, path</columns> + <file path="tool-data/all_fasta.loc" /> + </table> +</tables>