changeset 0:a1e53778a82b draft

Uploaded
author greg
date Fri, 12 Oct 2018 09:46:32 -0400
parents
children a2f0931898be
files .shed.yml affy2vcf.xml all_fasta.loc.sample tool_data_table_conf.xml.sample
diffstat 4 files changed, 152 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/.shed.yml	Fri Oct 12 09:46:32 2018 -0400
@@ -0,0 +1,11 @@
+name: affy2vcf
+owner: greg
+description: |
+  Contains a tool that converts Affymetrix genotype calls and intensity files to VCF format.
+homepage_url: https://github.com/freeseek/gtc2vcf
+long_description: |
+  Contains a tool that converts Affymetrix genotype calls and intensity files to VCF format.
+remote_repository_url: https://github.com/gregvonkuster/galaxy_tools/tree/master/tools/convert_formats/affy2vcf
+type: unrestricted
+categories:
+  - Convert Formats
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/affy2vcf.xml	Fri Oct 12 09:46:32 2018 -0400
@@ -0,0 +1,116 @@
+<tool id="affr2vcf" name="Convert Affymetrix" version="1.9">
+    <description>genotype calls and intensities to VCF</description>
+    <requirements>
+        <requirement type="package" version="1.9">bcftools-gtc2vcf-plugin</requirement>
+    </requirements>
+    <command detect_errors="exit_code"><![CDATA[
+#set text_outputs_dir = 'text_outputs'
+export BCFTOOLS_PLUGINS=\$(dirname `which bcftools`)/../libexec/bcftools &&
+mkdir $text_outputs_dir &&
+bcftools +\$BCFTOOLS_PLUGINS/affy2vcf.so
+#if str($reference_genome_source_cond.reference_genome_source) == "history":
+    --fasta-ref '$reference_genome_source_cond.history_item'
+#else:
+    --fasta-ref '$reference_genome_source_cond.locally_cached_item'
+#end if
+--annot '$annot'
+--snp-posteriors '$snp_posteriors'
+--summary '$summary'
+--report '$report'
+--calls '$calls'
+--confidences '$confidences'
+#if str($output_gender_estimate_cond.output_gender_estimate) == "yes"
+    --sex '$gender_estimate'
+#end if
+#if str($append_version) == "no":
+    --no-version
+#end if
+--output '$output'
+--output-type $output_type
+--threads \${GALAXY_SLOTS:-4}
+    ]]></command>
+    <inputs>
+        <conditional name="reference_genome_source_cond">
+            <param name="reference_genome_source" type="select" label="Will you select a reference reference genome from your history or use a locally cached genome index?">
+                <option value="history" selected="true">Use a reference genome from my history</option>
+                <option value="cached">Use a locally cached genome index</option>
+            </param>
+            <when value="history">
+                <param name="history_item" type="data" format="fasta" label="Select reference genome" />
+            </when>
+            <when value="cached">
+                <param name="locally_cached_item" type="select" format="fasta" label="Fasta reference sequence">
+                    <options from_data_table="all_fasta">
+                        <column name="name" index="1"/>
+                        <column name="value" index="2"/>
+                        <column name="path" index="2"/>
+                        <filter type="sort_by" column="1"/>
+                        <validator type="no_options" message="No cached Fasta genome references are available." />
+                    </options>
+                </param>
+            </when>
+        </conditional>
+        <param name="annot" type="data" format="csv" label="Probeset annotation file" />
+        <param name="summary" type="data" format="txt" label="Apt-probeset genotype summary file" />
+        <param name="snp_posteriors" type="data" format="txt" label="Apt-probeset genotype snp-posteriors file" />
+        <param name="report" type="data" format="txt" label="Apt-probeset genotype report file" />
+        <param name="confidences" type="data" format="txt" label="Apt-probeset genotype confidences file" />
+        <param name="calls" type="data" format="txt" label="Apt-probeset genotype calls file" />
+        <conditional name="output_gender_estimate_cond">
+            <param name="output_gender_estimate" type="select" force_select="true" label="Output apt-probeset-genotype gender estimate?">
+                <option value="no" selected="true">No</option>
+                <option value="yes">Yes</option>
+            </param>
+            <when value="no"/>
+            <when value="yes"/>
+        </conditional>
+        <param name="append_version" type="select" force_select="true" label="Append version and command line to the header?">
+            <option value="no" selected="true">No</option>
+            <option value="yes">Yes</option>
+        </param>
+        <param name="output_type" type="select" force_select="true" label="Select format for output?">
+            <option value="v" selected="true">Uncompressed VCF</option>
+            <option value="z">Compressed VCF</option>
+            <option value="u" selected="true">Uncompressed BCF</option>
+            <option value="b">Compressed BCF</option>
+        </param>
+    </inputs>
+    <outputs>
+        <data name="output" format="vcf" />
+        <data name="output_gender_estimate" format="txt" label="${tool.name} (gender estimate) on ${on_string}">
+            <filter>output_gender_estimate_cond['output_gender_estimate'] == "yes"</filter>
+        </data>
+    </outputs>
+    <tests>
+        <test>
+            <param name="reference_genome_source" value="history"/>
+            <param name="history_item" value="GCF_000222465.1_Adig_1.1_genomic.fna" ftype="fasta"/>
+            <param name="annot" value="annot.csv" ftype="csv"/>
+            <param name="summary" value="summary.txt" ftype="txt"/>
+            <param name="snp_posteriors" value="snp_posteriors.txt" ftype="txt"/>
+            <param name="report" value="report.txt" ftype="txt"/>
+            <param name="confidences" value="confidences.txt" ftype="txt"/>
+            <param name="calls" value="calls.txt" ftype="txt"/>
+            <output name="output" value="output.vcf" ftype="vcf"/>
+        </test>
+    </tests>
+    <help>
+This tool converts Affymetrix genotype calls and intensity files to VCF format.
+
+-----
+
+**Required options**
+
+**Other options**
+    </help>
+    <citations>
+        <citation type="bibtex">
+            @misc{None,
+            journal = {None},
+            author = {Genovese, Giulio},
+            title = {None},
+            year = {None},
+            url = {https://github.com/freeseek/gtc2vcf},}
+        </citation>
+    </citations>
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/all_fasta.loc.sample	Fri Oct 12 09:46:32 2018 -0400
@@ -0,0 +1,18 @@
+#This file lists the locations and dbkeys of all the fasta files
+#under the "genome" directory (a directory that contains a directory
+#for each build). The script extract_fasta.py will generate the file
+#all_fasta.loc. This file has the format (white space characters are
+#TAB characters):
+#
+#<unique_build_id>	<dbkey>	<display_name>	<file_path>
+#
+#So, all_fasta.loc could look something like this:
+#
+#apiMel3	apiMel3	Honeybee (Apis mellifera): apiMel3	/path/to/genome/apiMel3/apiMel3.fa
+#hg19canon	hg19	Human (Homo sapiens): hg19 Canonical	/path/to/genome/hg19/hg19canon.fa
+#hg19full	hg19	Human (Homo sapiens): hg19 Full	/path/to/genome/hg19/hg19full.fa
+#
+#Your all_fasta.loc file should contain an entry for each individual
+#fasta file. So there will be multiple fasta files for each build,
+#such as with hg19 above.
+#
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.sample	Fri Oct 12 09:46:32 2018 -0400
@@ -0,0 +1,7 @@
+<tables>
+    <!-- Locations of all fasta files under genome directory -->
+    <table name="all_fasta" comment_char="#" allow_duplicate_entries="False">
+        <columns>value, dbkey, name, path</columns>
+        <file path="tool-data/all_fasta.loc" />
+    </table>
+</tables>