Repository 'bedtools'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/bedtools

Changeset 15:b73962f8fcbf (2017-07-05)
Previous changeset 14:304a594a7ef6 (2017-05-14) Next changeset 16:e0cec48a4695 (2017-08-18)
Commit message:
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bedtools commit c5007eff737fcabb28fa726ac40f13a1cd4893c1
modified:
closestBed.xml
tool_data_table_conf.xml.sample
added:
tool-data/all_fasta.loc.sample
tool-data/all_gff.loc.sample
removed:
all_fasta.loc.sample
b
diff -r 304a594a7ef6 -r b73962f8fcbf all_fasta.loc.sample
--- a/all_fasta.loc.sample Sun May 14 14:07:52 2017 -0400
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,18 +0,0 @@
-#This file lists the locations and dbkeys of all the fasta files
-#under the "genome" directory (a directory that contains a directory
-#for each build). The script extract_fasta.py will generate the file
-#all_fasta.loc. This file has the format (white space characters are
-#TAB characters):
-#
-#<unique_build_id> <dbkey> <display_name> <file_path>
-#
-#So, all_fasta.loc could look something like this:
-#
-#apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa
-#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa
-#hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa
-#
-#Your all_fasta.loc file should contain an entry for each individual
-#fasta file. So there will be multiple fasta files for each build,
-#such as with hg19 above.
-#
b
diff -r 304a594a7ef6 -r b73962f8fcbf closestBed.xml
--- a/closestBed.xml Sun May 14 14:07:52 2017 -0400
+++ b/closestBed.xml Wed Jul 05 17:12:00 2017 -0400
[
b'@@ -5,52 +5,70 @@\n     </macros>\n     <expand macro="requirements" />\n     <expand macro="stdio" />\n-    <command>\n-<![CDATA[\n-        #set inputBs = "\' \'".join([str( $file ) for $file in $inputB])\n-\n-        closestBed\n-        $strand\n-        $addition\n-        #if $addition2.addition2_select:\n-            -D $addition2.addition2_select\n-            $addition2.iu\n-            $addition2.id\n-        #end if\n-        $io\n-        -mdb $mdb\n-        -t $ties\n-        #if $k:\n-            -k $k\n-        #end if\n-        -a \'$inputA\'\n-        -b \'$inputBs\'\n-        > \'$output\'\n-]]>\n-    </command>\n+    <command><![CDATA[\n+closestBed\n+$strand\n+$addition\n+#if $addition2.addition2_select:\n+    -D $addition2.addition2_select\n+    $addition2.iu\n+    $addition2.id\n+#end if\n+$io\n+-mdb $mdb\n+-t $ties\n+#if str($k):\n+    -k $k\n+#end if\n+-a \'$inputA\'\n+#if str($overlap_with.source) == "data_table":\n+    -b \'$overlap_with.table.fields.path\'\n+#else\n+    #set inputBs = "\' \'".join([str( $file ) for $file in $overlap_with.inputB])\n+    -b \'$inputBs\'\n+#end if\n+> \'$output\'\n+    ]]></command>\n     <inputs>\n-        <param format="bed,vcf,gff,gff3" name="inputA" type="data" label="BED/VCF/GFF file"/>\n-        <param format="bed,gff,vcf,gff3" name="inputB" type="data" multiple="True" label="overlap intervals in this BED/VCF/GFF file?"/>\n+        <param name="inputA" type="data" format="bed,vcf,gff,gff3" label="BED/VCF/GFF file"/>\n+        <!-- overlap with file (inputB) -->\n+        <conditional name="overlap_with">\n+            <param name="source" type="select" label="Overlap with: will you select a BED/VCF/GFF file from your history or use a built-in GFF file?" 
help="Built-in GFF files contain full annotation of a reference genome">\n+                <option value="history" selected="true">Use a BED/VCF/GFF file from the history</option>\n+                <option value="data_table">Use a built-in GFF file</option>\n+            </param>\n+            <when value="data_table">\n+                <param name="table" type="select" label="Select reference GFF" help="If your genome of interest is not listed, contact the Galaxy team">\n+                    <options from_data_table="all_gff">\n+                        <filter type="sort_by" column="2"/>\n+                        <validator type="no_options" message="No files are available"/>\n+                    </options>\n+                </param>\n+            </when>\n+            <when value="history">\n+                <param name="inputB" type="data" format="bed,gff,vcf,gff3" multiple="true" label="Select a BED/VCF/GFF file" />\n+            </when>\n+        </conditional>\n \n         <param name="ties" type="select"\n             label="How ties for closest feature should be handled"\n             help="This occurs when two features in B have exactly the same overlap with a feature in A.">\n-            <option value="all" selected="True">all - Report all ties (default)</option>\n+            <option value="all" selected="true">all - Report all ties (default)</option>\n             <option value="first">first - Report the first tie that occurred in the B file</option>\n             <option value="last">last - Report the last tie that occurred in the B file</option>\n         </param>\n \n         <expand macro="strand2" />\n \n-        <param name="addition" type="boolean" checked="false" truevalue="-d" falsevalue=""\n+        <param name="addition" argument="-d" type="boolean" truevalue="-d" falsevalue="" checked="false"\n             label="In addition to the closest feature in B, report its distance to A as an extra column"\n-            help="The reported distance 
for overlapping features will be 0. (-d)" />\n+            help="The reported distance for overlapping features will be 0" />\n \n         <conditional name="addition2">\n-            <param name="addition2_select" type="select"\n+            <param name="addition2_select" argument="-D" type="select"\n                 label="Add additional columns to report distance'..b'atabases are resolved"\n-            help="(-mdb)">\n-            <option value="each" selected="True">Report closest records for each database. (-each)</option>\n+        <param argument="-mdb" type="select"\n+            label="How multiple databases are resolved">\n+            <option value="each" selected="true">Report closest records for each database. (-each)</option>\n             <option value="all">Report closest records among all databases. (-all)</option>\n         </param>\n     </inputs>\n     <outputs>\n         <!-- Would like to use a nicer name, but since there are possibly many inputB datasets, falling back to ${on_string} -->\n         <!-- <data format_source="inputA" name="output" metadata_source="inputA" label="Closest regions from ${inputB[0].name} to ${inputA.name}"/> -->\n-        <data format_source="inputA" name="output" metadata_source="inputA" label="Closest regions from ${on_string}"/>\n+        <data name="output" format_source="inputA" metadata_source="inputA" label="Closest regions from ${on_string}" />\n     </outputs>\n     <tests>\n         <test>\n             <param name="inputA" value="closestBedA.bed" ftype="bed" />\n+            <param name="source" value="history" />\n             <param name="inputB" value="closestBedB.bed" ftype="bed" />\n             <output name="output" file="closestBed_result1.bed" ftype="bed" />\n         </test>\n         <test>\n             <param name="inputA" value="closestBed_a.bed" ftype="bed" />\n+            <param name="source" value="history" />\n             <param name="inputB" value="closestBed_b1.bed,closestBed_b2.bed" 
ftype="bed" />\n-            <param name="addition" value="True" />\n+            <param name="addition" value="true" />\n             <output name="output" file="closestBed_result2.bed" ftype="bed" />\n         </test>\n         <test>\n             <param name="inputA" value="closestBed_a.bed" ftype="bed" />\n+            <param name="source" value="history" />\n             <param name="inputB" value="closestBed_b1.bed,closestBed_b2.bed" ftype="bed" />\n             <param name="addition" value="True" />\n             <param name="mdb" value="all" />\n@@ -107,34 +127,34 @@\n         </test>\n         <test>\n             <param name="inputA" value="closestBed_c.bed" ftype="bed" />\n+            <param name="source" value="history" />\n             <param name="inputB" value="closestBed_d.bed" ftype="bed" />\n             <param name="addition2_select" value="ref" />\n             <output name="output" file="closestBed_result4.bed" ftype="bed" />\n         </test>\n         <test>\n             <param name="inputA" value="closestBed_c.bed" ftype="bed" />\n+            <param name="source" value="history" />\n             <param name="inputB" value="closestBed_d.bed" ftype="bed" />\n             <param name="addition2_select" value="a" />\n             <output name="output" file="closestBed_result5.bed" ftype="bed" />\n         </test>\n         <test>\n             <param name="inputA" value="closestBedA.bed" ftype="bed" />\n+            <param name="source" value="history" />\n             <param name="inputB" value="a.bed" ftype="bed" />\n             <param name="k" value="3" />\n             <output name="output" file="closestBed_result6.bed" ftype="bed" />\n         </test>\n     </tests>\n-    <help>\n-<![CDATA[\n+    <help><![CDATA[\n **What it does**\n \n Similar to intersectBed, closestBed searches for overlapping features in A and B. 
In the event that no feature in B overlaps the current feature in A, closestBed will report the closest (that is, least genomic distance from the start or end of A) feature in B. For example, one might want to find which is the closest gene to a significant GWAS polymorphism. Note that closestBed will report an overlapping feature as the closest—that is, it does not restrict to closest non-overlapping feature.\n \n .. image:: $PATH_TO_IMAGES/closest-glyph.png\n \n-\n @REFERENCES@\n-]]>\n-    </help>\n+    ]]></help>\n     <expand macro="citations" />\n </tool>\n'
b
diff -r 304a594a7ef6 -r b73962f8fcbf tool-data/all_fasta.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/all_fasta.loc.sample Wed Jul 05 17:12:00 2017 -0400
b
@@ -0,0 +1,18 @@
+#This file lists the locations and dbkeys of all the fasta files
+#under the "genome" directory (a directory that contains a directory
+#for each build). The script extract_fasta.py will generate the file
+#all_fasta.loc. This file has the format (white space characters are
+#TAB characters):
+#
+#<unique_build_id> <dbkey> <display_name> <file_path>
+#
+#So, all_fasta.loc could look something like this:
+#
+#apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa
+#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa
+#hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa
+#
+#Your all_fasta.loc file should contain an entry for each individual
+#fasta file. So there will be multiple fasta files for each build,
+#such as with hg19 above.
+#
b
diff -r 304a594a7ef6 -r b73962f8fcbf tool-data/all_gff.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/all_gff.loc.sample Wed Jul 05 17:12:00 2017 -0400
b
@@ -0,0 +1,14 @@
+#This file lists the locations and dbkeys of all the GFF files
+#This file has the format (white space characters are
+#TAB characters):
+#
+#<unique_build_id> <dbkey> <display_name> <file_path>
+#
+#So, all_gff.loc could look something like this:
+#
+#apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/annotation/apiMel3/apiMel3.gff
+#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/annotation/hg19/hg19canon.gff
+#hg19full hg19 Human (Homo sapiens): hg19 Representative transcripts /path/to/annotation/hg19/hg19_representative_tx.gff
+#
+#Your all_gff.loc file should contain an entry for each different annotation.
+#So there can be multiple gff files for each build, such as with hg19 above.
b
diff -r 304a594a7ef6 -r b73962f8fcbf tool_data_table_conf.xml.sample
--- a/tool_data_table_conf.xml.sample Sun May 14 14:07:52 2017 -0400
+++ b/tool_data_table_conf.xml.sample Wed Jul 05 17:12:00 2017 -0400
b
@@ -4,4 +4,9 @@
         <columns>value, dbkey, name, path</columns>
         <file path="tool-data/all_fasta.loc" />
     </table>
+    <!-- Locations of all gff files with annotations of genome builds -->
+    <table name="all_gff" comment_char="#">
+        <columns>value, dbkey, name, path</columns>
+        <file path="tool-data/all_gff.loc" />
+    </table>
 </tables>