Repository 'multigps'
hg clone https://toolshed.g2.bx.psu.edu/repos/greg/multigps

Changeset 0:62bdb6ff11d1 (2018-09-05)
Commit message:
Uploaded
added:
.shed.yml
README.rst
macros.xml
multigps.xml
test-data/cntrl_hg19.scidx
test-data/expt_hg19.scidx
test-data/hg19_all_events_table1.tabular
test-data/hg19_all_events_table2.tabular
test-data/hg19_experiment_events1.tabular
test-data/hg19_experiment_events2.tabular
test-data/hg19_output_bed1.bed
test-data/hg19_output_bed2.bed
test-data/hg19_output_html1.html
test-data/hg19_output_html2.html
test-data/hg19_replicates_counts1.tabular
test-data/hg19_replicates_counts2.tabular
tool-data/all_fasta.loc.sample
tool-data/tool_data_table_conf.xml.sample
b
diff -r 000000000000 -r 62bdb6ff11d1 .shed.yml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/.shed.yml Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,13 @@
+name: multigps
+owner: greg
+description: Analyzes collections of multi-condition ChIP-seq data.
+homepage_url: http://mahonylab.org/software/multigps/
+long_description: |
+  Contains a tool that runs MultiGPS, a framework for analyzing collections of multi-condition ChIP-seq
+  datasets and characterizing differential binding events between conditions.  MultiGPS encourages consistency
+  in the reported binding event locations across conditions and provides accurate estimation of ChIP enrichment
+  levels at each event.  MultiGPS loads all data to memory, so you will need a lot of available memory if you
+  are running analysis over many conditions or large datasets.
+type: unrestricted
+categories:
+- ChIP-seq
b
diff -r 000000000000 -r 62bdb6ff11d1 README.rst
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/README.rst Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,17 @@
+MultiGPS wrapper for Galaxy
+================================
+
+* http://mahonylab.org/software/multigps/
+
+MultiGPS performs significant EM optimization of binding events along the genome and across experimental
+conditions, and it integrates motif-finding via MEME.  The tool loads all data into memory, so the potential
+exists for time and memory intensive analyses if running over many conditions or large datasets.
+
+Setting the memory allocation in Galaxy for this tool is handled using the <env id="_JAVA_OPTIONS"> tag for
+a selected job runner in the job_conf.xml file.
+
+License
+-------
+
+MIT
+
b
diff -r 000000000000 -r 62bdb6ff11d1 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,27 @@
+<?xml version='1.0' encoding='UTF-8'?>
+<macros>
+    <xml name="motif_finding_params">
+        <param name="memenmotifs" type="integer" min="0" value="3" label="Number of motifs MEME should find for each condition" />
+        <param name="mememinw" type="integer" min="0" value="6" label="Minimum motif width for MEME" />
+        <param name="mememaxw" type="integer" min="0" value="16" label="Maximum motif width for MEME" />
+    </xml>
+    <xml name="param_experiment_type">
+        <param name="experiment_type" type="select" display="radio" label="Experiment type for this replicate">
+            <option value="chipseq" selected="True">ChIP-seq</option>
+            <option value="chipexo">ChIP-exo</option>
+        </param>
+    </xml>
+    <xml name="cond_fixedreadcount">
+        <conditional name="fixedreadcount_cond">
+            <param  name="fixedreadcount_select" type="select" label="Set fixed per-base read count limit for this replicate?" help="Selecting No uses a global per-base limit that is estimated from a Poisson distribution.">
+                <option value="no" selected="True">No</option>
+                <option value="yes">Yes</option>
+            </param>
+            <when value="no"/>
+            <when value="yes">
+                <param name="fixedreadcount" type="integer" value="0" min="0" label="Fixed per-base read count limit"/>
+            </when>
+        </conditional>
+    </xml>
+</macros>
+
b
diff -r 000000000000 -r 62bdb6ff11d1 multigps.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/multigps.xml Wed Sep 05 08:59:42 2018 -0400
[
b'@@ -0,0 +1,542 @@\n+<tool id="multigps" name="MultiGPS" version="0.74.0">\n+    <description>analyzes collections of multi-condition ChIP-seq data</description>\n+    <macros>\n+        <import>macros.xml</import>\n+    </macros>\n+    <requirements>\n+        <requirement type="package" version="0.74">multigps</requirement>\n+    </requirements>\n+    <command detect_errors="aggressive">\n+        <![CDATA[\n+            #set output_dir = $output_html.files_path\n+            mkdir -p $output_dir &&\n+            multigps\n+            ## General options\n+            --design \'$build_design_file\'\n+            ## Append .txt extensions to events hrefs\n+            ## in output dataset so files will render\n+            ## in the browser.\n+            --eventsaretxt\n+            ## Do not run the parallel version of meme.\n+            --meme1proc\n+            --threads \\${GALAXY_SLOTS:-4}\n+            --geninfo \'$chromInfo\'\n+            ## Advanced options\n+            #set aoc = $advanced_options_cond\n+            #if str($aoc.advanced_options) == \'display\':\n+                #set bmsc = $aoc.binding_model_smoothing_cond\n+                #set gmsc = $aoc.gauss_model_smoothing_cond\n+                #set rbec = $aoc.report_binding_events_cond\n+                #set rloc = $aoc.reads_limits_options_cond\n+                #set sdc = $aoc.scale_data_cond\n+                #set umc = $aoc.use_motif_cond\n+                #if str($umc.use_motif) == \'yes\':\n+                    #set rgc = $umc.reference_genome_cond\n+                    --seq\n+                    #if str($rgc.reference_genome_source) == \'cached\':\n+                        \'${rgc.reference_genome.fields.path}\'\n+                    #else:\n+                        \'${rgc.reference_genome}\'\n+                    #end if\n+                #end if\n+                ## Limits on how many reads\n+                #if str($rloc.reads_limits) == \'yes\':\n+                    --fixedpb $rloc.fixedpb\n+                    --poissongausspb $rloc.poissongausspb\n+                    #if str($rloc.nonunique) == \'yes\':\n+                        --nonunique\n+                    #end if\n+                    --mappability $rloc.mappability\n+                    #if str($rloc.nocache) == \'yes\':\n+                        --nocache\n+                    #end if\n+                #end if\n+                ## Scaling data\n+                #if str($sdc.scale_data) == \'yes\':\n+                    #if str($sdc.scaling) == \'no\':\n+                        --noscaling $sdc.scaling\n+                    #end if\n+                    #if str($sdc.medianscale) == \'yes\':\n+                        --medianscale $sdc.medianscale\n+                    #end if\n+                    #if str($sdc.regressionscale) == \'yes\':\n+                        --regressionscale $sdc.regressionscale\n+                    #end if\n+                    #if str($sdc.sesscale) == \'yes\':\n+                        --sesscale $sdc.sesscale\n+                    #end if\n+                    #if $sdc.fixedscaling > 0:\n+                        \xe2\x80\x92\xe2\x80\x92fixedscaling $sdc.fixedscaling\n+                    #end if\n+                    --scalewin $sdc.scalewin\n+                    #if str($sdc.plotscaling) == \'yes\':\n+                        --plotscaling $sdc.plotscaling\n+                    #end if\n+                #end if\n+                ## Running MultiGPS\n+                #if str($aoc.readdistributionfile) != \'None\':\n+                    --readdistributionfile \'$aoc.readdistributionfile\'\n+                #end if\n+                --maxtrainingrounds $aoc.maxtrainingrounds\n+                #if str($aoc.nomodelupdate) == \'no\':\n+                    --nomodelupdate\n+                #end if\n+                --minmodelupdateevents $aoc.minmodelupdateevents\n+                #if str($bmsc.nomodelsmoothing) == \'no\':\n+                    --nomodelsmoothing\n+                #else:\n+                    --splinesmoothparam $bmsc.splinesmoothparam\n+                #end if\n+                #if s'..b'nding model updates?\n+ - **Minimum number of events to support an update of the read distribution** - Minimum number of events to support an update of the read distribution\n+ - **Perform binding model smoothing?** - Smooth with a cubic spline using a specified smoothing factor.\n+ - **Spline smoothing parameter** - Smoothing parameter for smoothing cubic spline.\n+ - **Perform Gaussian model smoothing?** - Select "Yes" to use Gaussian model smoothing using a specified smoothing factor if binding model smoothing is not performed.\n+ - **Allow joint events in model updates?** - Specify whether to allow joint events in model updates.\n+ - **Keep binding model range fixed to inital size?** - Flag to keep binding model range fixed to inital size (default: vary automatically)\n+ - **Poisson log threshold for potential region scanning** - Poisson log threshold for potential region scanning.\n+ - **Alpha scaling factor** - Alpha scaling factor. Increasing this parameter results in stricter binding event calls. \n+ - **Impose this alpha** - The alpha parameter is a sparse prior on binding events in the MultiGPS model. It can be interpreted as a minimum number of reads that each binding event must be responsible for in the model. Default: estimate alpha automatically.\n+ - **Share component configs in the ML step?** - Flag to not share component configs in the ML step\n+ - **Optional file containing a set of regions to ignore during MultiGPS training** - File containing a set of regions to ignore during MultiGPS training. It\xe2\x80\x99s a good idea to exclude the mitochondrial genome and other \xe2\x80\x98blacklisted\xe2\x80\x99 regions that contain artifactual accumulations of reads in both ChIP-seq and control experiments. MultiGPS will waste time trying to model binding events in these regions, even though they will not typically appear significantly enriched over the control (and thus will not be reported to the user).\n+\n+* **MultiGPS priors:**\n+\n+ - **Perform inter-experiment positional prior?** - Flag to turn off inter-experiment positional prior (default=on).\n+ - **Probability that events are shared across conditions** - Probability that events are shared across conditions.\n+ - **Perform both motif-finding and motif priors?** - Flag to turn off motif-finding and motif priors.\n+ - **Perform motif-finding only?** - Flag to turn off motif priors only.\n+ - **Number of motifs MEME should find for each condition** - Number of motifs MEME should find for each condition.\n+ - **Minimum motif width for MEME** - minw arg for MEME.\n+ - **Maximum motif width for MEME** - maxw arg for MEME.\n+\n+* **Reporting binding events:**\n+\n+ - **Minimum Q-value (corrected p-value) of reported binding events** - Minimum Q-value (corrected p-value) of reported binding events.\n+ - **Minimum event fold-change vs scaled control** - Minimum event fold-change vs scaled control.\n+ - **Run differential enrichment tests?** - Choose whether to run differential enrichment tests.\n+ - **EdgeR over-dispersion parameter value** - EdgeR over-dispersion parameter value.\n+ - **Minimum p-value for reporting differential enrichment** - Minimum p-value for reporting differential enrichment.\n+\n+    </help>\n+    <citations>\n+        <citation type="bibtex">\n+            @article{Mahony2014,\n+            journal = {PLOS Computational Biology},\n+            author = {1. Mahony S, Edwards MD, Mazzoni EO, Sherwood RI, Kakumanu A, Morrison CA, Wichterle H, Gifford DK},\n+            title = {An Integrated Model of Multiple-Condition ChIP-Seq Data Reveals Predeterminants of Cdx2 Binding},\n+            year = {2014},}\n+            volume = {10},\n+            number = {3},\n+            pages = {e1003501},}\n+        </citation>\n+        <citation type="bibtex">\n+            @article{Liang2012,\n+            journal = {BMC Bioinformatics},\n+            author = {2. Liang, Ketes},\n+            title = {Normalization of ChIP-seq data with control},\n+            year = {2012},}\n+        </citation>\n+    </citations>\n+</tool>\n+\n'
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/cntrl_hg19.scidx
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/cntrl_hg19.scidx Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,20 @@
+#2016-11-04 08:39:36.449;localbam.bam;READ1
+chrom index forward reverse value
+chr1 13038 1 0 1
+chr1 16604 0 1 1
+chr1 19215 1 0 1
+chr1 20151 0 1 1
+chr1 48908 1 0 1
+chr1 49489 1 0 1
+chr1 55105 1 0 1
+chr1 57499 0 1 1
+chr1 66636 1 0 1
+chr1 67393 0 1 1
+chr1 72875 0 1 1
+chr1 73954 0 1 1
+chr1 82146 1 0 1
+chr1 85089 0 1 1
+chr1 101405 1 0 1
+chr1 106851 0 1 1
+chr1 108358 0 1 1
+chr1 113877 0 1 1
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/expt_hg19.scidx
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expt_hg19.scidx Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,101 @@
+#2016-11-04 08:39:36.449;localbam.bam;READ1
+chrom index forward reverse value
+chr1 13038 1 0 1
+chr1 16604 0 1 1
+chr1 19215 1 0 1
+chr1 20151 0 1 1
+chr1 48908 1 0 1
+chr1 49489 1 0 1
+chr1 55105 1 0 1
+chr1 57499 0 1 1
+chr1 66636 1 0 1
+chr1 67393 0 1 1
+chr1 72875 0 1 1
+chr1 73954 0 1 1
+chr1 82146 1 0 1
+chr1 85089 0 1 1
+chr1 101405 1 0 1
+chr1 106851 0 1 1
+chr1 108358 0 1 1
+chr1 113877 0 1 1
+chr1 122833 1 0 1
+chr1 123101 0 1 1
+chr1 124863 1 0 1
+chr1 125216 0 1 1
+chr1 139373 0 1 1
+chr1 150551 1 0 1
+chr1 158113 1 0 1
+chr1 160681 1 0 1
+chr1 167381 1 0 1
+chr1 173325 0 1 1
+chr1 234394 1 0 1
+chr1 234434 0 1 1
+chr1 235111 1 0 1
+chr1 236086 0 1 1
+chr1 236159 1 0 1
+chr1 237302 0 1 1
+chr1 237648 1 0 1
+chr1 237735 1 0 1
+chr1 238867 0 1 1
+chr1 240339 1 0 1
+chr1 250472 1 0 1
+chr1 250560 0 1 1
+chr1 252828 1 0 1
+chr1 255896 1 0 1
+chr1 258157 1 0 1
+chr1 354230 0 1 1
+chr1 521482 0 1 1
+chr1 523810 0 1 1
+chr1 526070 0 1 1
+chr1 526303 1 0 1
+chr1 526406 1 0 1
+chr1 527103 0 1 1
+chr1 527586 1 0 1
+chr1 527590 1 0 1
+chr1 527599 1 0 1
+chr1 530330 1 0 1
+chr1 532712 0 1 1
+chr1 534863 0 1 1
+chr1 535107 1 0 1
+chr1 535662 1 0 1
+chr1 535998 1 0 1
+chr1 537647 0 1 1
+chr1 539496 1 0 1
+chr1 540024 0 1 1
+chr1 540628 1 0 1
+chr1 542424 1 0 1
+chr1 544024 0 1 1
+chr1 546672 1 0 1
+chr1 549581 0 1 1
+chr1 562709 1 0 1
+chr1 563545 0 1 1
+chr1 566222 0 1 1
+chr1 566375 0 1 1
+chr1 566736 1 0 1
+chr1 566863 1 0 1
+chr1 566974 1 0 1
+chr1 568430 0 1 1
+chr1 568570 1 0 1
+chr1 569236 0 1 1
+chr1 569310 0 1 1
+chr1 569499 1 0 1
+chr1 569640 1 0 1
+chr1 569752 1 0 1
+chr1 569823 1 0 1
+chr1 569890 1 0 1
+chr1 569902 1 0 1
+chr1 569912 1 0 1
+chr1 569914 1 0 1
+chr1 569917 1 0 1
+chr1 569931 0 1 1
+chr1 569942 0 1 1
+chr1 569954 0 1 1
+chr1 569960 0 1 1
+chr1 569961 0 1 1
+chr1 569963 0 1 1
+chr1 570032 0 1 1
+chr1 570109 1 0 1
+chr1 570164 0 1 1
+chr1 570169 1 0 1
+chr1 570177 0 1 1
+chr1 570226 0 1 1
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/hg19_all_events_table1.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/hg19_all_events_table1.tabular Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,31 @@
+### MultiGPS output
+#Condition Name Index TotalSigCount SignalFraction
+#Condition cond 0 99.0 0.555
+#Replicate ParentCond Name Index SigCount CtrlCount SigCtrlScaling SignalFraction
+#Replicate cond cond:1 0 99.0 0 1 0.56
+#
+#Point cond_Sig cond_Ctrl cond_log2Fold cond_log2P ActiveConds
+chr1:569927 14.3 0.0 3.838 -6.470 1
+chr1:536042 1.0 0.0 0.014 -1.474 1
+chr1:535151 1.0 0.0 0.014 -1.413 1
+chr1:534819 1.0 0.0 0.014 -1.348 1
+chr1:539540 1.0 0.0 0.024 -1.281 1
+chr1:539980 1.0 0.0 0.024 -1.211 1
+chr1:125172 1.0 0.0 0.033 -1.137 1
+chr1:49533 1.0 0.0 0.036 -1.059 1
+chr1:67349 1.0 0.0 0.041 -0.976 1
+chr1:563501 1.0 0.0 0.043 -0.889 1
+chr1:20107 1.0 0.0 0.046 -0.796 1
+chr1:568610 1.8 0.0 0.853 -0.696 1
+chr1:237754 2.0 0.0 1.015 -0.626 1
+chr1:236192 2.0 0.0 0.973 -0.589 1
+chr1:569214 2.0 0.0 0.989 -0.474 1
+chr1:569652 2.0 0.0 1.016 -0.433 1
+chr1:566215 2.0 0.0 0.991 -0.348 1
+chr1:234414 2.0 0.0 1.020 -0.211 1
+chr1:122967 2.0 0.0 0.996 -0.211 1
+chr1:570152 4.6 0.0 2.207 -0.100 1
+chr1:250516 2.0 0.0 0.998 -0.059 1
+chr1:527636 3.0 0.0 1.608 0.000 1
+chr1:566984 2.9 0.0 1.560 0.000 1
+chr1:526421 2.0 0.0 1.021 0.000 1
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/hg19_all_events_table2.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/hg19_all_events_table2.tabular Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,31 @@
+### MultiGPS output
+#Condition Name Index TotalSigCount SignalFraction
+#Condition cond 0 99.0 0.555
+#Replicate ParentCond Name Index SigCount CtrlCount SigCtrlScaling SignalFraction
+#Replicate cond cond:1 0 99.0 18.0 4.00 0.555
+#
+#Point cond_Sig cond_Ctrl cond_log2Fold cond_log2P ActiveConds
+chr1:569927 14.3 0.0 3.838 -6.470 1
+chr1:536042 1.0 0.0 0.014 -1.281 1
+chr1:535151 1.0 0.0 0.014 -1.211 1
+chr1:534819 1.0 0.0 0.014 -1.137 1
+chr1:539540 1.0 0.0 0.024 -1.059 1
+chr1:539980 1.0 0.0 0.024 -0.976 1
+chr1:125172 1.0 0.0 0.033 -0.889 1
+chr1:563501 1.0 0.0 0.043 -0.796 1
+chr1:568610 1.8 0.0 0.853 -0.696 1
+chr1:237754 2.0 0.0 1.015 -0.626 1
+chr1:236192 2.0 0.0 0.973 -0.589 1
+chr1:569214 2.0 0.0 0.989 -0.474 1
+chr1:569652 2.0 0.0 1.016 -0.433 1
+chr1:566215 2.0 0.0 0.991 -0.348 1
+chr1:234414 2.0 0.0 1.020 -0.211 1
+chr1:122967 2.0 0.0 0.996 -0.211 1
+chr1:570152 4.6 0.0 2.207 -0.100 1
+chr1:250516 2.0 0.0 0.998 -0.059 1
+chr1:49533 1.0 1.0 -2.000 -0.006 1
+chr1:527636 3.0 0.0 1.608 0.000 1
+chr1:566984 2.9 0.0 1.560 0.000 1
+chr1:526421 2.0 0.0 1.021 0.000 1
+chr1:20107 1.0 1.0 -2.000 0.000 1
+chr1:67349 1.0 1.0 -2.000 0.000 1
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/hg19_experiment_events1.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/hg19_experiment_events1.tabular Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,7 @@
+### MultiGPS output
+#Condition Name Index TotalSigCount SignalFraction
+#Condition experiment 0 99.0 0.555
+#Replicate ParentCond Name Index SigCount CtrlCount CtrlScaling SignalFraction
+#Replicate experiment experiment:rep1 0 99.0 0 1 0.555
+#
+#Point experiment_Sig experiment_Ctrl experiment_log2Fold experiment_log2P Sequence MotifScore
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/hg19_experiment_events2.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/hg19_experiment_events2.tabular Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,7 @@
+### MultiGPS output
+#Condition Name Index TotalSigCount SignalFraction
+#Condition experiment 0 99.0 0.555
+#Replicate ParentCond Name Index SigCount CtrlCount CtrlScaling SignalFraction
+#Replicate experiment experiment:rep1 0 99.0 18.0 4.000 0.555
+#
+#Point experiment_Sig experiment_Ctrl experiment_log2Fold experiment_log2P Sequence MotifScore
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/hg19_output_bed1.bed
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/hg19_output_bed1.bed Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,1 @@
+track name=multiGPS-cond description=multiGPS events cond
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/hg19_output_bed2.bed
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/hg19_output_bed2.bed Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,1 @@
+track name=multiGPS-cond description=multiGPS events cond
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/hg19_output_html1.html
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/hg19_output_html1.html Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,33 @@
+<html>
+ <body>
+ <h1>MultiGPS results (dataset_3_files)</h1>
+ <h2>Binding events</h2>
+ <table>
+ <tr> <th>Condition</th>
+ <th>Events</th>
+ <th>File</th>
+ </tr>
+ <tr> <td>cond</td>
+ <td>0</td>
+ <td><a href='dataset_3_files_cond.events.txt'>dataset_3_files_cond.events.txt</a></td>
+ </tr>
+ </table>
+ <h2>Input data</h2>
+ <table>
+ <tr> <th>Replicate</th>
+ <th>ReadCount</th>
+ <th>CtrlScaling</th>
+ <th>SignalFraction</th>
+ <th>ReadDistributionModel</th>
+ </tr>
+ <tr> <td>cond 1</td>
+ <td>99.0</td>
+ <td>NA</td>
+ <td>0.555</td>
+ <td><a href='#' onclick='return fullpopitup("images/dataset_3_files_cond-1_Read_Distributions.png")'><img src='images/dataset_3_files_cond-1_Read_Distributions.png' height='300'></a></td>
+ </tr>
+ </table>
+ <h2>Miscellaneous files</h2>
+ <p><a href='intermediate-results/dataset_3_files.intraCondPeakDistances.histo.txt'>Peak-peak distance histograms (same condition)</a></p>
+ </body>
+</html>
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/hg19_output_html2.html
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/hg19_output_html2.html Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,34 @@
+<html>
+ <head><title>MultiGPS results (dataset_9_files)</title></head>
+ <body>
+ <h1>MultiGPS results (dataset_9_files)</h1>
+ <h2>Binding events</h2>
+ <table>
+ <tr> <th>Condition</th>
+ <th>Events</th>
+ <th>File</th>
+ </tr>
+ <tr> <td>cond</td>
+ <td>0</td>
+ <td><a href='dataset_9_files_cond.events.txt'>dataset_9_files_cond.events.txt</a></td>
+ </tr>
+ </table>
+ <h2>Input data</h2>
+ <table>
+ <tr> <th>Replicate</th>
+ <th>ReadCount</th>
+ <th>CtrlScaling</th>
+ <th>SignalFraction</th>
+ <th>ReadDistributionModel</th>
+ </tr>
+ <tr> <td>cond 1</td>
+ <td>99.0</td>
+ <td>4.000</td>
+ <td>0.555</td>
+ <td><a href='#' onclick='return fullpopitup("images/dataset_9_files_cond-1_Read_Distributions.png")'><img src='images/dataset_9_files_cond-1_Read_Distributions.png' height='300'></a></td>
+ </tr>
+ </table>
+ <h2>Miscellaneous files</h2>
+ <p><a href='intermediate-results/dataset_9_files.intraCondPeakDistances.histo.txt'>Peak-peak distance histograms (same condition)</a></p>
+ </body>
+</html>
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/hg19_replicates_counts1.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/hg19_replicates_counts1.tabular Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,25 @@
+Point cond:1
+chr1:569927 14
+chr1:536042 1
+chr1:535151 1
+chr1:534819 1
+chr1:539540 1
+chr1:539980 1
+chr1:125172 1
+chr1:49533 1
+chr1:67349 1
+chr1:563501 1
+chr1:20107 1
+chr1:568610 2
+chr1:237754 2
+chr1:236192 2
+chr1:569214 2
+chr1:569652 2
+chr1:566215 2
+chr1:234414 2
+chr1:122967 2
+chr1:570152 5
+chr1:250516 2
+chr1:527636 3
+chr1:566984 3
+chr1:526421 2
b
diff -r 000000000000 -r 62bdb6ff11d1 test-data/hg19_replicates_counts2.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/hg19_replicates_counts2.tabular Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,25 @@
+Point cond:1
+chr1:569927 14
+chr1:536042 1
+chr1:535151 1
+chr1:534819 1
+chr1:539540 1
+chr1:539980 1
+chr1:125172 1
+chr1:563501 1
+chr1:568610 2
+chr1:237754 2
+chr1:236192 2
+chr1:569214 2
+chr1:569652 2
+chr1:566215 2
+chr1:234414 2
+chr1:122967 2
+chr1:570152 5
+chr1:250516 2
+chr1:49533 1
+chr1:527636 3
+chr1:566984 3
+chr1:526421 2
+chr1:20107 1
+chr1:67349 1
b
diff -r 000000000000 -r 62bdb6ff11d1 tool-data/all_fasta.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/all_fasta.loc.sample Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,18 @@
+#This file lists the locations and dbkeys of all the fasta files
+#under the "genome" directory (a directory that contains a directory
+#for each build). The script extract_fasta.py will generate the file
+#all_fasta.loc. This file has the format (white space characters are
+#TAB characters):
+#
+#<unique_build_id>  <dbkey> <display_name>  <file_path>
+#
+#So, all_fasta.loc could look something like this:
+#
+#apiMel3    apiMel3 Honeybee (Apis mellifera): apiMel3  /path/to/genome/apiMel3/apiMel3.fa
+#hg19canon  hg19    Human (Homo sapiens): hg19 Canonical    /path/to/genome/hg19/hg19canon.fa
+#hg19full   hg19    Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa
+#
+#Your all_fasta.loc file should contain an entry for each individual
+#fasta file. So there will be multiple fasta files for each build,
+#such as with hg19 above.
+#
b
diff -r 000000000000 -r 62bdb6ff11d1 tool-data/tool_data_table_conf.xml.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/tool_data_table_conf.xml.sample Wed Sep 05 08:59:42 2018 -0400
b
@@ -0,0 +1,7 @@
+<tables>
+    <!-- Locations of all fasta files under genome directory -->
+    <table name="all_fasta" comment_char="#">
+        <columns>value, dbkey, name, path</columns>
+        <file path="tool-data/all_fasta.loc" />
+    </table>
+</tables>