Repository 'rename_tracks'
hg clone https://toolshed.g2.bx.psu.edu/repos/yating-l/rename_tracks

Changeset 0:8b19a698d90e (2018-06-25)
Next changeset 1:72ccb2f848a0 (2018-07-26)
Commit message:
planemo upload commit b615ca3bfed9f2115f62d1af30d4726fe8ba08d8
added:
rename_tracks.iml
rename_tracks.py
rename_tracks.xml
test-data/Augustus.gff3
test-data/HISAT.bam
test-data/StringTie_assembled_transcripts.gtf
test-data/TrfBig.bed
test-data/name_mapping.csv
test-data/rename_Augustus.gff3
test-data/rename_HISAT.bam
test-data/rename_StringTie.gtf
test-data/rename_TrfBig.bed
test-data/rename_sequence_cov.bigwig
test-data/renamed_reference.fasta
test-data/sequence_cov.bigwig
tool_dependencies.xml
b
diff -r 000000000000 -r 8b19a698d90e rename_tracks.iml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rename_tracks.iml Mon Jun 25 15:01:41 2018 -0400
b
@@ -0,0 +1,9 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<module type="PYTHON_MODULE" version="4">
+  <component name="NewModuleRootManager" inherit-compiler-output="true">
+    <exclude-output />
+    <content url="file://$MODULE_DIR$" />
+    <orderEntry type="inheritedJdk" />
+    <orderEntry type="sourceFolder" forTests="false" />
+  </component>
+</module>
\ No newline at end of file
b
diff -r 000000000000 -r 8b19a698d90e rename_tracks.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rename_tracks.py Mon Jun 25 15:01:41 2018 -0400
[
@@ -0,0 +1,69 @@
+# -*- coding: utf8 -*-
+
+"""
+Rename the custom evidence tracks so that the tracks use the same sequence names as the renamed reference 
+"""
+import sys
+import csv
+import subprocess
+import tempfile
+
+def rename_interval(inputFile, nameDict, renamedFile):
+    """
+    Copy a whitespace-delimited interval file (BED, GFF3, GTF, bedGraph),
+    renaming the sequence named in the first column of each record.
+
+    inputFile   -- path of the track file to read
+    nameDict    -- dict mapping original sequence names to renamed ones
+    renamedFile -- path of the renamed track file to write
+
+    Lines starting with "#" and blank lines are copied unchanged. When the
+    first field of a record is a key of nameDict, every occurrence of that
+    name on the line is replaced, so identifiers derived from the sequence
+    name (e.g. "ID=contig1.g1") are renamed together with the first column.
+    """
+    # Both handles are managed by the with-statement so the output is
+    # flushed and closed even if reading or writing raises.
+    with open(inputFile, 'r') as reader, open(renamedFile, 'w') as writer:
+        # Stream line by line instead of loading the whole track in memory.
+        for line in reader:
+            if not line.startswith("#"):
+                fields = line.split(None, 1)
+                # A blank or whitespace-only line has no first field.
+                if fields and fields[0] in nameDict:
+                    line = line.replace(fields[0], nameDict[fields[0]])
+            writer.write(line)
+
+def _rename_sam_header(headerText, nameDict):
+    """Return headerText with the SN: field of every @SQ line renamed via nameDict."""
+    renamed = []
+    for line in headerText.splitlines():
+        fields = line.split('\t')
+        if fields[0] == '@SQ':
+            for i, field in enumerate(fields):
+                name = field[3:]
+                # Exact match on the whole name: "contig1" must not touch
+                # "contig10", and names need no regex or sed escaping.
+                if field.startswith('SN:') and name in nameDict:
+                    fields[i] = 'SN:' + nameDict[name]
+        renamed.append('\t'.join(fields))
+    return ''.join(line + '\n' for line in renamed)
+
+def rename_bam(inputFile, nameDict, renamedFile):
+    """
+    Write a copy of a BAM file whose header uses the renamed sequence names.
+
+    inputFile   -- path of the BAM file to read
+    nameDict    -- dict mapping original sequence names to renamed ones
+    renamedFile -- path of the reheadered BAM file to write
+
+    The header is extracted with "samtools view -H", the @SQ SN: names are
+    rewritten in Python, and the result is applied with "samtools reheader".
+    Raises subprocess.CalledProcessError if a samtools command exits with a
+    non-zero status, so the failure reaches the caller instead of leaving a
+    truncated output behind.
+    """
+    header = subprocess.check_output(['samtools', 'view', '-H', inputFile],
+                                     universal_newlines=True)
+    with tempfile.NamedTemporaryFile(mode='w', suffix='.sam') as headerFile:
+        headerFile.write(_rename_sam_header(header, nameDict))
+        # samtools re-opens the file by name, so the data must be on disk.
+        headerFile.flush()
+        with open(renamedFile, 'wb') as out:
+            # check_call blocks until samtools has written the whole BAM.
+            subprocess.check_call(['samtools', 'reheader', headerFile.name, inputFile],
+                                  stdout=out)
+
+def rename_bigwig(inputFile, renamedReference, nameDict, renamedFile):
+    """
+    Write a copy of a bigWig file that uses the renamed sequence names.
+
+    inputFile        -- path of the bigWig file to read
+    renamedReference -- path of the renamed reference FASTA; faSize derives
+                        the chromosome sizes file from it
+    nameDict         -- dict mapping original sequence names to renamed ones
+    renamedFile      -- path of the renamed bigWig file to write
+
+    Pipeline: bigWigToBedGraph -> rename_interval -> sort -> bedGraphToBigWig.
+    Raises subprocess.CalledProcessError if any external command exits with
+    a non-zero status.
+    """
+    # Local import: only this function needs the process environment.
+    import os
+
+    # The temporary files are used by name and as stdout targets only, so no
+    # buffering option is needed (the Python 2-only "bufsize" keyword would
+    # raise TypeError on Python 3).
+    bedGraphFile = tempfile.NamedTemporaryFile()
+    chrom_sizes = tempfile.NamedTemporaryFile()
+    renamed_bedGraphFile = tempfile.NamedTemporaryFile()
+    sorted_bedGraphFile = tempfile.NamedTemporaryFile()
+    try:
+        subprocess.check_call(['bigWigToBedGraph', inputFile, bedGraphFile.name])
+        subprocess.check_call(['faSize', '-detailed', '-tab', renamedReference], stdout=chrom_sizes)
+        # Rename before sorting: the order must hold for the *renamed* names,
+        # and an arbitrary mapping need not preserve the original order.
+        rename_interval(bedGraphFile.name, nameDict, renamed_bedGraphFile.name)
+        # bedGraphToBigWig expects byte-wise (C locale) ordering of names.
+        sort_env = dict(os.environ, LC_ALL='C')
+        subprocess.check_call(['sort', '-k1,1', '-k2,2n', renamed_bedGraphFile.name],
+                              stdout=sorted_bedGraphFile, env=sort_env)
+        subprocess.check_call(['bedGraphToBigWig', sorted_bedGraphFile.name, chrom_sizes.name, renamedFile])
+    finally:
+        # Closing a NamedTemporaryFile also deletes it from disk.
+        for tmp in (bedGraphFile, chrom_sizes, renamed_bedGraphFile, sorted_bedGraphFile):
+            tmp.close()
+   
+def getNameDict(nameMapping):
+    """
+    Read the name mapping CSV and return it as a dict.
+
+    nameMapping -- path of a CSV file whose first column is the original
+                   sequence name and whose second column is the renamed one
+
+    Returns a dict {original name: renamed name}. Every row with at least
+    two columns is stored, including a header row if the file has one.
+    Blank lines and rows with a single column are skipped.
+    """
+    with open(nameMapping, 'r') as f:
+        # csv.reader yields [] for blank lines; skip rows with no second column.
+        return {row[0]: row[1] for row in csv.reader(f) if len(row) >= 2}
+
+def main():
+    """
+    Command-line entry point.
+
+    Arguments (sys.argv):
+      1 -- input track file
+      2 -- name mapping CSV
+      3 -- track format: bed, gff3, gtf, bam or bigwig
+      4 -- output file
+      5 -- renamed reference FASTA (required for bigwig only)
+
+    Exits with a message and a non-zero status when arguments are missing
+    or the format is not supported, rather than silently writing nothing.
+    """
+    if len(sys.argv) < 5:
+        sys.exit("Usage: rename_tracks.py <input> <name_mapping.csv> "
+                 "<bed|gff3|gtf|bam|bigwig> <output> [renamed_reference.fasta]")
+    inputFile, nameMapping, inputFormat, outputfile = sys.argv[1:5]
+    nameDict = getNameDict(nameMapping)
+    if inputFormat in ("bed", "gff3", "gtf"):
+        rename_interval(inputFile, nameDict, outputfile)
+    elif inputFormat == "bam":
+        rename_bam(inputFile, nameDict, outputfile)
+    elif inputFormat == "bigwig":
+        if len(sys.argv) < 6:
+            sys.exit("The bigwig format requires the renamed reference FASTA as fifth argument")
+        renamedReference = sys.argv[5]
+        rename_bigwig(inputFile, renamedReference, nameDict, outputfile)
+    else:
+        # An unknown format used to fall through and exit 0 with no output.
+        sys.exit("Unsupported track format: %s" % inputFormat)
+
+if __name__ == "__main__":
+    main()
\ No newline at end of file
b
diff -r 000000000000 -r 8b19a698d90e rename_tracks.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/rename_tracks.xml Mon Jun 25 15:01:41 2018 -0400
[
@@ -0,0 +1,92 @@
+<tool id="rename_tracks" name="rename the tracks" version="1.2">
+<description>a Galaxy tool to rename the scaffold names in the custom track files</description>
+    <requirements>
+        <requirement type="package" version="1.2">samtools</requirement>
+        <requirement type="package" version="340">ucsc_rename_bigwig</requirement>
+    </requirements>
+    <stdio>
+        <exit_code range="1:" />
+    </stdio>
+    <command><![CDATA[
+        python $__tool_directory__/rename_tracks.py "${format_select.input}" "${mapping}" $format_select.format "${output}"
+        #if $format_select.format == "bigwig"
+            "${format_select.reference}"
+        #end if
+
+
+    ]]></command>
+    <inputs>
+        <conditional name="format_select">
+            <param name="format" type="select" label="Select the format of your custom track file">
+                <option value="bed">BED</option>
+                <option value="gff3">GFF3</option>
+                <option value="gtf">GTF</option>
+                <option value="bam">BAM</option>
+                <option value="bigwig">BigWig</option>
+            </param>
+            <when value="bed">
+                <param name="input" type="data" format="bed" label="Custom track file" />
+            </when>
+            <when value="gff3">
+                <param name="input" type="data" format="gff3" label="Custom track file" />
+            </when>
+            <when value="gtf">
+                <param name="input" type="data" format="gtf" label="Custom track file" />
+            </when>
+            <when value="bam">
+                <param name="input" type="data" format="bam" label="Custom track file" />
+            </when>
+            <when value="bigwig">
+                <param name="input" type="data" format="bigwig" label="Custom track file" />
+                <param name="reference" type="data" format="fasta" label="Provide the renamed reference file from the 'rename the scaffolds' tool" />
+            </when>
+        </conditional>
+        <param name="mapping" type="data" format="csv" label="Provide the name mapping file from the 'rename the scaffolds' tool"/>
+    </inputs>
+    <outputs>
+        <data name="output" format_source="input" label="${tool.name} on ${on_string}: renamed_track" />
+    </outputs>
+    <tests>
+        <test>
+            <!-- Test with GFF3 -->
+            <param name="input" value="Augustus.gff3" />
+            <param name="format" value="gff3" />
+            <param name="mapping" value="name_mapping.csv" />
+            <output name="output" file="rename_Augustus.gff3"/>
+        </test>
+        <test>
+            <!-- Test with BED -->
+            <param name="input" value="TrfBig.bed" />
+            <param name="format" value="bed" />
+            <param name="mapping" value="name_mapping.csv" />
+            <output name="output" file="rename_TrfBig.bed"/>
+        </test>
+        <test>
+            <!-- Test with GTF -->
+            <param name="input" value="StringTie_assembled_transcripts.gtf" />
+            <param name="format" value="gtf" />
+            <param name="mapping" value="name_mapping.csv" />
+            <output name="output" file="rename_StringTie.gtf" />
+        </test>
+        <test>
+            <!-- Test with BAM -->
+            <param name="input" value="HISAT.bam" />
+            <param name="format" value="bam" />
+            <param name="mapping" value="name_mapping.csv" />
+            <output name="output" file="rename_HISAT.bam" />
+        </test>
+        <test>
+            <!-- Test with BigWig -->
+            <param name="input" value="sequence_cov.bigwig" />
+            <param name="format" value="bigwig" />
+            <param name="mapping" value="name_mapping.csv" />
+            <param name="reference" value="renamed_reference.fasta" />
+            <output name="output" file="rename_sequence_cov.bigwig" />
+        </test>
+    </tests>
+    <help><![CDATA[
+    This tool renames the scaffold names in custom track files so that the tracks use the same scaffold names as the reference genome renamed by the "rename the scaffolds" tool.
+    ]]></help>
+    <citations>
+    </citations>
+</tool>
\ No newline at end of file
b
diff -r 000000000000 -r 8b19a698d90e test-data/Augustus.gff3
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/Augustus.gff3 Mon Jun 25 15:01:41 2018 -0400
[
b'@@ -0,0 +1,6937 @@\n+##gff-version 3\n+# This output was generated with AUGUSTUS (version 3.1.0).\n+# AUGUSTUS is a gene prediction tool written by Mario Stanke (mario.stanke@uni-greifswald.de),\n+# Oliver Keller, Stefanie K\xc3\xb6nig and Lizzy Gerischer.\n+# Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008),\n+# Using native and syntenically mapped cDNA alignments to improve de novo gene finding\n+# Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013\n+# No extrinsic information on sequences given.\n+# Initialising the parameters using config directory /home/galaxy/galaxy/database/dependencies/augustus/3.1/iuc/package_augustus_3_1/24009970003a/config/ ...\n+# fly version. Using default transition matrix.\n+# Looks like /home/galaxy/galaxy/database/files/000/dataset_283.dat is in fasta format.\n+# We have hints for 0 sequences and for 0 of the sequences in the input set.\n+#\n+# ----- prediction on sequence number 1 (length = 45179, name = contig1) -----\n+#\n+# Predicted genes for sequence number 1 on both strands\n+# start gene contig1.g1\n+contig1\tAUGUSTUS\tgene\t553\t34688\t0.03\t-\t.\tID=contig1.g1\n+contig1\tAUGUSTUS\ttranscript\t553\t34688\t0.03\t-\t.\tID=contig1.g1.t1;Parent=contig1.g1\n+contig1\tAUGUSTUS\tCDS\t553\t578\t0.41\t-\t2\tID=contig1.g1.t1.cds;Parent=contig1.g1.t1\n+contig1\tAUGUSTUS\tCDS\t652\t1047\t0.25\t-\t2\tID=contig1.g1.t1.cds;Parent=contig1.g1.t1\n+contig1\tAUGUSTUS\tCDS\t12541\t12968\t0.87\t-\t1\tID=contig1.g1.t1.cds;Parent=contig1.g1.t1\n+contig1\tAUGUSTUS\tCDS\t32202\t33826\t0.89\t-\t0\tID=contig1.g1.t1.cds;Parent=contig1.g1.t1\n+contig1\tAUGUSTUS\tCDS\t33880\t34044\t0.98\t-\t0\tID=contig1.g1.t1.cds;Parent=contig1.g1.t1\n+contig1\tAUGUSTUS\tCDS\t34107\t34619\t0.99\t-\t0\tID=contig1.g1.t1.cds;Parent=contig1.g1.t1\n+contig1\tAUGUSTUS\tCDS\t34674\t34688\t0.45\t-\t0\tID=contig1.g1.t1.cds;Parent=contig1.g1.t1\n+contig1\tAUGUSTUS\tstart_codon\t34686\t34688\t.\t-\t0\tParent=contig1.g1.t1\n+# coding 
sequence = [atggcagcactctcgcaaaaggactttaatgacggaaaccagagaaatcgtcagaggaaaagtactgtcactgagcagc\n+# cctcatcaacatcaggaagcgtggcccaagtagaagcggacagcgcatcgtcacatttgtctgatcgctgttataacaacatagcaagtactaccaaa\n+# agtattgttggtgatgtgaaaacaagcagacgctgtgaagactttataagtagtggatcagcttcgactccattaaatgaatatgattgtgccaacgc\n+# tgatacgacggatattaaagatgaacctggagattttatagaaacaaattgtcattggcgaagttgttgtattgaatttaatacgcaagatgagcttg\n+# ttaaacatatcaataatgaccatatccaaaccaataagaaggcctttgtctgtcgatgggaaaattgtacccgtggtgaaaaacctttcaaagcgcag\n+# tatatgctagttgtgcatatgcgtcgtcataccggcgaaaagccacataaatgcacatttgaaggctgttttaaggcatattcacgcttggaaaacct\n+# aaaaacacatttacggtcacacacaggtgaaaaaccctatatgtgcgagtatccgggatgcagcaaggcgtttagtaatgcaagcgatcgtgcaaagc\n+# atcaaaatcgtactcacagtaatgagaaaccgtacatttgtaaagctcctggttgcacgaaacgttacaccgacccaagttctttgcgtaaacatgtt\n+# aaaacagttcatggtgctgagttttatgctaataaaaaacacaagggattgcccctaaatgatgcgaactctcgcctccaccgagacagtggccaagg\n+# tcggcataatcttcaagagcataatattgactctagcccttgcagcgaagaacttcaggtgggaaaacttataggcatgtctagtcccagtattaaat\n+# ctgaatctgatgaaagttcaccacatcatcagttgttaagtggagttcgagcttcagactgttttttaacatattcacaagatggtgccgccgaacat\n+# ataactttagatgacggctgggattgtgacgatgacgttgacgtggccgacttaccaattgtcttgcgtgctatggtaaatgttggcagcggaaattc\n+# gatggccccgaccattggagggggtgttgttgcgaggcagcgatttagaagtcgtttgcaaactaaaggaataaactctagtatggttatgcttggca\n+# acatccccgaaagcaatcgcaccattggaataagcgaacttaaccagcgtataacagaacttaagatggagcctggtaccgcttgtgatattacagtt\n+# ccattgaatacggggctggaaaggatttcagaagacttatcacaaaatcaatcaaatataacattaaataagcaaagcttctttaccgcttccggctc\n+# tctccaaggacattttcgtcgcgatagccagaactccactgcaagtacatattatggtagcatgcaaagtcgccgcagtagtcaatcatctcaggtgt\n+# cttctatatctacaatgcgtccaggcccatcgtacaacacaaccacagcttccctctatgatccaatttccccaggatgctctcgacgctctagccaa\n+# atgtctaatgtagtcaactcctacgcacttacatcaacatcaggattgactgcaattaacaaggacttaaatgcaaacagcagcccaaatgcttctat\n+# taataaaccgggtcttggtggtcagtactttggtttttacaataacagtcttcctccacctccatcgtctcatttaattgccaccaatttgaagcatc\n+# 
tgcaggacacagactctaggagttgttatcacaacacaactggcggtcgattttccattcccaattgtacgccatctctacatttagactacaatgga\n+# ccggctggagagcaggaaattgataaagaaatcccgaataacatattacgacgtcaatctgagccaatgccaaacataagtttg'..b'gt\n+# tttcgtgttggacgaatattgcgctcgctatggtgtgcggggatgctaccgacatttatgctacctttctgatttactggatcgtgcagaaaagcaac\n+# acatgatagatccaacactaattcactattcatttgcgttttgcgcaagccacgttcacggaaatcgacctgatggggtaggaagcattacgcatgag\n+# gaaaaggaaaaattttctgaaatcaaagaacgcctacgtcagttactggagtttcaaataaccaattttagatactgttttcctttcggtcgccccga\n+# aggcgctcttaaagcgacattatctttactagagagagtgctaatgaaagacattgttacccctgttccacctgaagaagttcgtcaaatgattaaaa\n+# aaagtttagagacggcagcgcttgtaaattacacccgtctctccaataaagctaagattgaaggcacttttccgttcaagggacacgtgccagggaaa\n+# tcctatcggaatttcaaaatttttccaagcactttcctgtacacgggaaacgtcccagggaaagcctatcggaaaggtcccagggaaatcccgtcgga\n+# tattcaggatttgcgaggagaggttattgttccgcccccaaaaaaactagaggacctaattcacttagcagaactttgtgttgatctgttgcaacaaa\n+# atgaagagcactatggagaactgcgcaaacatgacaaaatggataaaattaaaatgcgtaaggaagatgatgatgtaccaaaaggccacaatgaaagc\n+# gatattgatttaaccgccaatactggactcagtagcacatcagacctggcttctgcagcatcaactaatggatcgtcatttcgttattataatttgag\n+# gaatgggcgttttcatcagcacctgcgagacacattcgcaccattagtcgtgcggtacgtggatctgatggaatcttcaatagctcagtcgattcata\n+# agggatttgaaaaagaacgctgggaaagtaaagggaacggatgtgccacctctgaagacttattttggaaactagatgctctacagtcgtttataaga\n+# gacctgcactggccagacgcagagtttcgacaacatttagaacagcgtcttaaaatgatggccgtcgatatgatagagcaatgtatacaacgaactga\n+# ttcgtcttttcagtcgtggctaaaaaaaaacattgccttcatatcaactgattatattttaccttcagaaatgtgcgctatggtcaatgtgatattag\n+# atgctaaaaatcaaagctttaaattgactactattgacggcattgatttgtataaatttcatgcaaaaattgacgaccaaatcgacaaagcgaatgta\n+# gctatgacacaaggtctaactggtaaacttatgtcagtgctagagtcgactttgtcaaaattagcacgatacgacgaaggtagcctaatcggctcgat\n+# tcttagttttacaaatgtatcgagctcgggaaaggatctcgggcaaggatatgtaaatttctttagaaataatatggatcaagtacgaggaaaaattg\n+# gcgacgatttatggaccctgaatttctttgagcagtggtactcgcagcagattaacatgctatgtaattggctttcggaacgtttggaccacgctctg\n+# 
cactacgctcaagtttcatctatttctcacattatcaagaaaatatattcagacttcgaattacaaggtgtattagaagataaattaaactctaaagc\n+# atatcaagcagtcgcacagcgaatggcgacagaggaagcgacatgtgctttgacaatgcctgatgttagcgaagatgaaccctgtgacgacattcgag\n+# aaggggaagaagaagatactggcgacgaatctacctctaacataccaaggggcttaccaaaaccaaaaattgctgccgctcaagctgctgctgttacc\n+# aacgttgttgccggccgtgtgggtaatttactcggcaaaggcattggcggccttagttcaaagttgggaagtggaagttggttttaa]\n+# protein sequence = [MIDPSSSEEEGEDDPIANVSSKGRLTHAPKGTNTVSILGGVSGPGVGSNMAISGSNGDLAGNQRQSNISSISNRNDAG\n+# NVAGVGGSSNKNEQIHGSRVDGGNLEVPNSCIPSGVSQETLNQSIGSSRANSLPRPLSPSPSLTSEKPDTGDPHAFLKGETQIMADEAFQNAVQSYHD\n+# VFLKSERVLKMVQSGASSQHDFREVFRNNIEKRVRSLPEIDGLSKETVLTSWMAKFDIILKGTGEEDSKRPSRMQQSLNSELILSKEQLYDMFQQILL\n+# VKKFEHQILYNALMLDSADEQAAAIRRELDGRMQRVGEMEKNRKLMPKFVLKEMESLYVEELKSSINLLMANLESLPVSKGNMDSKYGLQKLKRYNHR\n+# KLILRSHGSLSKLEGDSEDGSTQLTKLDVVLTFQLEVIVMEVKGLKSLAPNRIVYCTMEVENGEKLQTDQAEASKPMWDTQGDFTTTHPLPVVKVKLY\n+# TENPGMLALEDKELGKVILKPTPLSSKSPEWHRMVIPKNLPDQDIRIKIACRLDKPLNMKHCGYKEKKSEPSEMMQLDGYTVDYIEAASANLMFGIDL\n+# NGGRFFFNAVREGDSISFACDDENECSLWVMAMYRATGQSHKPTPPITQDKNSAMSKIQGARVAPDGSIFLWASFFVAAATRNSSSYHWFRVGGRLNP\n+# MVVSAAARMEWDMCAQSPLASTWRGIGWWSSSERGQPYDLVDVEVPKSGATHYHVSCRGEVNQPETVVRDGLMEAESTDGGVKDAFATELCVEVPEDK\n+# LHVVVWGWFSPGQVFVLDEYCARYGVRGCYRHLCYLSDLLDRAEKQHMIDPTLIHYSFAFCASHVHGNRPDGVGSITHEEKEKFSEIKERLRQLLEFQ\n+# ITNFRYCFPFGRPEGALKATLSLLERVLMKDIVTPVPPEEVRQMIKKSLETAALVNYTRLSNKAKIEGTFPFKGHVPGKSYRNFKIFPSTFLYTGNVP\n+# GKAYRKGPREIPSDIQDLRGEVIVPPPKKLEDLIHLAELCVDLLQQNEEHYGELRKHDKMDKIKMRKEDDDVPKGHNESDIDLTANTGLSSTSDLASA\n+# ASTNGSSFRYYNLRNGRFHQHLRDTFAPLVVRYVDLMESSIAQSIHKGFEKERWESKGNGCATSEDLFWKLDALQSFIRDLHWPDAEFRQHLEQRLKM\n+# MAVDMIEQCIQRTDSSFQSWLKKNIAFISTDYILPSEMCAMVNVILDAKNQSFKLTTIDGIDLYKFHAKIDDQIDKANVAMTQGLTGKLMSVLESTLS\n+# KLARYDEGSLIGSILSFTNVSSSGKDLGQGYVNFFRNNMDQVRGKIGDDLWTLNFFEQWYSQQINMLCNWLSERLDHALHYAQVSSISHIIKKIYSDF\n+# ELQGVLEDKLNSKAYQAVAQRMATEEATCALTMPDVSEDEPCDDIREGEEEDTGDESTSNIPRGLPKPKIAAAQAAAVTNVVAGRVGNLLGKGIGGLS\n+# SKLGSGSWF]\n+# end gene contig70.g117\n+###\n+# 
command line:\n+# augustus --strand=both --noInFrameStop=false --gff3=on --uniqueGeneId=true --protein=on --codingseq=on --introns=off --stop=off --stop=off --cds=on --singlestrand=false /home/galaxy/galaxy/database/files/000/dataset_283.dat --UTR=off --genemodel=complete --species=fly\n'
b
diff -r 000000000000 -r 8b19a698d90e test-data/HISAT.bam
b
Binary file test-data/HISAT.bam has changed
b
diff -r 000000000000 -r 8b19a698d90e test-data/StringTie_assembled_transcripts.gtf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/StringTie_assembled_transcripts.gtf Mon Jun 25 15:01:41 2018 -0400
b
@@ -0,0 +1,11 @@
+# stringtie /home/galaxy/galaxy/database/files/000/dataset_328.dat -o /home/galaxy/galaxy/database/files/000/dataset_332.dat -p 1
+# StringTie version 1.2.3
+contig16 StringTie transcript 1751 17824 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; cov "14.618678"; FPKM "322160.531250"; TPM "866155.937500";
+contig16 StringTie exon 1751 1897 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "1"; cov "6.787892";
+contig16 StringTie exon 11285 11463 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "2"; cov "19.860081";
+contig16 StringTie exon 11518 11705 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "3"; cov "23.926477";
+contig16 StringTie exon 11759 11858 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "4"; cov "17.452721";
+contig16 StringTie exon 11922 11975 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "5"; cov "11.461867";
+contig16 StringTie exon 12601 12811 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "6"; cov "11.876496";
+contig16 StringTie exon 17222 17337 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "7"; cov "15.915709";
+contig16 StringTie exon 17406 17824 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "8"; cov "11.738873";
b
diff -r 000000000000 -r 8b19a698d90e test-data/TrfBig.bed
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/TrfBig.bed Mon Jun 25 15:01:41 2018 -0400
b
b'@@ -0,0 +1,602 @@\n+contig1\t9130\t9428\ttrf\t163\t1.8\t164\t86\t2\t438\t36\t12\t13\t37\t1.82\tAAAAAAAATTATATCTTCGGTGTTTTTCAACATACAACCTCCTAAGCTTGGAAATAACATTTCTTAATCAGTTCTGAATTTCGAATTAAATTTTTATCAAAATCGGACAACTATACCATATAGCTGTCATAGGAAGGATTGGATAATTAGTGGTAAAATAATAT\n+contig1\t15707\t15757\ttrf\t20\t2.5\t19\t83\t9\t55\t32\t12\t2\t54\t1.49\tTATATCATTTATATCTCAG\n+contig1\t16261\t16302\ttrf\t12\t3.4\t12\t89\t0\t64\t2\t36\t24\t36\t1.69\tTCCGTCTGTCCG\n+contig1\t23387\t23483\ttrf\t45\t2.2\t45\t92\t1\t158\t19\t22\t30\t27\t1.98\tTCGGCGAAGAAATGTGCCACTTCGGCGGCACTTCTTGGAGTCACT\n+contig1\t23451\t23520\ttrf\t24\t2.9\t24\t80\t0\t75\t15\t26\t27\t30\t1.96\tTTCGGCGACACTTCTTGAAGTCAG\n+contig1\t24200\t24233\ttrf\t15\t2.2\t15\t94\t0\t57\t51\t12\t15\t21\t1.75\tAAACAATGGAATGCT\n+contig1\t29159\t29628\ttrf\t162\t2.9\t160\t80\t8\t518\t37\t12\t11\t38\t1.80\tGGAAAACATGAAATAAAAATTATATCTTTCGTGTTTTTTAACATATACCTTCTAAGCTTGAAAATAACATTTTTTATTTGTTCTGAATTTCGAATTAAATTTTATCAAAATCGGACGACTATATCATATAGCTGTCATAGGAACAATCGGAAAATAAGTA\n+contig1\t37571\t37606\ttrf\t8\t4.4\t8\t88\t0\t52\t31\t25\t42\t0\t1.55\tGACGGACA\n+contig1\t38436\t38491\ttrf\t8\t6.9\t8\t79\t8\t58\t0\t38\t27\t34\t1.57\tTGTCCGTC\n+contig1\t38436\t38491\ttrf\t12\t4.6\t12\t81\t0\t65\t0\t38\t27\t34\t1.57\tTGTCCGTCCGTC\n+contig1\t38436\t38491\ttrf\t20\t3.1\t18\t80\t17\t69\t0\t38\t27\t34\t1.57\tTGTCCGTCTGTCCGTCCG\n+contig1\t43116\t43168\ttrf\t2\t26.0\t2\t96\t0\t95\t48\t0\t1\t50\t1.12\tTA\n+contig2\t540\t590\ttrf\t20\t2.5\t19\t83\t9\t55\t32\t12\t2\t54\t1.49\tTATATCATTTATATCTCAG\n+contig2\t1094\t1135\ttrf\t12\t3.4\t12\t89\t0\t64\t2\t36\t24\t36\t1.69\tTCCGTCTGTCCG\n+contig2\t8220\t8316\ttrf\t45\t2.2\t45\t92\t1\t158\t19\t22\t30\t27\t1.98\tTCGGCGAAGAAATGTGCCACTTCGGCGGCACTTCTTGGAGTCACT\n+contig2\t8284\t8353\ttrf\t24\t2.9\t24\t80\t0\t75\t15\t26\t27\t30\t1.96\tTTCGGCGACACTTCTTGAAGTCAG\n+contig2\t9033\t9066\ttrf\t15\t2.2\t15\t94\t0\t57\t51\t12\t15\t21\t1.75\tAAACAATGGAATGCT\n+contig2\t13992\t14461\ttrf\t162\t2.9\t160\t80\t8\t518\t37\t12\t11\t38\t1.80\tGGAAAACATG
AAATAAAAATTATATCTTTCGTGTTTTTTAACATATACCTTCTAAGCTTGAAAATAACATTTTTTATTTGTTCTGAATTTCGAATTAAATTTTATCAAAATCGGACGACTATATCATATAGCTGTCATAGGAACAATCGGAAAATAAGTA\n+contig2\t22404\t22439\ttrf\t8\t4.4\t8\t88\t0\t52\t31\t25\t42\t0\t1.55\tGACGGACA\n+contig2\t23269\t23324\ttrf\t8\t6.9\t8\t79\t8\t58\t0\t38\t27\t34\t1.57\tTGTCCGTC\n+contig2\t23269\t23324\ttrf\t12\t4.6\t12\t81\t0\t65\t0\t38\t27\t34\t1.57\tTGTCCGTCCGTC\n+contig2\t23269\t23324\ttrf\t20\t3.1\t18\t80\t17\t69\t0\t38\t27\t34\t1.57\tTGTCCGTCTGTCCGTCCG\n+contig2\t27949\t28001\ttrf\t2\t26.0\t2\t96\t0\t95\t48\t0\t1\t50\t1.12\tTA\n+contig2\t38280\t38311\ttrf\t16\t1.9\t16\t93\t0\t53\t41\t19\t6\t32\t1.77\tTACATACATACATATG\n+contig3\t3265\t3296\ttrf\t16\t1.9\t16\t93\t0\t53\t41\t19\t6\t32\t1.77\tTACATACATACATATG\n+contig3\t17933\t17958\ttrf\t10\t2.5\t10\t100\t0\t50\t60\t8\t0\t32\t1.26\tATATAAACAT\n+contig3\t19067\t19124\ttrf\t28\t2.0\t28\t100\t0\t114\t43\t14\t10\t31\t1.79\tAATTAAATTTTATCAAAATCGGACGACT\n+contig3\t23368\t23418\ttrf\t2\t25.0\t2\t100\t0\t100\t50\t0\t0\t50\t1.00\tAT\n+contig3\t24889\t25322\ttrf\t160\t2.7\t161\t80\t6\t452\t36\t12\t12\t38\t1.82\tAATATTAAAAATTATATCTTTGGTGTTTTTTAACATATAACCTTCTAAGCTTGGAAATAACATTTTTTATTTGGTTTAATTTCGAATTAAATTTTATTAAAATCGGACGACCATATCATACAGCTCCCATAGAAACAATCGGAAAATTAGTCGGAAACATG\n+contig3\t26816\t26900\ttrf\t18\t5.0\t16\t83\t13\t89\t20\t5\t0\t73\t1.03\tTTTTTTTATATATTTT\n+contig3\t26816\t26887\ttrf\t18\t4.1\t17\t84\t12\t90\t19\t4\t0\t76\t0.96\tTTTTTTTATATATTTTT\n+contig3\t26816\t26900\ttrf\t15\t5.2\t15\t79\t16\t71\t20\t5\t0\t73\t1.03\tTTTTTTTATATATAT\n+contig3\t26820\t26887\ttrf\t17\t3.7\t19\t80\t20\t74\t20\t4\t0\t74\t0.99\tTTTATATATTTTTTTTTCA\n+contig3\t29468\t29515\ttrf\t25\t2.0\t23\t84\t12\t60\t34\t0\t17\t48\t1.47\tATTATAATTATGATGTTATGATG\n+contig3\t38756\t38791\ttrf\t10\t3.6\t10\t92\t7\t63\t40\t0\t0\t60\t0.97\tATTTATTTAA\n+contig3\t38758\t38788\ttrf\t9\t3.2\t9\t95\t4\t51\t40\t0\t0\t60\t0.97\tTTATTTAAA\n+contig4\t7931\t7956\ttrf\t10\t2.5\t10\t100\t0\t50\t60\t8\t0\t32\t1.26\tATATAAACAT\n+contig4\
t9065\t9122\ttrf\t28\t2.0\t28\t100\t0\t114\t43\t14\t10\t31\t1.79\tAATTAAATTTTATCAAAATCGGACGACT\n+contig4\t13366\t13416\ttrf\t2\t25.0\t2\t100\t0\t100\t50\t0\t0\t50\t1.00\tAT\n+contig4\t14887\t15320\ttrf\t160\t2.7\t161\t80\t6\t452\t36\t12\t12\t38\t1.82\tAATATTAAAAATTATATCTTTGGTGTTTTTTAACATATAACCTTCTAAGCTTGGAAATAACATTTTTTATTTGGTTTAATTTCGAATTAAATTTTATTAAAATCGGACGACCATATCATACAGCTCCCATAGAAACAATCGGAAAATTAGTCGGAAACATG\n+contig4\t16814\t16898\ttrf\t18\t5.0\t16\t83\t13\t89\t20\t5\t0\t73\t1.03\tTTTTTTTATATATTTT\n+contig4\t16814\t16885\ttrf\t18\t4.1\t17\t84\t12\t90\t19\t4\t0\t76\t0.96\tTTTTTTTATATATTTTT\n+contig4\t16814\t16898\ttrf\t15\t5.2\t15\t79\t16\t71\t20\t5\t0\t73\t1.03\tTTTTTTTATATATAT'..b'\n+contig69\t18503\t18850\ttrf\t163\t2.1\t163\t88\t3\t502\t36\t12\t16\t35\t1.86\tCTTTGGTGCTATTTGACATATAACCTCCTAAGCTTGGAAATATCATTTTTTAATTGATTTTGAAATTCAAATTAAATTTGATCAAAATCGGACGACTATATCATATAGCTGTCATAGGAACGATCGGAAAATTGGTGGAAAAATAATATGAAACAAATTATAG\n+contig69\t18536\t18888\ttrf\t163\t2.2\t161\t85\t4\t472\t36\t9\t16\t37\t1.82\tTTGGAAATACAATTTTTTATATTTATGAAATTCAAATTAAATTTGATCAAAATCGGACGACTATATCATATAGCTGTCATAGGAACGATCGGAAAATTGGTGGAAAAATAATATGAAACAAATTATAGCTTTGGAGCTGTTTGACATATAACCCTATAAGA\n+contig69\t19781\t19812\ttrf\t15\t2.1\t14\t94\t5\t53\t58\t0\t0\t41\t0.98\tATATAATTATAATA\n+contig69\t23637\t24060\ttrf\t162\t2.7\t156\t83\t6\t496\t37\t11\t12\t38\t1.79\tAAAAAAATTATATCTTCGGTGCTTTTTAACATATAACCTTCTAAGCTTGGAAATAACATTTTTTAATTAGTTCTGAATTTCAATTAAATTTTATCAAAATCGGACGACTTATAGCTGCCATAGGAACGATCGAAAAATTGATGGGAAAATAAATAT\n+contig69\t36863\t36892\ttrf\t15\t1.9\t15\t100\t0\t58\t27\t20\t48\t3\t1.66\tGGGGAACGCGAGCAT\n+contig69\t38645\t39124\ttrf\t158\t3.0\t157\t85\t5\t615\t34\t13\t13\t38\t1.84\tTAAAAATTGTTATTTCCAAGCTTAGAAGGTTATATGTTAAAAAACACCAAGATATAATTTTTTCATATTTTCCGACTATTTTTCCGATCGTTTCTATGGCAGCTATATGATATAGTCGTCCGATTTTGATAAAATTTAATTTGAAATTAAAACCAAT\n+contig69\t43653\t44084\ttrf\t162\t2.7\t162\t87\t4\t586\t40\t10\t13\t35\t1.79\tAACATTTTTTAATTAGTTCTGAATTTCGAATTAAATTTTATCAAAATCGGAAGACTATATCATATAGCTGTCATAGGAACGA
TCGAAAAATTGGTGGAAAATAATATAATAAAAATTATATCCTTGGTATTTTTTAACATATAACAATATAAGCTAGAAAAG\n+contig70\t6910\t6939\ttrf\t15\t1.9\t15\t100\t0\t58\t27\t20\t48\t3\t1.66\tGGGGAACGCGAGCAT\n+contig70\t8692\t9171\ttrf\t158\t3.0\t157\t85\t5\t615\t34\t13\t13\t38\t1.84\tTAAAAATTGTTATTTCCAAGCTTAGAAGGTTATATGTTAAAAAACACCAAGATATAATTTTTTCATATTTTCCGACTATTTTTCCGATCGTTTCTATGGCAGCTATATGATATAGTCGTCCGATTTTGATAAAATTTAATTTGAAATTAAAACCAAT\n+contig70\t13700\t14131\ttrf\t162\t2.7\t162\t87\t4\t586\t40\t10\t13\t35\t1.79\tAACATTTTTTAATTAGTTCTGAATTTCGAATTAAATTTTATCAAAATCGGAAGACTATATCATATAGCTGTCATAGGAACGATCGAAAAATTGGTGGAAAATAATATAATAAAAATTATATCCTTGGTATTTTTTAACATATAACAATATAAGCTAGAAAAG\n+contig70\t17962\t18295\ttrf\t161\t2.1\t160\t83\t5\t413\t37\t12\t13\t35\t1.84\tAAAAAATTATATCTCTGGTGTTTTTAAACATATAACCTCCTAAACTTGGAAATAACATTTTATAATTAGTTCTGAATTTCGAATTAAATTTTATCAAAACCCGACGACTATATCATACATGTAACTGTAACGATCGGAAAATTGATGGGAAAATAATATG\n+contig70\t19030\t19306\ttrf\t137\t2.0\t137\t94\t1\t482\t39\t13\t13\t34\t1.83\tTTTAACACATACCTTTCTAAGCTTGGATATAACATTTTTAAACTGGTTCTGAATTTCAAATTAAATTCAATTAAAATCGGACGACTATATCATATAGCTCCCATAGGAAAAATCGGAAAATTAGTGAGAAAATAATA\n+contig70\t22269\t22308\ttrf\t19\t2.1\t19\t100\t0\t78\t58\t15\t15\t10\t1.62\tAACTAAGGAAATACCAGAA\n+contig70\t22812\t23252\ttrf\t162\t2.8\t156\t84\t5\t562\t37\t11\t13\t37\t1.81\tTTCTAAGCTTGAAATAACATTTTTTAATTAGTTCTGAATTTCGAATTTAATTTTATTAAAATCGGACGACTATATCATATAGCTGCCATAGGAACGATCGGAAAATTAGTGGAAAATAATAAATAAAAATTATATTTGTATTTTTAACATATAACC\n+contig70\t23421\t23486\ttrf\t13\t4.7\t13\t70\t20\t51\t38\t0\t0\t61\t0.96\tATATATATAATTT\n+contig70\t23426\t23479\ttrf\t7\t7.4\t7\t79\t12\t54\t35\t0\t0\t64\t0.94\tTATATTT\n+contig70\t23430\t23486\ttrf\t27\t2.0\t27\t83\t10\t69\t35\t0\t0\t64\t0.94\tATTTATATATTTATTAATATATTTTAT\n+contig70\t25576\t25606\ttrf\t12\t2.5\t12\t94\t0\t51\t33\t26\t36\t3\t1.73\tACGGACGGACAG\n+contig70\t27263\t27382\ttrf\t63\t1.9\t63\t85\t3\t168\t27\t25\t21\t26\t1.99\tATTTTTCCAAGCACTTTCCTGTACAAGGGAAACGTCCCAGGGAAAGCCTATCGGAATTTCAAA\n+contig70\t27353\t27406\ttrf\t25\t2.1\t25\t85\t
0\t70\t30\t26\t32\t11\t1.91\tGGAAACGTCCCAGGGAAAGCCCATC\n+contig70\t27848\t27878\ttrf\t12\t2.5\t12\t88\t0\t51\t30\t30\t40\t0\t1.57\tACGGACGGACAG\n+contig70\t35504\t35713\ttrf\t102\t2.0\t102\t99\t0\t409\t37\t12\t13\t36\t1.82\tAAAACGATGGTAGACAAATATGCATATATTTTTTACACAAAACGAAATATAATGGACTTTTAAAAATTCTTTTTTCTATCTTTCCTGGTGGGAGATATATAT\n+contig70\t43333\t43446\ttrf\t57\t2.0\t57\t94\t0\t199\t30\t17\t22\t29\t1.97\tAATATTGGGAATAACATATTATCTTATAATATGGGAGCGCGAAGGCTCCTCGCCCAT\n+contig70\t44242\t44281\ttrf\t7\t5.7\t7\t81\t6\t53\t28\t20\t12\t38\t1.89\tTACATGT\n+contig70\t44241\t44281\ttrf\t13\t2.9\t14\t85\t7\t55\t27\t22\t12\t37\t1.90\tCTACATGTTACATG\n+contig70\t44485\t44531\ttrf\t14\t3.3\t14\t84\t0\t65\t41\t21\t10\t26\t1.86\tAACCGTATATGACT\n+contig70\t45147\t45181\ttrf\t16\t2.0\t17\t88\t11\t52\t52\t0\t2\t44\t1.16\tAAATATTAGTAATATAT\n+contig70\t46706\t46990\ttrf\t147\t1.9\t147\t100\t0\t568\t39\t10\t9\t40\t1.72\tTTCTTTATTTTTTTTATTTTAAAATACTTAGTACTTAGTAATGTCGCTAAAACCAATATAATATTCTTTAAAATTTAGAAAATATATTCAGACTTCGAATTACAAGGTGTATTAGAAGATAAATTAAACTCTAAAGCTTAATTTATC\n+contig70\t53900\t53978\ttrf\t28\t2.8\t28\t80\t5\t97\t15\t43\t5\t35\t1.69\tCTCTGTCACCCTCTCTTTACCTACCTCA\n'
b
diff -r 000000000000 -r 8b19a698d90e test-data/name_mapping.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/name_mapping.csv Mon Jun 25 15:01:41 2018 -0400
b
@@ -0,0 +1,71 @@
+Original sequence name,Renamed sequence name
+contig1,scaffold_1
+contig2,scaffold_2
+contig3,scaffold_3
+contig4,scaffold_4
+contig5,scaffold_5
+contig6,scaffold_6
+contig7,scaffold_7
+contig8,scaffold_8
+contig9,scaffold_9
+contig10,scaffold_10
+contig11,scaffold_11
+contig12,scaffold_12
+contig13,scaffold_13
+contig14,scaffold_14
+contig15,scaffold_15
+contig16,scaffold_16
+contig17,scaffold_17
+contig18,scaffold_18
+contig19,scaffold_19
+contig20,scaffold_20
+contig21,scaffold_21
+contig22,scaffold_22
+contig23,scaffold_23
+contig24,scaffold_24
+contig25,scaffold_25
+contig26,scaffold_26
+contig27,scaffold_27
+contig28,scaffold_28
+contig29,scaffold_29
+contig30,scaffold_30
+contig31,scaffold_31
+contig32,scaffold_32
+contig33,scaffold_33
+contig34,scaffold_34
+contig35,scaffold_35
+contig36,scaffold_36
+contig37,scaffold_37
+contig38,scaffold_38
+contig39,scaffold_39
+contig40,scaffold_40
+contig41,scaffold_41
+contig42,scaffold_42
+contig43,scaffold_43
+contig44,scaffold_44
+contig45,scaffold_45
+contig46,scaffold_46
+contig47,scaffold_47
+contig48,scaffold_48
+contig49,scaffold_49
+contig50,scaffold_50
+contig51,scaffold_51
+contig52,scaffold_52
+contig53,scaffold_53
+contig54,scaffold_54
+contig55,scaffold_55
+contig56,scaffold_56
+contig57,scaffold_57
+contig58,scaffold_58
+contig59,scaffold_59
+contig60,scaffold_60
+contig61,scaffold_61
+contig62,scaffold_62
+contig63,scaffold_63
+contig64,scaffold_64
+contig65,scaffold_65
+contig66,scaffold_66
+contig67,scaffold_67
+contig68,scaffold_68
+contig69,scaffold_69
+contig70,scaffold_70
b
diff -r 000000000000 -r 8b19a698d90e test-data/rename_Augustus.gff3
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/rename_Augustus.gff3 Mon Jun 25 15:01:41 2018 -0400
[
b'@@ -0,0 +1,6937 @@\n+##gff-version 3\n+# This output was generated with AUGUSTUS (version 3.1.0).\n+# AUGUSTUS is a gene prediction tool written by Mario Stanke (mario.stanke@uni-greifswald.de),\n+# Oliver Keller, Stefanie K\xc3\xb6nig and Lizzy Gerischer.\n+# Please cite: Mario Stanke, Mark Diekhans, Robert Baertsch, David Haussler (2008),\n+# Using native and syntenically mapped cDNA alignments to improve de novo gene finding\n+# Bioinformatics 24: 637-644, doi 10.1093/bioinformatics/btn013\n+# No extrinsic information on sequences given.\n+# Initialising the parameters using config directory /home/galaxy/galaxy/database/dependencies/augustus/3.1/iuc/package_augustus_3_1/24009970003a/config/ ...\n+# fly version. Using default transition matrix.\n+# Looks like /home/galaxy/galaxy/database/files/000/dataset_283.dat is in fasta format.\n+# We have hints for 0 sequences and for 0 of the sequences in the input set.\n+#\n+# ----- prediction on sequence number 1 (length = 45179, name = contig1) -----\n+#\n+# Predicted genes for sequence number 1 on both strands\n+# start gene 
contig1.g1\n+scaffold_1\tAUGUSTUS\tgene\t553\t34688\t0.03\t-\t.\tID=scaffold_1.g1\n+scaffold_1\tAUGUSTUS\ttranscript\t553\t34688\t0.03\t-\t.\tID=scaffold_1.g1.t1;Parent=scaffold_1.g1\n+scaffold_1\tAUGUSTUS\tCDS\t553\t578\t0.41\t-\t2\tID=scaffold_1.g1.t1.cds;Parent=scaffold_1.g1.t1\n+scaffold_1\tAUGUSTUS\tCDS\t652\t1047\t0.25\t-\t2\tID=scaffold_1.g1.t1.cds;Parent=scaffold_1.g1.t1\n+scaffold_1\tAUGUSTUS\tCDS\t12541\t12968\t0.87\t-\t1\tID=scaffold_1.g1.t1.cds;Parent=scaffold_1.g1.t1\n+scaffold_1\tAUGUSTUS\tCDS\t32202\t33826\t0.89\t-\t0\tID=scaffold_1.g1.t1.cds;Parent=scaffold_1.g1.t1\n+scaffold_1\tAUGUSTUS\tCDS\t33880\t34044\t0.98\t-\t0\tID=scaffold_1.g1.t1.cds;Parent=scaffold_1.g1.t1\n+scaffold_1\tAUGUSTUS\tCDS\t34107\t34619\t0.99\t-\t0\tID=scaffold_1.g1.t1.cds;Parent=scaffold_1.g1.t1\n+scaffold_1\tAUGUSTUS\tCDS\t34674\t34688\t0.45\t-\t0\tID=scaffold_1.g1.t1.cds;Parent=scaffold_1.g1.t1\n+scaffold_1\tAUGUSTUS\tstart_codon\t34686\t34688\t.\t-\t0\tParent=scaffold_1.g1.t1\n+# coding sequence = [atggcagcactctcgcaaaaggactttaatgacggaaaccagagaaatcgtcagaggaaaagtactgtcactgagcagc\n+# cctcatcaacatcaggaagcgtggcccaagtagaagcggacagcgcatcgtcacatttgtctgatcgctgttataacaacatagcaagtactaccaaa\n+# agtattgttggtgatgtgaaaacaagcagacgctgtgaagactttataagtagtggatcagcttcgactccattaaatgaatatgattgtgccaacgc\n+# tgatacgacggatattaaagatgaacctggagattttatagaaacaaattgtcattggcgaagttgttgtattgaatttaatacgcaagatgagcttg\n+# ttaaacatatcaataatgaccatatccaaaccaataagaaggcctttgtctgtcgatgggaaaattgtacccgtggtgaaaaacctttcaaagcgcag\n+# tatatgctagttgtgcatatgcgtcgtcataccggcgaaaagccacataaatgcacatttgaaggctgttttaaggcatattcacgcttggaaaacct\n+# aaaaacacatttacggtcacacacaggtgaaaaaccctatatgtgcgagtatccgggatgcagcaaggcgtttagtaatgcaagcgatcgtgcaaagc\n+# atcaaaatcgtactcacagtaatgagaaaccgtacatttgtaaagctcctggttgcacgaaacgttacaccgacccaagttctttgcgtaaacatgtt\n+# aaaacagttcatggtgctgagttttatgctaataaaaaacacaagggattgcccctaaatgatgcgaactctcgcctccaccgagacagtggccaagg\n+# 
tcggcataatcttcaagagcataatattgactctagcccttgcagcgaagaacttcaggtgggaaaacttataggcatgtctagtcccagtattaaat\n+# ctgaatctgatgaaagttcaccacatcatcagttgttaagtggagttcgagcttcagactgttttttaacatattcacaagatggtgccgccgaacat\n+# ataactttagatgacggctgggattgtgacgatgacgttgacgtggccgacttaccaattgtcttgcgtgctatggtaaatgttggcagcggaaattc\n+# gatggccccgaccattggagggggtgttgttgcgaggcagcgatttagaagtcgtttgcaaactaaaggaataaactctagtatggttatgcttggca\n+# acatccccgaaagcaatcgcaccattggaataagcgaacttaaccagcgtataacagaacttaagatggagcctggtaccgcttgtgatattacagtt\n+# ccattgaatacggggctggaaaggatttcagaagacttatcacaaaatcaatcaaatataacattaaataagcaaagcttctttaccgcttccggctc\n+# tctccaaggacattttcgtcgcgatagccagaactccactgcaagtacatattatggtagcatgcaaagtcgccgcagtagtcaatcatctcaggtgt\n+# cttctatatctacaatgcgtccaggcccatcgtacaacacaaccacagcttccctctatgatccaatttccccaggatgctctcgacgctctagccaa\n+# atgtctaatgtagtcaactcctacgcacttacatcaacatcaggattgactgcaattaacaaggacttaaatgcaaacagcagcccaaatgcttctat\n+# taataaaccgggtcttggtggtcagtactttggtttttacaataacagtcttcctccacctccatcgtctcatttaattgccaccaatttgaagcatc\n+# tgcaggacacagactctaggagttgttatcacaacacaactggcggtcgattttccattcccaattgtacgccatctctacatttagactacaatgga\n+# '..b'gt\n+# tttcgtgttggacgaatattgcgctcgctatggtgtgcggggatgctaccgacatttatgctacctttctgatttactggatcgtgcagaaaagcaac\n+# acatgatagatccaacactaattcactattcatttgcgttttgcgcaagccacgttcacggaaatcgacctgatggggtaggaagcattacgcatgag\n+# gaaaaggaaaaattttctgaaatcaaagaacgcctacgtcagttactggagtttcaaataaccaattttagatactgttttcctttcggtcgccccga\n+# aggcgctcttaaagcgacattatctttactagagagagtgctaatgaaagacattgttacccctgttccacctgaagaagttcgtcaaatgattaaaa\n+# aaagtttagagacggcagcgcttgtaaattacacccgtctctccaataaagctaagattgaaggcacttttccgttcaagggacacgtgccagggaaa\n+# tcctatcggaatttcaaaatttttccaagcactttcctgtacacgggaaacgtcccagggaaagcctatcggaaaggtcccagggaaatcccgtcgga\n+# tattcaggatttgcgaggagaggttattgttccgcccccaaaaaaactagaggacctaattcacttagcagaactttgtgttgatctgttgcaacaaa\n+# atgaagagcactatggagaactgcgcaaacatgacaaaatggataaaattaaaatgcgtaaggaagatgatgatgtaccaaaaggccacaatgaaagc\n+# 
gatattgatttaaccgccaatactggactcagtagcacatcagacctggcttctgcagcatcaactaatggatcgtcatttcgttattataatttgag\n+# gaatgggcgttttcatcagcacctgcgagacacattcgcaccattagtcgtgcggtacgtggatctgatggaatcttcaatagctcagtcgattcata\n+# agggatttgaaaaagaacgctgggaaagtaaagggaacggatgtgccacctctgaagacttattttggaaactagatgctctacagtcgtttataaga\n+# gacctgcactggccagacgcagagtttcgacaacatttagaacagcgtcttaaaatgatggccgtcgatatgatagagcaatgtatacaacgaactga\n+# ttcgtcttttcagtcgtggctaaaaaaaaacattgccttcatatcaactgattatattttaccttcagaaatgtgcgctatggtcaatgtgatattag\n+# atgctaaaaatcaaagctttaaattgactactattgacggcattgatttgtataaatttcatgcaaaaattgacgaccaaatcgacaaagcgaatgta\n+# gctatgacacaaggtctaactggtaaacttatgtcagtgctagagtcgactttgtcaaaattagcacgatacgacgaaggtagcctaatcggctcgat\n+# tcttagttttacaaatgtatcgagctcgggaaaggatctcgggcaaggatatgtaaatttctttagaaataatatggatcaagtacgaggaaaaattg\n+# gcgacgatttatggaccctgaatttctttgagcagtggtactcgcagcagattaacatgctatgtaattggctttcggaacgtttggaccacgctctg\n+# cactacgctcaagtttcatctatttctcacattatcaagaaaatatattcagacttcgaattacaaggtgtattagaagataaattaaactctaaagc\n+# atatcaagcagtcgcacagcgaatggcgacagaggaagcgacatgtgctttgacaatgcctgatgttagcgaagatgaaccctgtgacgacattcgag\n+# aaggggaagaagaagatactggcgacgaatctacctctaacataccaaggggcttaccaaaaccaaaaattgctgccgctcaagctgctgctgttacc\n+# aacgttgttgccggccgtgtgggtaatttactcggcaaaggcattggcggccttagttcaaagttgggaagtggaagttggttttaa]\n+# protein sequence = [MIDPSSSEEEGEDDPIANVSSKGRLTHAPKGTNTVSILGGVSGPGVGSNMAISGSNGDLAGNQRQSNISSISNRNDAG\n+# NVAGVGGSSNKNEQIHGSRVDGGNLEVPNSCIPSGVSQETLNQSIGSSRANSLPRPLSPSPSLTSEKPDTGDPHAFLKGETQIMADEAFQNAVQSYHD\n+# VFLKSERVLKMVQSGASSQHDFREVFRNNIEKRVRSLPEIDGLSKETVLTSWMAKFDIILKGTGEEDSKRPSRMQQSLNSELILSKEQLYDMFQQILL\n+# VKKFEHQILYNALMLDSADEQAAAIRRELDGRMQRVGEMEKNRKLMPKFVLKEMESLYVEELKSSINLLMANLESLPVSKGNMDSKYGLQKLKRYNHR\n+# KLILRSHGSLSKLEGDSEDGSTQLTKLDVVLTFQLEVIVMEVKGLKSLAPNRIVYCTMEVENGEKLQTDQAEASKPMWDTQGDFTTTHPLPVVKVKLY\n+# TENPGMLALEDKELGKVILKPTPLSSKSPEWHRMVIPKNLPDQDIRIKIACRLDKPLNMKHCGYKEKKSEPSEMMQLDGYTVDYIEAASANLMFGIDL\n+# 
NGGRFFFNAVREGDSISFACDDENECSLWVMAMYRATGQSHKPTPPITQDKNSAMSKIQGARVAPDGSIFLWASFFVAAATRNSSSYHWFRVGGRLNP\n+# MVVSAAARMEWDMCAQSPLASTWRGIGWWSSSERGQPYDLVDVEVPKSGATHYHVSCRGEVNQPETVVRDGLMEAESTDGGVKDAFATELCVEVPEDK\n+# LHVVVWGWFSPGQVFVLDEYCARYGVRGCYRHLCYLSDLLDRAEKQHMIDPTLIHYSFAFCASHVHGNRPDGVGSITHEEKEKFSEIKERLRQLLEFQ\n+# ITNFRYCFPFGRPEGALKATLSLLERVLMKDIVTPVPPEEVRQMIKKSLETAALVNYTRLSNKAKIEGTFPFKGHVPGKSYRNFKIFPSTFLYTGNVP\n+# GKAYRKGPREIPSDIQDLRGEVIVPPPKKLEDLIHLAELCVDLLQQNEEHYGELRKHDKMDKIKMRKEDDDVPKGHNESDIDLTANTGLSSTSDLASA\n+# ASTNGSSFRYYNLRNGRFHQHLRDTFAPLVVRYVDLMESSIAQSIHKGFEKERWESKGNGCATSEDLFWKLDALQSFIRDLHWPDAEFRQHLEQRLKM\n+# MAVDMIEQCIQRTDSSFQSWLKKNIAFISTDYILPSEMCAMVNVILDAKNQSFKLTTIDGIDLYKFHAKIDDQIDKANVAMTQGLTGKLMSVLESTLS\n+# KLARYDEGSLIGSILSFTNVSSSGKDLGQGYVNFFRNNMDQVRGKIGDDLWTLNFFEQWYSQQINMLCNWLSERLDHALHYAQVSSISHIIKKIYSDF\n+# ELQGVLEDKLNSKAYQAVAQRMATEEATCALTMPDVSEDEPCDDIREGEEEDTGDESTSNIPRGLPKPKIAAAQAAAVTNVVAGRVGNLLGKGIGGLS\n+# SKLGSGSWF]\n+# end gene contig70.g117\n+###\n+# command line:\n+# augustus --strand=both --noInFrameStop=false --gff3=on --uniqueGeneId=true --protein=on --codingseq=on --introns=off --stop=off --stop=off --cds=on --singlestrand=false /home/galaxy/galaxy/database/files/000/dataset_283.dat --UTR=off --genemodel=complete --species=fly\n'
b
diff -r 000000000000 -r 8b19a698d90e test-data/rename_HISAT.bam
b
Binary file test-data/rename_HISAT.bam has changed
b
diff -r 000000000000 -r 8b19a698d90e test-data/rename_StringTie.gtf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/rename_StringTie.gtf Mon Jun 25 15:01:41 2018 -0400
b
@@ -0,0 +1,11 @@
+# stringtie /home/galaxy/galaxy/database/files/000/dataset_328.dat -o /home/galaxy/galaxy/database/files/000/dataset_332.dat -p 1
+# StringTie version 1.2.3
+scaffold_16 StringTie transcript 1751 17824 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; cov "14.618678"; FPKM "322160.531250"; TPM "866155.937500";
+scaffold_16 StringTie exon 1751 1897 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "1"; cov "6.787892";
+scaffold_16 StringTie exon 11285 11463 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "2"; cov "19.860081";
+scaffold_16 StringTie exon 11518 11705 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "3"; cov "23.926477";
+scaffold_16 StringTie exon 11759 11858 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "4"; cov "17.452721";
+scaffold_16 StringTie exon 11922 11975 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "5"; cov "11.461867";
+scaffold_16 StringTie exon 12601 12811 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "6"; cov "11.876496";
+scaffold_16 StringTie exon 17222 17337 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "7"; cov "15.915709";
+scaffold_16 StringTie exon 17406 17824 1000 - . gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "8"; cov "11.738873";
b
diff -r 000000000000 -r 8b19a698d90e test-data/rename_TrfBig.bed
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/rename_TrfBig.bed Mon Jun 25 15:01:41 2018 -0400
b
b'@@ -0,0 +1,602 @@\n+scaffold_1\t9130\t9428\ttrf\t163\t1.8\t164\t86\t2\t438\t36\t12\t13\t37\t1.82\tAAAAAAAATTATATCTTCGGTGTTTTTCAACATACAACCTCCTAAGCTTGGAAATAACATTTCTTAATCAGTTCTGAATTTCGAATTAAATTTTTATCAAAATCGGACAACTATACCATATAGCTGTCATAGGAAGGATTGGATAATTAGTGGTAAAATAATAT\n+scaffold_1\t15707\t15757\ttrf\t20\t2.5\t19\t83\t9\t55\t32\t12\t2\t54\t1.49\tTATATCATTTATATCTCAG\n+scaffold_1\t16261\t16302\ttrf\t12\t3.4\t12\t89\t0\t64\t2\t36\t24\t36\t1.69\tTCCGTCTGTCCG\n+scaffold_1\t23387\t23483\ttrf\t45\t2.2\t45\t92\t1\t158\t19\t22\t30\t27\t1.98\tTCGGCGAAGAAATGTGCCACTTCGGCGGCACTTCTTGGAGTCACT\n+scaffold_1\t23451\t23520\ttrf\t24\t2.9\t24\t80\t0\t75\t15\t26\t27\t30\t1.96\tTTCGGCGACACTTCTTGAAGTCAG\n+scaffold_1\t24200\t24233\ttrf\t15\t2.2\t15\t94\t0\t57\t51\t12\t15\t21\t1.75\tAAACAATGGAATGCT\n+scaffold_1\t29159\t29628\ttrf\t162\t2.9\t160\t80\t8\t518\t37\t12\t11\t38\t1.80\tGGAAAACATGAAATAAAAATTATATCTTTCGTGTTTTTTAACATATACCTTCTAAGCTTGAAAATAACATTTTTTATTTGTTCTGAATTTCGAATTAAATTTTATCAAAATCGGACGACTATATCATATAGCTGTCATAGGAACAATCGGAAAATAAGTA\n+scaffold_1\t37571\t37606\ttrf\t8\t4.4\t8\t88\t0\t52\t31\t25\t42\t0\t1.55\tGACGGACA\n+scaffold_1\t38436\t38491\ttrf\t8\t6.9\t8\t79\t8\t58\t0\t38\t27\t34\t1.57\tTGTCCGTC\n+scaffold_1\t38436\t38491\ttrf\t12\t4.6\t12\t81\t0\t65\t0\t38\t27\t34\t1.57\tTGTCCGTCCGTC\n+scaffold_1\t38436\t38491\ttrf\t20\t3.1\t18\t80\t17\t69\t0\t38\t27\t34\t1.57\tTGTCCGTCTGTCCGTCCG\n+scaffold_1\t43116\t43168\ttrf\t2\t26.0\t2\t96\t0\t95\t48\t0\t1\t50\t1.12\tTA\n+scaffold_2\t540\t590\ttrf\t20\t2.5\t19\t83\t9\t55\t32\t12\t2\t54\t1.49\tTATATCATTTATATCTCAG\n+scaffold_2\t1094\t1135\ttrf\t12\t3.4\t12\t89\t0\t64\t2\t36\t24\t36\t1.69\tTCCGTCTGTCCG\n+scaffold_2\t8220\t8316\ttrf\t45\t2.2\t45\t92\t1\t158\t19\t22\t30\t27\t1.98\tTCGGCGAAGAAATGTGCCACTTCGGCGGCACTTCTTGGAGTCACT\n+scaffold_2\t8284\t8353\ttrf\t24\t2.9\t24\t80\t0\t75\t15\t26\t27\t30\t1.96\tTTCGGCGACACTTCTTGAAGTCAG\n+scaffold_2\t9033\t9066\ttrf\t15\t2.2\t15\t94\t0\t57\t51\t12\t15\t21\t1.75\tAAACAATGGAATGCT\n+scaffold_2\t13992\t14461\ttrf\t162\t
2.9\t160\t80\t8\t518\t37\t12\t11\t38\t1.80\tGGAAAACATGAAATAAAAATTATATCTTTCGTGTTTTTTAACATATACCTTCTAAGCTTGAAAATAACATTTTTTATTTGTTCTGAATTTCGAATTAAATTTTATCAAAATCGGACGACTATATCATATAGCTGTCATAGGAACAATCGGAAAATAAGTA\n+scaffold_2\t22404\t22439\ttrf\t8\t4.4\t8\t88\t0\t52\t31\t25\t42\t0\t1.55\tGACGGACA\n+scaffold_2\t23269\t23324\ttrf\t8\t6.9\t8\t79\t8\t58\t0\t38\t27\t34\t1.57\tTGTCCGTC\n+scaffold_2\t23269\t23324\ttrf\t12\t4.6\t12\t81\t0\t65\t0\t38\t27\t34\t1.57\tTGTCCGTCCGTC\n+scaffold_2\t23269\t23324\ttrf\t20\t3.1\t18\t80\t17\t69\t0\t38\t27\t34\t1.57\tTGTCCGTCTGTCCGTCCG\n+scaffold_2\t27949\t28001\ttrf\t2\t26.0\t2\t96\t0\t95\t48\t0\t1\t50\t1.12\tTA\n+scaffold_2\t38280\t38311\ttrf\t16\t1.9\t16\t93\t0\t53\t41\t19\t6\t32\t1.77\tTACATACATACATATG\n+scaffold_3\t3265\t3296\ttrf\t16\t1.9\t16\t93\t0\t53\t41\t19\t6\t32\t1.77\tTACATACATACATATG\n+scaffold_3\t17933\t17958\ttrf\t10\t2.5\t10\t100\t0\t50\t60\t8\t0\t32\t1.26\tATATAAACAT\n+scaffold_3\t19067\t19124\ttrf\t28\t2.0\t28\t100\t0\t114\t43\t14\t10\t31\t1.79\tAATTAAATTTTATCAAAATCGGACGACT\n+scaffold_3\t23368\t23418\ttrf\t2\t25.0\t2\t100\t0\t100\t50\t0\t0\t50\t1.00\tAT\n+scaffold_3\t24889\t25322\ttrf\t160\t2.7\t161\t80\t6\t452\t36\t12\t12\t38\t1.82\tAATATTAAAAATTATATCTTTGGTGTTTTTTAACATATAACCTTCTAAGCTTGGAAATAACATTTTTTATTTGGTTTAATTTCGAATTAAATTTTATTAAAATCGGACGACCATATCATACAGCTCCCATAGAAACAATCGGAAAATTAGTCGGAAACATG\n+scaffold_3\t26816\t26900\ttrf\t18\t5.0\t16\t83\t13\t89\t20\t5\t0\t73\t1.03\tTTTTTTTATATATTTT\n+scaffold_3\t26816\t26887\ttrf\t18\t4.1\t17\t84\t12\t90\t19\t4\t0\t76\t0.96\tTTTTTTTATATATTTTT\n+scaffold_3\t26816\t26900\ttrf\t15\t5.2\t15\t79\t16\t71\t20\t5\t0\t73\t1.03\tTTTTTTTATATATAT\n+scaffold_3\t26820\t26887\ttrf\t17\t3.7\t19\t80\t20\t74\t20\t4\t0\t74\t0.99\tTTTATATATTTTTTTTTCA\n+scaffold_3\t29468\t29515\ttrf\t25\t2.0\t23\t84\t12\t60\t34\t0\t17\t48\t1.47\tATTATAATTATGATGTTATGATG\n+scaffold_3\t38756\t38791\ttrf\t10\t3.6\t10\t92\t7\t63\t40\t0\t0\t60\t0.97\tATTTATTTAA\n+scaffold_3\t38758\t38788\ttrf\t9\t3.2\t9\t95\t4\t51\t40\t0\t0\t60\t0.
97\tTTATTTAAA\n+scaffold_4\t7931\t7956\ttrf\t10\t2.5\t10\t100\t0\t50\t60\t8\t0\t32\t1.26\tATATAAACAT\n+scaffold_4\t9065\t9122\ttrf\t28\t2.0\t28\t100\t0\t114\t43\t14\t10\t31\t1.79\tAATTAAATTTTATCAAAATCGGACGACT\n+scaffold_4\t13366\t13416\ttrf\t2\t25.0\t2\t100\t0\t100\t50\t0\t0\t50\t1.00\tAT\n+scaffold_4\t14887\t15320\ttrf\t160\t2.7\t161\t80\t6\t452\t36\t12\t12\t38\t1.82\tAATATTAAAAATTATATCTTTGGTGTTTTTTAACATATAACCTTCTAAGCTTGGAAATAACATTTTTTATTTGGTTTAATTTCGAATTAAATTTTATTAAAATCGGACGACCATATCATACAGCTCCCATAGAAACAATCGGAAAATTAGTCGGAAACATG\n+scaffold_4\t16814\t16898\ttrf\t18\t5.0\t16\t83\t13\t89\t20\t5\t0\t73\t1.03\tTTTTTTTATATATTTT\n+scaffold_4\t16814\t16885\ttrf\t'..b'ATAACCTCCTAAGCTTGGAAATATCATTTTTTAATTGATTTTGAAATTCAAATTAAATTTGATCAAAATCGGACGACTATATCATATAGCTGTCATAGGAACGATCGGAAAATTGGTGGAAAAATAATATGAAACAAATTATAG\n+scaffold_69\t18536\t18888\ttrf\t163\t2.2\t161\t85\t4\t472\t36\t9\t16\t37\t1.82\tTTGGAAATACAATTTTTTATATTTATGAAATTCAAATTAAATTTGATCAAAATCGGACGACTATATCATATAGCTGTCATAGGAACGATCGGAAAATTGGTGGAAAAATAATATGAAACAAATTATAGCTTTGGAGCTGTTTGACATATAACCCTATAAGA\n+scaffold_69\t19781\t19812\ttrf\t15\t2.1\t14\t94\t5\t53\t58\t0\t0\t41\t0.98\tATATAATTATAATA\n+scaffold_69\t23637\t24060\ttrf\t162\t2.7\t156\t83\t6\t496\t37\t11\t12\t38\t1.79\tAAAAAAATTATATCTTCGGTGCTTTTTAACATATAACCTTCTAAGCTTGGAAATAACATTTTTTAATTAGTTCTGAATTTCAATTAAATTTTATCAAAATCGGACGACTTATAGCTGCCATAGGAACGATCGAAAAATTGATGGGAAAATAAATAT\n+scaffold_69\t36863\t36892\ttrf\t15\t1.9\t15\t100\t0\t58\t27\t20\t48\t3\t1.66\tGGGGAACGCGAGCAT\n+scaffold_69\t38645\t39124\ttrf\t158\t3.0\t157\t85\t5\t615\t34\t13\t13\t38\t1.84\tTAAAAATTGTTATTTCCAAGCTTAGAAGGTTATATGTTAAAAAACACCAAGATATAATTTTTTCATATTTTCCGACTATTTTTCCGATCGTTTCTATGGCAGCTATATGATATAGTCGTCCGATTTTGATAAAATTTAATTTGAAATTAAAACCAAT\n+scaffold_69\t43653\t44084\ttrf\t162\t2.7\t162\t87\t4\t586\t40\t10\t13\t35\t1.79\tAACATTTTTTAATTAGTTCTGAATTTCGAATTAAATTTTATCAAAATCGGAAGACTATATCATATAGCTGTCATAGGAACGATCGAAAAATTGGTGGAAAATAATATAATAAAAATTATATCCTTGGTATTTTTTAACATATAACAATATAAGCTAGAAAAG\n+scaffold_70\t6910\t6939\tt
rf\t15\t1.9\t15\t100\t0\t58\t27\t20\t48\t3\t1.66\tGGGGAACGCGAGCAT\n+scaffold_70\t8692\t9171\ttrf\t158\t3.0\t157\t85\t5\t615\t34\t13\t13\t38\t1.84\tTAAAAATTGTTATTTCCAAGCTTAGAAGGTTATATGTTAAAAAACACCAAGATATAATTTTTTCATATTTTCCGACTATTTTTCCGATCGTTTCTATGGCAGCTATATGATATAGTCGTCCGATTTTGATAAAATTTAATTTGAAATTAAAACCAAT\n+scaffold_70\t13700\t14131\ttrf\t162\t2.7\t162\t87\t4\t586\t40\t10\t13\t35\t1.79\tAACATTTTTTAATTAGTTCTGAATTTCGAATTAAATTTTATCAAAATCGGAAGACTATATCATATAGCTGTCATAGGAACGATCGAAAAATTGGTGGAAAATAATATAATAAAAATTATATCCTTGGTATTTTTTAACATATAACAATATAAGCTAGAAAAG\n+scaffold_70\t17962\t18295\ttrf\t161\t2.1\t160\t83\t5\t413\t37\t12\t13\t35\t1.84\tAAAAAATTATATCTCTGGTGTTTTTAAACATATAACCTCCTAAACTTGGAAATAACATTTTATAATTAGTTCTGAATTTCGAATTAAATTTTATCAAAACCCGACGACTATATCATACATGTAACTGTAACGATCGGAAAATTGATGGGAAAATAATATG\n+scaffold_70\t19030\t19306\ttrf\t137\t2.0\t137\t94\t1\t482\t39\t13\t13\t34\t1.83\tTTTAACACATACCTTTCTAAGCTTGGATATAACATTTTTAAACTGGTTCTGAATTTCAAATTAAATTCAATTAAAATCGGACGACTATATCATATAGCTCCCATAGGAAAAATCGGAAAATTAGTGAGAAAATAATA\n+scaffold_70\t22269\t22308\ttrf\t19\t2.1\t19\t100\t0\t78\t58\t15\t15\t10\t1.62\tAACTAAGGAAATACCAGAA\n+scaffold_70\t22812\t23252\ttrf\t162\t2.8\t156\t84\t5\t562\t37\t11\t13\t37\t1.81\tTTCTAAGCTTGAAATAACATTTTTTAATTAGTTCTGAATTTCGAATTTAATTTTATTAAAATCGGACGACTATATCATATAGCTGCCATAGGAACGATCGGAAAATTAGTGGAAAATAATAAATAAAAATTATATTTGTATTTTTAACATATAACC\n+scaffold_70\t23421\t23486\ttrf\t13\t4.7\t13\t70\t20\t51\t38\t0\t0\t61\t0.96\tATATATATAATTT\n+scaffold_70\t23426\t23479\ttrf\t7\t7.4\t7\t79\t12\t54\t35\t0\t0\t64\t0.94\tTATATTT\n+scaffold_70\t23430\t23486\ttrf\t27\t2.0\t27\t83\t10\t69\t35\t0\t0\t64\t0.94\tATTTATATATTTATTAATATATTTTAT\n+scaffold_70\t25576\t25606\ttrf\t12\t2.5\t12\t94\t0\t51\t33\t26\t36\t3\t1.73\tACGGACGGACAG\n+scaffold_70\t27263\t27382\ttrf\t63\t1.9\t63\t85\t3\t168\t27\t25\t21\t26\t1.99\tATTTTTCCAAGCACTTTCCTGTACAAGGGAAACGTCCCAGGGAAAGCCTATCGGAATTTCAAA\n+scaffold_70\t27353\t27406\ttrf\t25\t2.1\t25\t85\t0\t70\t30\t26\t32\t11\t1.91\tGGAAACGTCCCAGGGAAAGCCCATC\n+scaffold_70\t
27848\t27878\ttrf\t12\t2.5\t12\t88\t0\t51\t30\t30\t40\t0\t1.57\tACGGACGGACAG\n+scaffold_70\t35504\t35713\ttrf\t102\t2.0\t102\t99\t0\t409\t37\t12\t13\t36\t1.82\tAAAACGATGGTAGACAAATATGCATATATTTTTTACACAAAACGAAATATAATGGACTTTTAAAAATTCTTTTTTCTATCTTTCCTGGTGGGAGATATATAT\n+scaffold_70\t43333\t43446\ttrf\t57\t2.0\t57\t94\t0\t199\t30\t17\t22\t29\t1.97\tAATATTGGGAATAACATATTATCTTATAATATGGGAGCGCGAAGGCTCCTCGCCCAT\n+scaffold_70\t44242\t44281\ttrf\t7\t5.7\t7\t81\t6\t53\t28\t20\t12\t38\t1.89\tTACATGT\n+scaffold_70\t44241\t44281\ttrf\t13\t2.9\t14\t85\t7\t55\t27\t22\t12\t37\t1.90\tCTACATGTTACATG\n+scaffold_70\t44485\t44531\ttrf\t14\t3.3\t14\t84\t0\t65\t41\t21\t10\t26\t1.86\tAACCGTATATGACT\n+scaffold_70\t45147\t45181\ttrf\t16\t2.0\t17\t88\t11\t52\t52\t0\t2\t44\t1.16\tAAATATTAGTAATATAT\n+scaffold_70\t46706\t46990\ttrf\t147\t1.9\t147\t100\t0\t568\t39\t10\t9\t40\t1.72\tTTCTTTATTTTTTTTATTTTAAAATACTTAGTACTTAGTAATGTCGCTAAAACCAATATAATATTCTTTAAAATTTAGAAAATATATTCAGACTTCGAATTACAAGGTGTATTAGAAGATAAATTAAACTCTAAAGCTTAATTTATC\n+scaffold_70\t53900\t53978\ttrf\t28\t2.8\t28\t80\t5\t97\t15\t43\t5\t35\t1.69\tCTCTGTCACCCTCTCTTTACCTACCTCA\n'
b
diff -r 000000000000 -r 8b19a698d90e test-data/rename_sequence_cov.bigwig
b
Binary file test-data/rename_sequence_cov.bigwig has changed
b
diff -r 000000000000 -r 8b19a698d90e test-data/renamed_reference.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/renamed_reference.fasta Mon Jun 25 15:01:41 2018 -0400
b
b'@@ -0,0 +1,66784 @@\n+>scaffold_1\n+AAAACTAATTTTATCAAAATCGGACAACTATATCATATAGCTGCCATACG\n+AACGATCGGAAAATTGGTAAGTAAATAATTAAAAATATTATATCTTTGGT\n+GTGTTTTTGGAAATAACATTTTTTAATATGTTTTGAATTTTGAATTAAAT\n+TCTATCAAAATCGGACGACTATATCATATAGCTGCCATACAAACGATCGG\n+AAAATTGGTGAATAAATAATATGAAAAAATTATATCTTTGGTTATTTTTT\n+AGACAAATAACCTCCAACGCTTGGAAATAACATTTTTTAATTAGTTATAA\n+ATTTGATATTTTAATTTTATCAAAATCGGACGAATATAGCATATAGCTGT\n+TAAAATAATATGAAACAAATTATAGCTCCGGTGTTTTTTACATATTATCT\n+TATACTATTGGGAAAATAGTTTATTATATTTTAAAGAATTTCCAATTAAA\n+CTCTAACATATAGCTTTCAAAGAAACGGTCAAAAAAGTAAAGAAATCATT\n+TTTTTTTAACATCACTGAAGCTAGAAACAATCCTTAAAAATGTAACATGG\n+TGTTAGTAGCATTGAAAATTGCTTATAACTGCAAAGGGAAAACAAACATC\n+GGCTTGCCGAATGTAATTTCCATTCTTGTTTGACTTGAGTTTATAACTTA\n+CAATTATGGTAAGGTGCCTGATTTTGGTTTTTGCCATACGGTATGTGGTA\n+GTTATCATTTTGCCGTGCTATAAGTGACATCACAGCCGATTCTTTTACTC\n+CATAATGGGCCAATGTGTTGAGGCGTTTCCATCCATTTATTGTTTTTGTA\n+GTTAGGTCTTCATCTTGTAATGTGAGATGACCTCCTCTTCCATGCCTCCA\n+TTCTAAGTCAACTTCGTGCACAGATGGTCTCATAGAAAACGGAGTATTTT\n+TAAAAATTGCGTCCAAAATTTTTAATTTAACTTGCGATATGGTATCCAAA\n+TCGTTTACACGACATTGGACTTTTTCATCAAGATCATCTTGTAAAATGTG\n+CAAAATTACAACAGAATGGGTAACTTGTTCGTGGAGAAGTCGTTCCTCTG\n+AAAGTGAATAACGAGCATCGTGGGTTATTGCGTCCACCAAACCCTTTTCA\n+ATTTGATGCTTAATTGCCTTGAACAGCAAAAATAAATTAGATCCAGCATA\n+TTCTTTTAGGTAGTCGTACATACAAATTGCTAAGTAGTTTGTTAACATTT\n+TTTCAACTACGCTCTCAGTGCGTCGTAGCATTAGCTGAGGATGCTTGCTG\n+GCGAGCGATTTGTCAATTAATCGCAATAAAAGGGACTTTAAAATTTCCGT\n+CGCATATTCCATTTTGTTCATTAGAACAACCATAAGTAAAGAGGCGACGT\n+TAACTCGATCGCGAATTGAGAAAGATGACCGTTGAGCTTCTAAAGTTTCT\n+ATGAACAATAGTAAAAAATATTTGTTTCCAATAAGTTGCTCGAATTGTAT\n+CATAGCTGCATCATAGTTAGTGTGCGGGCTACTTCCACAAAATTTTCGGG\n+AGTTTAGAATAGGATGATCTGATACACCGGGAAAGAAAACTTTCATAATG\n+TAATTGACGTGATCTAACGTTGGTATACCGGTGCTCTCCAAATCTGCTGT\n+TAGATCGGTCATGTCCGTTTGGAGCTCAGCAAATGCCTGTTTACACTCAG\n+AACGAACGTTGCTTTCCAATGTTATCATCTGTATCTGAATTCGTTTGTAT\n+TCCCGTTCTGCTTGGGTCGATTTCCTTCTAAATATTATTAGTACGACAAC\n+CAAAACGATGACAAGCACTGCAACTGTCAATATAACGACAAACATGGCAT\n+GTGAAAAAACATAGGGTTTATTTAAATCATATTTCAAATATCCTATGGCG\n+A
AACGAAGATTTCGCCCTACTTTAACCACAACTAGAGGTAAATCTGTCGA\n+TTGATCCACACCATTTTCATCAGTTGGGAGTGGTTGATGTTCCGGTGGAA\n+TGCACAAAAGTTGAGTTAGTGTAAGGCTTGTTATATTGCATTGAGTAGTA\n+CCAATGGTTACATTAACGTCGTATTCATCAGCTGCCAAATTTAGTAGCTC\n+GCCTTCAATAACCAAGCTGTCACCCTTGTATAGTTTAATTCCGTCATTTG\n+GAAATGGTAAATATTTTGGATCGGCTAAATAAACAATAGTGCTCCTGATA\n+TCATGAAAGTATTTATTTAGATCTCGAACAAGCTGTACATTGTCCATTAC\n+AAAACTAAGTTGTAAATTCAGTTGCGTTTCATGGACCTTTACAAAAGTTG\n+TAACATCCATATTATTATTGACGAAATAGCTAGGCGCAGTTCCCCCTGTT\n+GTGTATATATGAAAGTTGTCTACGAAGTCTGCTTTTCGCTTTCGTCTAGA\n+ATATTCGTTCTGATGCGCACTTTCATTTTTAAAGTCAAATTCCGAATCCA\n+TCACTCTGTTAGAACTTTTAAATGCTTGAAATTTATCATTTACCGGAGGA\n+GATGGGCATTCCATTTGATTTGAATTGATTACTACGCAAGATGTTTTGTT\n+TACTCTTTCATTATCAAAAAAAACTTCAAGTTCAGGCTTTTGAATTGAAT\n+TAAGATACATTCCATGAACGGTCAGAACGCGACCACCACTTACAAAACTG\n+CGTAAAGGCTTAATCTGCATTATACGCGGGTCTTGGGTATAGTTAAAAAT\n+AGAACAGGGCTGCCTTGGTAACGTACGAAATTGGTATGAACCGAAATTAC\n+TTCGAGTTAGATTTTTATTGGGTATAGTTGCGGGTGAGATATGACATTCT\n+AAAGTTCGGTTGGCACCGTCAATAAGAAGGTGTAGAGACCGTATTGGTTC\n+TGGCTGGGTCGCCTCTGATGTAGTACTACTAACTTGAGTTGAAGAAGCTT\n+GTGTAACGTTTATATGACACTCGTACTCATCTAAATATGCTCGCATGGTT\n+GATCCAATGTTCAAAAACTTTCCTATTAACGACAATTGTGTTCCTCCCGA\n+CCTGGGCCCAATCGTGGGATATAATCCTGTTAGCAAAACATTCTTAAAGT\n+GAAATTGTACACTAGATTCAGTATACCCTGCATCATTTGCAACCTTTATA\n+GGCGCTGACATTTCATACATCACTGCTCCAGTGCGGCATTCGATCTTTAC\n+AGAAATTTGGTAGTTGACTAGTTCACAAGGCACAGACCCAATAAATATTT\n+TTCCACGCACATCTCCTTCGCGAATGCCCAAATTACTGCCTTCAATTGTA\n+ATAAGGGTACCACCCTCAATAGGTCCAGATAACGGTTTAATAATATCGAT\n+CCTTGGTAAAGGGCACTCGTTTTCTTTAGTTGTTTTTGATCCTGCACTAA\n+TAGCACGATCACTGTCTGCTATGCAAGTCTCGTTATATACACATGAGTTG\n+CTGCACCAAGCACATTGGTATTTTGGATCACGAGTGACACACAAACTGCA\n+ATCAGCATGATCCCGATGTGAGCCCAGTACGTCGCATTTATATAATGTAA\n+CAATCGCCGTGTCCACATAGTGCTGGAAATTCCATGTAATTACAACCTTT\n+GCTTGGTATTCATGTGTATTAGTCTCGTAGAAATAAGGTGTTTTTTCACA\n+AACAACAATCTTGTTTGACTCAATGTGGGCAGGCAATAGCATCTGAGCAG\n+CTTCAATATGAACTGTACACAAGAATCCAGCGTGAGCGCTTTTGGGTTTT\n+GGTAAGTTTTCTATCTCTAAACGAATTTCTTTTGGCACCCGCACCGGTAA\n+AAGAATCGCCGGACGATTGCTTTTTAAATGGGGGCATTGA
CCAACACTAG\n+TTACCGAATTTTCTATATTACGACATTGTATTGATTGATGGACACATTTA\n+TTGTCAAAAATAC'..b'CCACTGGACCCGTTGGATAGCGTC\n+GGCACTTTTCTGTTTGGTGCCATTCACTGGTCACTAGTAGGACCGCTCTG\n+CCTATTAAAATAGGAGTGCTGCTTAGAATTTATTTCAGCAAGACAGCCGT\n+AAGATATATATGAATAGTATTTAACGGCAGTGGCAGAGGCCTTTACAATA\n+TAAGGCTTTACGGGATTTTAAACAATGAAAAACAAAAATATTTTTATAGA\n+GTCGAGATAAAATACTTTTTACAATAAATACTAAGTATTTTTAAAAGATA\n+AAAATATTTAAAAGTAAATACTGAATATTTTAACAGGTGTTAAGTACTGG\n+GAACTGTGACTAAGGACGGCGGTATATCGCTACCATAATATTTTTAAAGG\n+AACTGAATACTGAAAGATGTGACCAAAATGGTAGAATATCGCTAACGAAA\n+ATCACAGACGCAAATATCGATAGTGGCCTAGAGACCCGATATCGCCGCCG\n+TGATTATCGATGAAACTACAGCTGAGCTGCTTGTTTACATTCTAAAGTTA\n+AAATTTTTAAAAATTTCCAATACAAAAAAAAATTCTTCGTATTAACACGG\n+CTGTTTGCCGGTAAGATCTGAAGTGGATTCAAGTTGCAGCACCCTCAGGA\n+AAAGAATAAATTATTATAATATAATAATATAATATAAAGAATTTAAATTC\n+GAACCAAACGCGGTATGTCACTCTTCATTTAGAGAATTTGTGGCTTTGTT\n+TTGTACAAAAAACTATTCTTTTTTCTTGAAAATTAGCATCAAGAATTTAT\n+TGCCAAAACAGAACGCAATTCTGCTAAATCTGGTTACCCTGCCAAATGGC\n+TGGCCGTTCTGTGCATTCAATAACACAAGCTAACGGCTTACGGCACATTC\n+GGAAAGATCCAAAAGAATTTCTATTCCGGCATTTTTTATGTATTATCGTC\n+CAATTTTTGTATGTGTATTCATTCTTTTGGCTGTCCGTTATTAAGCTTTT\n+CTTATCCACATAAGCTGACCAGCTGCCAAAAAGCCGACCGTTTTGTGCAG\n+CCAATAACCCAAGCTAACTATCAACAGCAATTTCGAAAAATCCAGAAGAA\n+GCTATCCTTCGGCAATTTTTTCTTATATTATAATTTTTTTGTCACAATTT\n+TTTGTCAAAAAATCGACAATAATTAAGTGTTTACATTTTAATGCGATTTA\n+ATTGGAAATTTGAATTCGAATCAAACGCGGTGTCACTCTACATATGGACA\n+ATTTGTGGCTACAAAATTAGTTGAAAGTGCATGTTTTTTTTTAAGTGAAA\n+TAAAACAAAAACAGCAATAACAGGCCAAAATGTTGTTTTATAAATAAATA\n+CTTACATATCCGCATATAAATATGAATGAAAAAAAAAACAGCAAGACTGG\n+GCCAAAATATTGTTCTTTAATATGTAAATAAATACATATCTACATATACA\n+TATGTGGACAAAAGTGTTAAAATTAGTTAATAGTGCATGTTTTTTAAATG\n+AAAAAATAAAACAAAAAAAGCAAGCAAATATAAATTATATTCCACACACA\n+TTTACAATAATTTCAAACTACGCTAAAAATACCCAACAGAAAAAACATAG\n+AAAGGTAAACAAAATACAAGAATATCAAAAAAAATCTAATTTTCACGTTG\n+TTGTGGCCGGTACCACCGGTCATACATACATATAGATACATATTTAGATT\n+CTCACAAAAAGAATAGAAAATTACCGCTAATTTCCTTATATACGTTTTTG\n+TTTTCAGTGTTTTGAAATAGTATTTTTCAAACAAAAAACAATACAAAAGG\n+GTTAAAAAAATTGTTCGATTGGCTTTAACATACT
AATTAAAAAAAATCAC\n+AATTTTTTGGCAAAATATCGAAAAAAATTAAGTGTTTACATTTTTATGCG\n+AATTATTTGGAAATTTAAATAAGAACCCAACGCGGTTTGTCACTCTACAT\n+ATGGACAATTTGTGGCTTTGTTTTGAACAAAAAATGAATTTTTTTTTACT\n+CAAAATTAACAAGAAGAAACAGTAATGCGGGTTTTGATCGCAATTCTGCT\n+AAATCGAATTTCCGTGCCCAAAGGCTGACCTTTTTGTGCAGCAAATAGCC\n+CAAGCTAATAATCTACAGCAATTTCTTAAAGACCGAAAATGTATCAACTT\n+CGGCAAAATATGAAAATTTAACATTTATTTTTCAACATTTTTTGCCAAAT\n+AATCGACAAAAATTTCAGTGTCCCGATTTGGATGCGAATTAATTGAGGAC\n+AATTGTGACTTTGTTTTGTAAAAAAACTATTTTTTTTACTGAAAATTACA\n+ATCAAGAATCTAAGGCCAAATCAGAATATTTTCACTGCGGTTTTTTGATC\n+GCAATTCTGCTAAATCGGGTTCCGTGCCAAAAAGCTGACTATTTTTTTTA\n+CTGAGAATTAGCATCAAGAATTTATTGCCAAAACAGAACGCAATTCTGCT\n+AAATCGGGTTGCCCTGCCAAAAGGCTGGCCGTTTTGCGCATTCAATAACA\n+CAAGCTAACGGTTTACAGCACATTCGGAAAGATCCAAAAGAATTTCTATT\n+TCGGCATTTTTTATGTATTATCGTCTAATTTTGGTATGTGTATTCATTCT\n+TTTGGCTGTCCGTTATTAAGCTGCTTTTCTTATTCACATATTCAATGGCG\n+CAGTACATAAAAAGAATGAACCGTGGTTTTCTTGCCCTCTCCATCTCCCT\n+CTACCACTTCCCCTCTCAACAACTATCTCACGCACTCTGTCCCTTCTCGT\n+CTCTGTCACCCTCTCTTTACCTACCTCACTCTGGCACACTCTCTCTACCT\n+ATCTCACTCTGTCACCTTCTTCTACCTAATTCTCTCTGTCGCGCTCGCTC\n+TCTCAACATGCCTTTCGCACCGTATCTCTTCGTTTCTCTGTATGCTTGCT\n+CTCTTAATTTAAGTTTCTCTTTCTTTGTGTTCAATATCTTTCGCGCTCGT\n+GACTCCTATTGACCGGACTCTGAGCGGTGCTCATTAAGAGTGGAGTTTTC\n+GATGATGGCGGGTGGCGCGAACGAGAATTTTTTACATAAAGGTAAGTTGC\n+CAATTCTTTTTTAAATGTGACATACAGCATGCATATTTTATTTATTGTAA\n+TTATATGTGAAAGAATAAAATTATATGTACTTTTATCTAATCTATTGCAT\n+CTATTTTTTCACAGGTAAACGAGTCACACGAGAAGTAAAACACAAACACA\n+AGGATCAAAATAAAATTCAGGTGAGTGAACGAACGTGTTGAAAGTAGTTA\n+ATAGTGCATGTCTATTTAAGTGTAAGAAACAAAAAAGACACAAATGGGCC\n+AATAATTCGTTTCTTTAATAGATAACTGCCTATATTATGTTCAAACTATG\n+CTAAAAAGACCCAAAAGGAAAACATAAAGTATATACCTTGCAAAATGAAT\n+AAAAAGAAATCATATATATTCATATACGTTTGACCGGTACCACCGGTCAT\n+ACATACATAAACATAAACACAAAAAGACTAGAATATAAATACCATATTTT\n+TGATTGGCTTAAAAATGGCACAAAAAAAAGATAAAAACTAGAGTGTCTAG\n+CTTTAAGTGACAATCGACTCGGAAAATGATCAAGAAATAAATGAAAAATT\n+TGTCTTGCGGCTTTTTGGTCGCAATTCTAAATCGGTTTGTATGTATGTCA\n+CTCTTCATGTATACAATTTGGTGGCTTTGTATTCCACAAAAGTCACAGTA\n+GTCACAAAAGTTTTTTTTAC
TGAAAATTACCATCAAGAGTCTATGGCCAA\n+ATCAGAATATTTTCACTGCGGTTTTTTATTTCAATTCTGCTAAATCGGGT\n+TTCCGTGCCAAAAAGCTTTTGCAGCCAACAACAATATTCAATTTTTTGGC\n+AAAAAATCGACAAAAAAATT\n'
b
diff -r 000000000000 -r 8b19a698d90e test-data/sequence_cov.bigwig
b
Binary file test-data/sequence_cov.bigwig has changed
b
diff -r 000000000000 -r 8b19a698d90e tool_dependencies.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_dependencies.xml Mon Jun 25 15:01:41 2018 -0400
b
@@ -0,0 +1,9 @@
+<?xml version="1.0"?>
+<tool_dependency>
+    <package name="samtools" version="1.2">
+        <repository changeset_revision="f6ae3ba3f3c1" name="package_samtools_1_2" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" />
+    </package>
+    <package name="ucsc_rename_bigwig" version="340">
+        <repository changeset_revision="39d26518c84b" name="package_ucsc_rename_bigwig_340" owner="yating-l" toolshed="https://toolshed.g2.bx.psu.edu" />
+    </package>
+</tool_dependency>