Repository 'change_fasta_header_using_tabular_file'
hg clone https://toolshed.g2.bx.psu.edu/repos/portiahollyoak/change_fasta_header_using_tabular_file

Changeset 0:540425dc9746 (2016-04-22)
Commit message:
planemo upload for repository https://github.com/portiahollyoak/Tools commit 132bb96bba8e7aed66a102ed93b7744f36d10d37-dirty
added:
change_fasta_header_using_tabular_file.py
change_fasta_header_using_tabular_file.xml
test-data/genbank_input.fasta
test-data/output.fasta
test-data/tabular_file.tsv
b
diff -r 000000000000 -r 540425dc9746 change_fasta_header_using_tabular_file.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/change_fasta_header_using_tabular_file.py Fri Apr 22 12:07:53 2016 -0400
[
@@ -0,0 +1,63 @@
+
+# coding: utf-8
+import argparse
+import sys
+
+
+def get_dict(tabular_file_handle):  # In this function, the open file tabular_file_handle is read line by line
+    """
+    This function creates a dictionary out of the file provided containing TE ID names\
+    and their common usage names separated by a tab
+    """
+    dictionary = {}  # A dictionary is named 'dictionary'
+    for line in tabular_file_handle:  # For every line in the file
+        line = line.strip()  # The leading and trailing white spaces are stripped
+        key, value = line.split("\t")  # The line is then split where there is a tab and 
+                                       # then the two results are defined as key and value
+        dictionary[key] = value  # The key is linked to the value
+    return dictionary  # Return the completed dictionary to the caller
+
+
+def replace_id(line, dictionary):  
+# In this function, the dictionary and the lines of the fasta_file_handle are fed in.
+    """
+    This function reads a fasta header (line), recovers the name of the sequence "(>fasta_1)"
+    and stores this in key. We look up key in the dictionary, and if the key is present,
+    we replace the key in the line with the value that is assigned to the key in the
+    dictionary.
+    """
+    key = line[1:].strip()  #The key is the ID name (not including the >)
+    if key in dictionary:  #If key is in the dictionary, it is replaced
+        line = line.replace(key,dictionary[key])
+        return line
+    print("Value  %s is not present in multifastafile" % key)
+    return line
+
+
+description = ( "This script will exchange fasta headers in multifasta file with values linked in tabular file")
+
+parser = argparse.ArgumentParser(description)
+parser.add_argument("--tab_input", help="A tabular file containing two linked columns separated by a tab")
+parser.add_argument("--fasta_input", help="A multifasta file containing fasta headers and their sequences")
+parser.add_argument("output", help="Name of the output fasta file.")
+# uncomment the next line only when interactively testing!
+#args = parser.parse_args(["--tab_input", "TE_ID_Names.tsv", "--fasta_input", "TE_seq_d.fasta", "my_fancy_new_out.fasta"])
+args = parser.parse_args()
+
+
+python_version = sys.version_info
+if python_version.major >= 3:
+    kwargs = {"encoding": "utf-8"}
+else:
+    kwargs = {}
+
+with open(args.tab_input, **kwargs) as tabular_file_handle:
+    dictionary = get_dict(tabular_file_handle)
+
+with open(args.fasta_input, **kwargs) as fasta_file_handle:
+    with open(args.output, "w") as output:
+        for line in fasta_file_handle:
+           if line.startswith(">"):
+                line = replace_id(line, dictionary)
+           output.write(line)
+
b
diff -r 000000000000 -r 540425dc9746 change_fasta_header_using_tabular_file.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/change_fasta_header_using_tabular_file.xml Fri Apr 22 12:07:53 2016 -0400
[
@@ -0,0 +1,52 @@
+<tool id ="change_fasta_header_using_tabular_file" name="Change fasta header" version=" 0.1.0">
+    <description>using a tabular file</description>
+    <stdio>
+        <exit_code range="1:" />
+    </stdio>
+    <command>python $__tool_directory__/change_fasta_header_using_tabular_file.py
+        --tab_input "$input1"
+        --fasta_input "$input2"
+        "$output"
+    </command>
+    <inputs>
+        <param format="tabular" name="input1" type="data" label="Tabular File"/>
+        <param format="fasta" name="input2" type="data" label="Fasta file"/>
+    </inputs>
+    <outputs>
+        <data format="fasta" name="output" />
+    </outputs>
+    <tests>
+        <test>
+            <param name="input1" value="tabular_file.tsv" ftype="tabular"/>
+            <param name="input2" value="genbank_input.fasta" ftype="fasta"/>
+            <output name="output" file="output.fasta"/>
+        </test>
+    </tests>
+    <help> <![CDATA[
+
+This tool takes 2 input files: a fasta file, and a tabular file with the text to replace in
+the first column and the replacement text in the 2nd column.
+Every fasta header that matches a value in the first column of the tabular file will be
+replaced with the corresponding value in the 2nd column.
+
+-----
+
+*Example*
+
+**Fasta header** ::
+
+    >RT1C
+    ATGCATGC
+
+**Tabular file** ::
+
+    RT1C    Rt1c
+
+**Output file** ::
+
+    >Rt1c
+    ATGCATGC
+
+
+    ]]> </help>
+</tool>
\ No newline at end of file
b
diff -r 000000000000 -r 540425dc9746 test-data/genbank_input.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genbank_input.fasta Fri Apr 22 12:07:53 2016 -0400
b
b'@@ -0,0 +1,4 @@\n+>RT1C\n+GGGGACGCGCGCGAGTAGCCGTGTGAATCGAGTTGGCGCTCCTGGAAAACCCCAAAATTTTCCGTGTCGCGGCGGCTTGATGGAGACAGGAGTGGCTGTCTCTAACACACAGTGCCGATATGAGTACTCACCAGCAGTGGGCAAGCTCCAAGTATCCATGGATCGCCCGCCGGCGCCGATCCTCAGGGCCATGGAGCAGGTCAGGGTGAGAGAAGCAGCGAACTTTCTCTGCACTACTTTCTCTTTGTCGCTGTGTTGTTTCTTTTGGCGTCTTGGCTGCCACCAGACTTGCCGGTCACGCCAGCTGATCTCGCAGTCAGCTTGGAAAGCAGTGCTGGTAAACGGCTAAAGCACCGCGGTCTGGCAGCGCTGGTCGGATGCACGAGTCCCCTAGCACAGGTGAGCCGTTTTCTCGGTGAAAGCACTCACTGACAAAAGCTAGCAGCTACGGAAATCGCCTAACGATCGGTTCACCGGTCGTAGCATACATTTTTGGGCGGCTGACGGTTATCCTTGGCAACATCCCATGGAAACCCGGAGACAGATCCATAATCGAGCAGGAGAGGCAGAACAAGAGTGTAAAAAGTCAAGGAGCAGACCAATAGCCAACCCCCCCGCTTAGGCGGCACACTTTAAATCCGGGGCTCTGGCGACCAAGCTGGAGCGGTATATCTCCCACCGTCGCAACTTTCCCCTGCTCACCCACCCCATAAGTCCACGGCGCGTCTGACCCAAAGTGGGCGGGTACGTGGCCTGCGCCTGTTCTCTTTACCAGCCGGGCAGCAGCAAAATAAAAACCCATTCAGCGTCTGAGCCAAGTTGGCCGGCGGAATGGTCTGCGTCTGCGCCGCATCGGCCGGCAGAATATCCAAAACCTGGCGAAAGGTATAAAGCCGCAAACCTGGCAGGAGGTATAAAATGCAACACCTAACTGGAATGTCTGTAAACAACTTTATTACTCCAGGTGGCAGCCACACATGTGGAAATCCACCCTCGGCTAATCCCGAGGCTAGGGCACGGATTCTGGAGGCCCTACCAAACATTCTCCCCAAACCCGCCCCGACGGCGGCACACTTGGCCGTCGGACTAAGCAATGCAACAAGTGCACCCACAACGGACGAAGAAAGCTTGGTGTTTGGGAAAAGGTCAAAGGTCCTAAGGACCCCACCCCAGAACCCGAGCGATGGCACCCCCAAGAGGCCATTAGAAGCGACATCCCCCCTACCAGAGCCCAACCAGCAAAGCGGGTAAAGACCCCCCAGCTAGAAATCGAGGAGATGGGAGCAATCCTGGACGACCTTCTGACGAAGGTCAACCACAACGGGGTGAGGAGCGTCAATCAGGCAATGAAAAACTCATTCGCCAGATTGAAGGAGCTCCAACTAAAGCTGCGCACAAGGCTGCCGGAGGCGGAGAATTCGCATGTCGGACGCACCGCAAGAGCCGATGCTAGCCAACAGACCACCCCTAAGCGCCCCTCCAGCCACGAAGAACCGAGTAAGGGTCCGCGAAGAAAGCCCAGCGATCCGACCACCAGAAGGCAGCGGGACCCAAGCGCCTACCAAGGGCTCCGCCCCAAGCCACTGCAGCGGGAAACAAGACGCAACCAAGATTGCAGCATCCGCCCGGACCGCGCAGGAAGAGACCGCCAAGGGAGAGGCCAGATGCGCTGGTTATCACCCCCTCAGCTGGCTTACCGTACAGCGAAGTGCTGTCGCTGGTCACAAGAGGGCAGGACGCCAGGCTCAGGGCCATCGGGGAGAACGTATCAAGGGTTAAGAGGACGGCCAAAGGCGAACTGCTCCTCGAGCTACGTGCCTCTGCCCAAGACTTGACGCAGAAGCTCAAGATGGACATGGGAGCGGTGCTAGGAGACCGCGCCAGCCTTCGCGCGTTAACTCAATCCAAAGTATTTTTGATTCGCGACCTCGACGAGCTTACTACTGAAGACGAGCTGAGGAGGGTCCTGGAG
TCCCGGCATAGATTCCAGCAGCAGTGGTGGCTATCAAGAGCCTCCGTCAAACGCAGTATGGAGGGAAGTCTGCTATAATAGCAGTTCCAGCCAATCTGGCGGACCCGCTGATCAAGCGTGGCAAGCTGAGGGTAGGATGGTCCCAATGTCTGATCAAGGAACTGGAGCCACGCCAAAGATGCTTCAAATGTCTGGAGGAAGGCCACATAGCGGCCCATTGTAGAAGCGCCGTCGACAGAAGCCAGTGCTGCTTCAGATGCGGGTCCGCGGGACACAAGGCCGCAGAGTGTCCCAACGAGGCTAAGTGCTTTTTGTGCGCAAGCAGAGGAAGCCAAGCGACCAACCACCAAGCAGGCACCCGGAAGTGCCCATTGGCGGGCAAAGGAGCACCAAAGGCACCACAATGATGCGTTTGATTCAGCTAAACCTGAATCACTGCACGGCAGCCCAAGACCTGCTAGTGCAGACGGTGCGCGAACGCAGAGTGGAGCTTGCGTTACTTAGCGAGCCCTACCGGACGGCGGACAGCCCAGACTGGGCTTTCGACCGCGCCAAGAAAGCAGCAATCTGGAGGTGCAGCAGAGAAGCCCAACAATTAACCGATGTTTTTTCGGACATCGGGTTTGTTAGGGCAAAGGTGGGCAGATGGTGGGTGTACAGCCGGATGCTAGAGGCCGCACCCAGGTTCTCATAGCTGGCGACTTCAACGCATGGTCAGAGAGCTGGGGCAGTTCAACCACCAACGCGAGAGGCAGGATGGTGCTCGAGGCATTCGCGACGCTGGACCTGGCTCTATTAAACCAAGGGAACCGGCACACGTTCAGGCGTGCCGGACTGGGCTCTGTGGTGGACCTCACCTTCACTAGCGGCTCGTCGTTCAGGCTAACGAGGTGGAGACTCAGCGAGGAATACACTGGCAGTGACCACTTGGCCATCATTTGTGATCTGGGATGCCCTTCCTCGACCCAAGCCCAGCTAGCAGCCCAAGCCAGGATAAAATACAAAACGGACACCCTGGACACGCAGTTATTCCGAGAGCAGTTCCTACCCTCGGTGAGTGGAGAAGGAGCTGAGCTGACGGCAGTGGCGCTGATGAGGCAGCTGAAGACCGCGTGCGACGACAGCATGCAAACAAGCAGGACACATAGCCAACAAAGAGCCCCTGTCTACTGGTGGAACCAGGAGATAGAGACGGCTCGCCGAGAATGCCTCTCCGCCAGACGTCGCTATCAACGCGCTAGAGGTGCGGAGTCCTTTGCCGAACGCCAATCCGAGTATAGAGCCCGCAGGAAAGCACTCAAGCTAGCCATACGGGAGAGCAAGCGGAAATGCTTCCTCGACCTATGCGATTCTGCTGACAGCGACCCATGGGGAAGTGCCTACAAGGTGGTGGTCAAGCAGGCATATACGAGGACTCCCAAGCTACTGGACCCAGCGATGCTCCGCAGTGTAGCGGAACATCTGTTTCCTTTGATGGACAGGTTACGCCCCGCCGACCCAGCCACAGGGGACCACGTCGAAGCCGACGCCACGGTCAGCAGTGAGGAGATCCTGGAGCTGGCGAAACTGCTGAAGGACGGCAAGGCCCCCGGGCCCGACGGCATTCCGATCAGGGCGCTTCGGCTCTCTCTACCTCCAGCCAACTCGTTTGCGAAGGCATTCACCAAGTGCCTGACGGAAGGAGTCTTCCCAAGTTGCTGGAAGGTACAAAAGTGTTGCTCCTCCCAAAACCAGGGAAGCCACCCGAGGAGCCTATATCGTTCCGGCCGATATGCCTCATCGATGGAACTGGCAAGCTCCTGGAGAAACTGGTGTGCATTCGGCTAGAGAGGGCTATCGCAGACGCGGGTGACCTCTCACGGTCCCAGTTTGGCTTCAGGAAAGCGCGGTCCACCGTCGACGCCGTCAACAGAGTGGTCGAAGTAGCGGCCCAAGCAATCGAGGGCACCAGATGGAAGGGGGGTAGCAAAGAGTACTGCCTCATGGTCACACTAGACATC
AGG'..b'GACAGGAGAGGCTTCGTACGCAGAGATGCTTCGGAAGCTAAGATCGGACCCGAGCCTTAGCGAACTGGGCAGCCACGTGCGAAAAATCCGGAGAACGCAGAAAGGTGAGCTGTTGCTCGAGGTAGAGGGGAAAGCTTCGGAAAGCGTCCCCAAGTTTAAGAGCGACCTGGAAGCGGCGCTCAATGACTTGGCCTCTGTGCGCACAGGAGCGCAAAGAATAGCTCTATCTTGCAGCGGATTGGACGAGGCTACGACAGCAGAGGAGCTCCACAGCTGCTTGGTCGCCCAATTCCAGGGCCTGCAGATAAATCCTGAAGATATCAGGGGCCTTCGCAGAATGCGGGATGGCACGCAAATAGCCTCAGTGCTGCTGAACGCGAACGTTGCGATACCAGTCCTTAAACAGGGCACCATAACCGTTGGATGGTCAAGATGTCGTATCACCCAGGACGTTCGACCCACGAGATGCTACAGGTGTCTCGGCTATGGGCATCGATCAGCAACCTGCAAGAACACTGACAGGGCAGACTGCTGTCTTAGATGCGGTGAGCGTGGGCACAAGGCAAAGGGGTGCGTTGCAGCACCAAAATGCCTGATCTGCAGCAGCGAGGTGGACAGAAACCACTCGACGGGTAGCTTTGCGTGCCCGACCTACAGAGCGACCCTAAAAGAAGCCAAGAGCCACCTTAATGCACACTCATATTAGCGTAGTACAGCTCAATGTCAATCATTGCGCAGCAGCTCAGAGCCTCCTGGCCCAGACTGCGGCTGAGCGCAATGTAGACATCATGCTCCTAAGCGAACCCTACGTCTCTGGTAGCGGACAATCGTCCATGATCCTTGACGAGACAGGTAAAGCAGCTATCAAATGCTGCAGCTCTCTCCACGTCGAGGAACTGGCTGCTTTACCTATGCGGGGTATCGCTTATGCGAAGTTAAAACACGTGCACTTGTACAGCTGCTACGCTCCGCCGAGCGACACCCCCGATCAGTTCGAGGAGTTTCTGGAGGCGCTCGTGGACCATGCGAGAGGGCGAAGCCCGAAGGTCATTGCCGGCGACTTTAATGCCTGGGCAGTGGAATGGGGCAGCAGGACATCCAACACCAGAGGCCGAGCTGTGATTGACGCCATGGGAATGCTGGACCTTATACTGCTGAACGACGGACGGAAGCCGACGTTTAACAACGATAGGGGTACGTCCTTTATTGACGTTACCTTTGTCAGCAGAGGGCTAGTAGACAACAATAACTGGATGGTCCATGACGTCATGACGCTGAGCGACCACGCCCTGATCTCCTTCAGTCTCTCCCCGGAGGACATGCCCAGGAGACGGCAGAGTAGAGCAGTCGGGAAAGCATGGGACACCAGGAAGATCGATGAGGCCATGCTGGCCTATCAGATCAATTCCCTGGAAATCCCAAGTGGGGACGCAGAGAGTATGGCGGCAGGCCTCATGAATATGCTGGGAAGAATCTGCGACGCAATCATGCCAAGGAAAAATAAGGCACAGCGCAAACCACCCGTTTACTGGTGGAGCGCCTCCCTAAGCCAACTACGGTCTGATTGCCTCAGGGCTAGGAGAATGGCGCAACGAGCCAGAGGCAGTACCCACCACGCGGAACTCTTGGAGGCTTTCAGAAGGAAACGTCTAGAGTTCAAGCACGGCATCGCGGCTGCCAAAGCGCGGTCGTTTAAGGAGCTGCAGGATGGCGTAGACAGCGATACCTGGGGCCTCGCCTACAAGCTTGTTACCAAAAAGCTAAGGAGGAGAGCGGCAACCCCATCCGACCCGGGGGTCCTGGCTAACATAGTAGGGGAGCTATTCCCAAAGCAGACCACACTATGGAGGCCAACAGAGGCAGCCCCTGCCCCAGATTTTCCGTGCGTCACAGAACTTGAAGTCGCCGAGGCAGCCAAGCGCATCAAACCCAACAAAGCCCCTGGACTAGATGGTATTCCTGGAGCTGTTATAAAAGCAGTGGCGCTGGGTA
GACCTGAAATCTTCAGGGCCACCTTCCAGCAATGCCTTCTGGACGGAATCTTCCCAACAAGGTGGAAAAGCCAGAAGCTAGTCCTGTTGCCGAAAGGCAAGGGACCAGCACATGCTGCAAACAGCTACCGCCCTCTATGCCTACTGGATATAGTAGGAAAACTGTTCGAACGTATCCTGTATACCAGAATAGAGGCAATCACCGAGAGCATCAACGGCCTGGGAAGTCATCAATATGGCTTCCGGAAAGGTAAGAGCACTCTGGACGCTCTTTCGGCCGTTTGTAACATCGCCAAGACCGCTATTTCTGGTGATAGATGGTTAGGGGGCAGGAAGGAATACTGCGCAATTGTGACTCTGGACGTAAGGAACGCTTTCAACACCGCCAGATGGCCCGTAATCCTCGCGGCCATGTACCGTATGGGGATCCCGGAGTACCTAAGGATAGTCGTTGGCAGCTACTTTAGGGACCGGGTCCTATGGTACGATACGGAAGATGGCCCAAAAAGATACCGAGTTTCGGCAGGTGTTCCCCAAGGATCGGTACTTGGACCAATCCTATGGAACATTATGTACGATGGGATCTTGGGCATCAACAGGCCCGTAGGAGTAGAGCTGCATTGTTTTGCTGACGATGTGGCAATCACAGCTGTCTCGAAAACAATCGCAGGGTTGGAAGACAAATGCAACTCTACGATCGGTGCTGCCATCCGCTGGCTCGAGAAAGCCGGGCTAGCAATAGCGGCTCACAAGACCGAAGCAGTCCTACTAAGCAGCAGGAAAAAGGTGGAGAACATGCTGGTCTCCGTCAAGGGTACACAGGTGACCTCTCAAGAGTCCCTAAAGTACCTGGGGGTAATGATAGATCGCAGACTATCGTTCAAGGACCACGCGAGCCACGCCAGCAAGAAGGCAGCAATCACAGCCTCTTCGTTGGCGAGGCTTATGCCCAACGTCGGAGGCCCAAGACACCCGGCCAGGAAACTGCTGGTGTCAGTAGCAAAGGCTTCGCTACTATACGCTGCACCAGTCTGGAGCAATGCCACTGGCAGGGTCTCATACCTGAAAGGAGCTCGTTCGGTGCTACGGTCAATGTCTCTGAGGCTCATTAGAGGTTTCAGGACCATATCCGAAGACGCGGCGCTAGCGCTGGCAGGCCTGCCGCCGATTGATCTGGAGATCAAGGCTCTCAGCCTAATGCGGAGTGGCGCTTCCAGGCAAGAGGCACACGAGTGGCTATTAGGTGAATGGCAGAGTAGATGGCAAACGTCGCGACGGGGGAGGTGGACTTATCAGCTCATCCCAGAGATGACGGTTTGGGCAGAGTGCCAACACAAATGCTTGGACTACCACCTAACCCAGTTCCTCACGGACCATGGCTGCTTCCGGGCCTATCTACTCCGGTTCCGTCACGTAGAGTCAGCCCAATGCTTGTTCTGCGTCGACGGTGAAGAAACAGCAGAACATGTGCTAATGCACTGCTCCAGGTTCACGGCGGAGAGAGAGCAGCTAAAGACGCTGTCAGGTTCCCCGTTCAGCCCTAGTGGCTTGTTCGCGGCTATGATGGCGAACAGGGGGGCTTGGGAGCGGGGACACAGCATTATCATTAATATGATGAAGCGTGTCCGATCAGACGAGATGGCCAACAGAGTGGATGTCTAAGCCCAAACTGGTGTCCTGGGTGACGGCGGGCGAAGAATTCATCCTCAGCGTCCCCGGCTCGTCGTAAAAGGCGACTAAAGGGTGGAAGGAGGAGCCCCCATGGACTACACTGAAGGAAGGGAGTGCGACCTGGCCTCACATCCTGCTCACCGAAGTCATACCTTGACTGGCAGTCCCGGTGAGCGAGCAAGGACTGTAGAGCACGCGGAGGTTTTTGTTTTAGTACGTAGGCATAATTCCAATAGGGCTTATGAATCGTGCATGCCACCTACGGACGGTAGGTGGTATCTTTAGAAGATTTTAATTTTCCTACCGTAAGTCAAATAATAAAAAAAAAAA
AAAAAA\n'
b
diff -r 000000000000 -r 540425dc9746 test-data/output.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output.fasta Fri Apr 22 12:07:53 2016 -0400
b
b'@@ -0,0 +1,4 @@\n+>Rt1c\n+GGGGACGCGCGCGAGTAGCCGTGTGAATCGAGTTGGCGCTCCTGGAAAACCCCAAAATTTTCCGTGTCGCGGCGGCTTGATGGAGACAGGAGTGGCTGTCTCTAACACACAGTGCCGATATGAGTACTCACCAGCAGTGGGCAAGCTCCAAGTATCCATGGATCGCCCGCCGGCGCCGATCCTCAGGGCCATGGAGCAGGTCAGGGTGAGAGAAGCAGCGAACTTTCTCTGCACTACTTTCTCTTTGTCGCTGTGTTGTTTCTTTTGGCGTCTTGGCTGCCACCAGACTTGCCGGTCACGCCAGCTGATCTCGCAGTCAGCTTGGAAAGCAGTGCTGGTAAACGGCTAAAGCACCGCGGTCTGGCAGCGCTGGTCGGATGCACGAGTCCCCTAGCACAGGTGAGCCGTTTTCTCGGTGAAAGCACTCACTGACAAAAGCTAGCAGCTACGGAAATCGCCTAACGATCGGTTCACCGGTCGTAGCATACATTTTTGGGCGGCTGACGGTTATCCTTGGCAACATCCCATGGAAACCCGGAGACAGATCCATAATCGAGCAGGAGAGGCAGAACAAGAGTGTAAAAAGTCAAGGAGCAGACCAATAGCCAACCCCCCCGCTTAGGCGGCACACTTTAAATCCGGGGCTCTGGCGACCAAGCTGGAGCGGTATATCTCCCACCGTCGCAACTTTCCCCTGCTCACCCACCCCATAAGTCCACGGCGCGTCTGACCCAAAGTGGGCGGGTACGTGGCCTGCGCCTGTTCTCTTTACCAGCCGGGCAGCAGCAAAATAAAAACCCATTCAGCGTCTGAGCCAAGTTGGCCGGCGGAATGGTCTGCGTCTGCGCCGCATCGGCCGGCAGAATATCCAAAACCTGGCGAAAGGTATAAAGCCGCAAACCTGGCAGGAGGTATAAAATGCAACACCTAACTGGAATGTCTGTAAACAACTTTATTACTCCAGGTGGCAGCCACACATGTGGAAATCCACCCTCGGCTAATCCCGAGGCTAGGGCACGGATTCTGGAGGCCCTACCAAACATTCTCCCCAAACCCGCCCCGACGGCGGCACACTTGGCCGTCGGACTAAGCAATGCAACAAGTGCACCCACAACGGACGAAGAAAGCTTGGTGTTTGGGAAAAGGTCAAAGGTCCTAAGGACCCCACCCCAGAACCCGAGCGATGGCACCCCCAAGAGGCCATTAGAAGCGACATCCCCCCTACCAGAGCCCAACCAGCAAAGCGGGTAAAGACCCCCCAGCTAGAAATCGAGGAGATGGGAGCAATCCTGGACGACCTTCTGACGAAGGTCAACCACAACGGGGTGAGGAGCGTCAATCAGGCAATGAAAAACTCATTCGCCAGATTGAAGGAGCTCCAACTAAAGCTGCGCACAAGGCTGCCGGAGGCGGAGAATTCGCATGTCGGACGCACCGCAAGAGCCGATGCTAGCCAACAGACCACCCCTAAGCGCCCCTCCAGCCACGAAGAACCGAGTAAGGGTCCGCGAAGAAAGCCCAGCGATCCGACCACCAGAAGGCAGCGGGACCCAAGCGCCTACCAAGGGCTCCGCCCCAAGCCACTGCAGCGGGAAACAAGACGCAACCAAGATTGCAGCATCCGCCCGGACCGCGCAGGAAGAGACCGCCAAGGGAGAGGCCAGATGCGCTGGTTATCACCCCCTCAGCTGGCTTACCGTACAGCGAAGTGCTGTCGCTGGTCACAAGAGGGCAGGACGCCAGGCTCAGGGCCATCGGGGAGAACGTATCAAGGGTTAAGAGGACGGCCAAAGGCGAACTGCTCCTCGAGCTACGTGCCTCTGCCCAAGACTTGACGCAGAAGCTCAAGATGGACATGGGAGCGGTGCTAGGAGACCGCGCCAGCCTTCGCGCGTTAACTCAATCCAAAGTATTTTTGATTCGCGACCTCGACGAGCTTACTACTGAAGACGAGCTGAGGAGGGTCCTGGAG
TCCCGGCATAGATTCCAGCAGCAGTGGTGGCTATCAAGAGCCTCCGTCAAACGCAGTATGGAGGGAAGTCTGCTATAATAGCAGTTCCAGCCAATCTGGCGGACCCGCTGATCAAGCGTGGCAAGCTGAGGGTAGGATGGTCCCAATGTCTGATCAAGGAACTGGAGCCACGCCAAAGATGCTTCAAATGTCTGGAGGAAGGCCACATAGCGGCCCATTGTAGAAGCGCCGTCGACAGAAGCCAGTGCTGCTTCAGATGCGGGTCCGCGGGACACAAGGCCGCAGAGTGTCCCAACGAGGCTAAGTGCTTTTTGTGCGCAAGCAGAGGAAGCCAAGCGACCAACCACCAAGCAGGCACCCGGAAGTGCCCATTGGCGGGCAAAGGAGCACCAAAGGCACCACAATGATGCGTTTGATTCAGCTAAACCTGAATCACTGCACGGCAGCCCAAGACCTGCTAGTGCAGACGGTGCGCGAACGCAGAGTGGAGCTTGCGTTACTTAGCGAGCCCTACCGGACGGCGGACAGCCCAGACTGGGCTTTCGACCGCGCCAAGAAAGCAGCAATCTGGAGGTGCAGCAGAGAAGCCCAACAATTAACCGATGTTTTTTCGGACATCGGGTTTGTTAGGGCAAAGGTGGGCAGATGGTGGGTGTACAGCCGGATGCTAGAGGCCGCACCCAGGTTCTCATAGCTGGCGACTTCAACGCATGGTCAGAGAGCTGGGGCAGTTCAACCACCAACGCGAGAGGCAGGATGGTGCTCGAGGCATTCGCGACGCTGGACCTGGCTCTATTAAACCAAGGGAACCGGCACACGTTCAGGCGTGCCGGACTGGGCTCTGTGGTGGACCTCACCTTCACTAGCGGCTCGTCGTTCAGGCTAACGAGGTGGAGACTCAGCGAGGAATACACTGGCAGTGACCACTTGGCCATCATTTGTGATCTGGGATGCCCTTCCTCGACCCAAGCCCAGCTAGCAGCCCAAGCCAGGATAAAATACAAAACGGACACCCTGGACACGCAGTTATTCCGAGAGCAGTTCCTACCCTCGGTGAGTGGAGAAGGAGCTGAGCTGACGGCAGTGGCGCTGATGAGGCAGCTGAAGACCGCGTGCGACGACAGCATGCAAACAAGCAGGACACATAGCCAACAAAGAGCCCCTGTCTACTGGTGGAACCAGGAGATAGAGACGGCTCGCCGAGAATGCCTCTCCGCCAGACGTCGCTATCAACGCGCTAGAGGTGCGGAGTCCTTTGCCGAACGCCAATCCGAGTATAGAGCCCGCAGGAAAGCACTCAAGCTAGCCATACGGGAGAGCAAGCGGAAATGCTTCCTCGACCTATGCGATTCTGCTGACAGCGACCCATGGGGAAGTGCCTACAAGGTGGTGGTCAAGCAGGCATATACGAGGACTCCCAAGCTACTGGACCCAGCGATGCTCCGCAGTGTAGCGGAACATCTGTTTCCTTTGATGGACAGGTTACGCCCCGCCGACCCAGCCACAGGGGACCACGTCGAAGCCGACGCCACGGTCAGCAGTGAGGAGATCCTGGAGCTGGCGAAACTGCTGAAGGACGGCAAGGCCCCCGGGCCCGACGGCATTCCGATCAGGGCGCTTCGGCTCTCTCTACCTCCAGCCAACTCGTTTGCGAAGGCATTCACCAAGTGCCTGACGGAAGGAGTCTTCCCAAGTTGCTGGAAGGTACAAAAGTGTTGCTCCTCCCAAAACCAGGGAAGCCACCCGAGGAGCCTATATCGTTCCGGCCGATATGCCTCATCGATGGAACTGGCAAGCTCCTGGAGAAACTGGTGTGCATTCGGCTAGAGAGGGCTATCGCAGACGCGGGTGACCTCTCACGGTCCCAGTTTGGCTTCAGGAAAGCGCGGTCCACCGTCGACGCCGTCAACAGAGTGGTCGAAGTAGCGGCCCAAGCAATCGAGGGCACCAGATGGAAGGGGGGTAGCAAAGAGTACTGCCTCATGGTCACACTAGACATC
AGG'..b'GACAGGAGAGGCTTCGTACGCAGAGATGCTTCGGAAGCTAAGATCGGACCCGAGCCTTAGCGAACTGGGCAGCCACGTGCGAAAAATCCGGAGAACGCAGAAAGGTGAGCTGTTGCTCGAGGTAGAGGGGAAAGCTTCGGAAAGCGTCCCCAAGTTTAAGAGCGACCTGGAAGCGGCGCTCAATGACTTGGCCTCTGTGCGCACAGGAGCGCAAAGAATAGCTCTATCTTGCAGCGGATTGGACGAGGCTACGACAGCAGAGGAGCTCCACAGCTGCTTGGTCGCCCAATTCCAGGGCCTGCAGATAAATCCTGAAGATATCAGGGGCCTTCGCAGAATGCGGGATGGCACGCAAATAGCCTCAGTGCTGCTGAACGCGAACGTTGCGATACCAGTCCTTAAACAGGGCACCATAACCGTTGGATGGTCAAGATGTCGTATCACCCAGGACGTTCGACCCACGAGATGCTACAGGTGTCTCGGCTATGGGCATCGATCAGCAACCTGCAAGAACACTGACAGGGCAGACTGCTGTCTTAGATGCGGTGAGCGTGGGCACAAGGCAAAGGGGTGCGTTGCAGCACCAAAATGCCTGATCTGCAGCAGCGAGGTGGACAGAAACCACTCGACGGGTAGCTTTGCGTGCCCGACCTACAGAGCGACCCTAAAAGAAGCCAAGAGCCACCTTAATGCACACTCATATTAGCGTAGTACAGCTCAATGTCAATCATTGCGCAGCAGCTCAGAGCCTCCTGGCCCAGACTGCGGCTGAGCGCAATGTAGACATCATGCTCCTAAGCGAACCCTACGTCTCTGGTAGCGGACAATCGTCCATGATCCTTGACGAGACAGGTAAAGCAGCTATCAAATGCTGCAGCTCTCTCCACGTCGAGGAACTGGCTGCTTTACCTATGCGGGGTATCGCTTATGCGAAGTTAAAACACGTGCACTTGTACAGCTGCTACGCTCCGCCGAGCGACACCCCCGATCAGTTCGAGGAGTTTCTGGAGGCGCTCGTGGACCATGCGAGAGGGCGAAGCCCGAAGGTCATTGCCGGCGACTTTAATGCCTGGGCAGTGGAATGGGGCAGCAGGACATCCAACACCAGAGGCCGAGCTGTGATTGACGCCATGGGAATGCTGGACCTTATACTGCTGAACGACGGACGGAAGCCGACGTTTAACAACGATAGGGGTACGTCCTTTATTGACGTTACCTTTGTCAGCAGAGGGCTAGTAGACAACAATAACTGGATGGTCCATGACGTCATGACGCTGAGCGACCACGCCCTGATCTCCTTCAGTCTCTCCCCGGAGGACATGCCCAGGAGACGGCAGAGTAGAGCAGTCGGGAAAGCATGGGACACCAGGAAGATCGATGAGGCCATGCTGGCCTATCAGATCAATTCCCTGGAAATCCCAAGTGGGGACGCAGAGAGTATGGCGGCAGGCCTCATGAATATGCTGGGAAGAATCTGCGACGCAATCATGCCAAGGAAAAATAAGGCACAGCGCAAACCACCCGTTTACTGGTGGAGCGCCTCCCTAAGCCAACTACGGTCTGATTGCCTCAGGGCTAGGAGAATGGCGCAACGAGCCAGAGGCAGTACCCACCACGCGGAACTCTTGGAGGCTTTCAGAAGGAAACGTCTAGAGTTCAAGCACGGCATCGCGGCTGCCAAAGCGCGGTCGTTTAAGGAGCTGCAGGATGGCGTAGACAGCGATACCTGGGGCCTCGCCTACAAGCTTGTTACCAAAAAGCTAAGGAGGAGAGCGGCAACCCCATCCGACCCGGGGGTCCTGGCTAACATAGTAGGGGAGCTATTCCCAAAGCAGACCACACTATGGAGGCCAACAGAGGCAGCCCCTGCCCCAGATTTTCCGTGCGTCACAGAACTTGAAGTCGCCGAGGCAGCCAAGCGCATCAAACCCAACAAAGCCCCTGGACTAGATGGTATTCCTGGAGCTGTTATAAAAGCAGTGGCGCTGGGTA
GACCTGAAATCTTCAGGGCCACCTTCCAGCAATGCCTTCTGGACGGAATCTTCCCAACAAGGTGGAAAAGCCAGAAGCTAGTCCTGTTGCCGAAAGGCAAGGGACCAGCACATGCTGCAAACAGCTACCGCCCTCTATGCCTACTGGATATAGTAGGAAAACTGTTCGAACGTATCCTGTATACCAGAATAGAGGCAATCACCGAGAGCATCAACGGCCTGGGAAGTCATCAATATGGCTTCCGGAAAGGTAAGAGCACTCTGGACGCTCTTTCGGCCGTTTGTAACATCGCCAAGACCGCTATTTCTGGTGATAGATGGTTAGGGGGCAGGAAGGAATACTGCGCAATTGTGACTCTGGACGTAAGGAACGCTTTCAACACCGCCAGATGGCCCGTAATCCTCGCGGCCATGTACCGTATGGGGATCCCGGAGTACCTAAGGATAGTCGTTGGCAGCTACTTTAGGGACCGGGTCCTATGGTACGATACGGAAGATGGCCCAAAAAGATACCGAGTTTCGGCAGGTGTTCCCCAAGGATCGGTACTTGGACCAATCCTATGGAACATTATGTACGATGGGATCTTGGGCATCAACAGGCCCGTAGGAGTAGAGCTGCATTGTTTTGCTGACGATGTGGCAATCACAGCTGTCTCGAAAACAATCGCAGGGTTGGAAGACAAATGCAACTCTACGATCGGTGCTGCCATCCGCTGGCTCGAGAAAGCCGGGCTAGCAATAGCGGCTCACAAGACCGAAGCAGTCCTACTAAGCAGCAGGAAAAAGGTGGAGAACATGCTGGTCTCCGTCAAGGGTACACAGGTGACCTCTCAAGAGTCCCTAAAGTACCTGGGGGTAATGATAGATCGCAGACTATCGTTCAAGGACCACGCGAGCCACGCCAGCAAGAAGGCAGCAATCACAGCCTCTTCGTTGGCGAGGCTTATGCCCAACGTCGGAGGCCCAAGACACCCGGCCAGGAAACTGCTGGTGTCAGTAGCAAAGGCTTCGCTACTATACGCTGCACCAGTCTGGAGCAATGCCACTGGCAGGGTCTCATACCTGAAAGGAGCTCGTTCGGTGCTACGGTCAATGTCTCTGAGGCTCATTAGAGGTTTCAGGACCATATCCGAAGACGCGGCGCTAGCGCTGGCAGGCCTGCCGCCGATTGATCTGGAGATCAAGGCTCTCAGCCTAATGCGGAGTGGCGCTTCCAGGCAAGAGGCACACGAGTGGCTATTAGGTGAATGGCAGAGTAGATGGCAAACGTCGCGACGGGGGAGGTGGACTTATCAGCTCATCCCAGAGATGACGGTTTGGGCAGAGTGCCAACACAAATGCTTGGACTACCACCTAACCCAGTTCCTCACGGACCATGGCTGCTTCCGGGCCTATCTACTCCGGTTCCGTCACGTAGAGTCAGCCCAATGCTTGTTCTGCGTCGACGGTGAAGAAACAGCAGAACATGTGCTAATGCACTGCTCCAGGTTCACGGCGGAGAGAGAGCAGCTAAAGACGCTGTCAGGTTCCCCGTTCAGCCCTAGTGGCTTGTTCGCGGCTATGATGGCGAACAGGGGGGCTTGGGAGCGGGGACACAGCATTATCATTAATATGATGAAGCGTGTCCGATCAGACGAGATGGCCAACAGAGTGGATGTCTAAGCCCAAACTGGTGTCCTGGGTGACGGCGGGCGAAGAATTCATCCTCAGCGTCCCCGGCTCGTCGTAAAAGGCGACTAAAGGGTGGAAGGAGGAGCCCCCATGGACTACACTGAAGGAAGGGAGTGCGACCTGGCCTCACATCCTGCTCACCGAAGTCATACCTTGACTGGCAGTCCCGGTGAGCGAGCAAGGACTGTAGAGCACGCGGAGGTTTTTGTTTTAGTACGTAGGCATAATTCCAATAGGGCTTATGAATCGTGCATGCCACCTACGGACGGTAGGTGGTATCTTTAGAAGATTTTAATTTTCCTACCGTAAGTCAAATAATAAAAAAAAAAA
AAAAAA\n'
b
diff -r 000000000000 -r 540425dc9746 test-data/tabular_file.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/tabular_file.tsv Fri Apr 22 12:07:53 2016 -0400
b
@@ -0,0 +1,2 @@
+RT1B Rt1b
+RT1C Rt1c
\ No newline at end of file