Mercurial > repos > tyty > structurefold
changeset 70:f76deb490f06 draft
Deleted selected files
author | tyty |
---|---|
date | Tue, 09 Dec 2014 02:49:03 -0500 |
parents | bd02fcf26f7a |
children | b6bdd41440f3 |
files | Iterative_mapping/.DS_Store Iterative_mapping/iterative_map.py Iterative_mapping/iterative_map.xml Iterative_mapping/log.txt Iterative_mapping/map_ex.py Iterative_mapping/rRNA.txt Iterative_mapping/read_file.py Iterative_mapping/read_s_file.py Iterative_mapping/remove_map.py Iterative_mapping/sample.fasta Iterative_mapping/seq_track.py Iterative_mapping/truncate.py Iterative_mapping/unmap.py get_reads/.DS_Store get_reads/get_read.py get_reads/get_read.xml get_reads/read_file.py get_reads/test.bam predict/.DS_Store predict/id_list_test.txt predict/log.txt predict/parse_dis_pac.py predict/predict_RNAs.py predict/predict_RNAs.xml predict/rRNA.txt predict/read_file.py predict/rtts_plot.py predict/test_reactivity.txt predict/test_reference.fa reactivity_cal/dis_f_N1Am_rrna.txt reactivity_cal/dis_f_N1Ap_rrna.txt reactivity_cal/parse_dis_react.py reactivity_cal/rRNA.txt reactivity_cal/react_cal.py reactivity_cal/react_norm_function.py reactivity_cal/reactivity_calculation.xml reactivity_cal/read_file.py |
diffstat | 37 files changed, 0 insertions(+), 2259 deletions(-) [+] |
line wrap: on
line diff
--- a/Iterative_mapping/iterative_map.py Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,122 +0,0 @@ -#!/usr/bin/env python -# -*- coding: utf-8 -*- - -import sys -import os -from read_file import * -from read_s_file import * -import random -import string - -type_input = sys.argv[1] -seq_file = sys.argv[2] -ref_file = sys.argv[3] -shift = sys.argv[4] -length = sys.argv[5] -t_end = sys.argv[6] -map_type = sys.argv[7] -output_file = sys.argv[8] - - -if map_type!="default": - s = "" - sm = "" - s = s+"-v "+sys.argv[9] - sm = sm+"-v "+sys.argv[9] - sm = sm+" -5 "+sys.argv[10] - sm = sm+" -3 "+sys.argv[11] - s = s+" -k "+sys.argv[12] - sm = sm+" -k "+sys.argv[12] - if sys.argv[13]: - s = s+" -a" - sm = sm+" -a" - if int(sys.argv[14])>=1: - s = s+" -m "+sys.argv[14] - sm = sm+" -m "+sys.argv[14] - if sys.argv[15]: - s = s+" --best --strata " - sm = sm+" --best --strata " - -else: - s = "-v 3 -a --best --strata " - sm = "-v 3 -a --best --strata " - -ospath = os.path.realpath(sys.argv[0]) -ost = ospath.split('/') -syspath = "" -for i in range(len(ost)-1): - syspath = syspath+ost[i].strip() - syspath = syspath+'/' - -syspathrs = os.getcwd() - -os.system("bowtie-build -f "+ref_file+" "+syspathrs+"ref > "+syspathrs+"log.txt") - -os.system("cp "+seq_file+" "+syspathrs+"seq0.fa") - -if type_input == "fasta": - tp = 'fasta' -if type_input == "fastq": - tp = 'fastq' - -k = 0 - -if type_input == "fasta": - os.system("bowtie "+sm+"-f "+syspathrs+"ref"+" "+syspathrs+"seq"+str(k)+".fa --quiet -S > "+syspathrs+"map"+str(k)+".sam") -if type_input == "fastq": - os.system("bowtie "+sm+"-q "+syspathrs+"ref"+" "+syspathrs+"seq"+str(k)+".fa --quiet -S > "+syspathrs+"map"+str(k)+".sam") - -while(True): - os.system("samtools view -Sb -F 0xfff "+syspathrs+"map"+str(k)+".sam > "+syspathrs+"mapped"+str(k)+".bam 2>"+syspathrs+"log.txt") #get mapped reads - os.system("samtools view -Sb -f 0x4 "+syspathrs+"map"+str(k)+".sam > "+syspathrs+"umapped"+str(k)+".bam 
2>"+syspathrs+"log.txt") #get unmapped reads - os.system("samtools view -Sb -f 0x10 "+syspathrs+"map"+str(k)+".sam > "+syspathrs+"rmapped"+str(k)+".bam 2>"+syspathrs+"log.txt") #get reversed mapped reads - os.system("samtools merge -f "+syspathrs+"unmapped"+str(k)+".bam "+syspathrs+"umapped"+str(k)+".bam "+syspathrs+"rmapped"+str(k)+".bam") #get reversed mapped reads - os.system("samtools view -h -o "+syspathrs+"unmapped"+str(k)+".sam "+syspathrs+"unmapped"+str(k)+".bam") #get reversed mapped reads - if k>0: - os.system("samtools view -h -o "+syspathrs+"mapped"+str(k)+".sam "+syspathrs+"mapped"+str(k)+".bam") #get reversed mapped reads - os.system("cut -f 1 "+syspathrs+"unmapped"+str(k)+".sam > "+syspathrs+"unmapped"+str(k)+".txt") - os.system("cut -f 1 "+syspathrs+"mapped"+str(k)+".sam > "+syspathrs+"mapped"+str(k)+".txt") - os.system("python "+syspath+"remove_map.py "+syspathrs+"unmapped"+str(k)+".txt "+syspathrs+"mapped"+str(k)+".txt "+syspathrs+"runmapped"+str(k)+".txt") - os.system("rm "+syspathrs+"mapped"+str(k)+".sam") - os.system("rm "+syspathrs+"mapped"+str(k)+".txt") - os.system("rm "+syspathrs+"unmapped"+str(k)+".txt") - else: - os.system("cut -f 1 "+syspathrs+"unmapped"+str(k)+".sam > "+syspathrs+"runmapped"+str(k)+".txt") - - os.system("rm "+syspathrs+"unmapped"+str(k)+".bam") - os.system("rm "+syspathrs+"umapped"+str(k)+".bam") - os.system("rm "+syspathrs+"rmapped"+str(k)+".bam") - os.system("python "+syspath+"seq_track.py "+syspathrs+"runmapped"+str(k)+".txt "+syspathrs+"seq"+str(k)+".fa "+syspathrs+"unmap_seq"+str(k)+".fa "+tp) #get unmapped sequence - os.system("python "+syspath+"truncate.py "+syspathrs+"unmap_seq"+str(k)+".fa "+shift+" "+syspathrs+"seq"+str(k+1)+".fa "+length+" "+t_end) #truncate unmapped sequence - os.system("rm "+syspathrs+"seq"+str(k)+".fa") #Remove sequences being mapped - os.system("rm "+syspathrs+"map"+str(k)+".sam") #Remove mapping file - os.system("rm "+syspathrs+"unmap_seq"+str(k)+".fa") #Remove unmapped sequnce - 
os.system("rm "+syspathrs+"runmapped"+str(k)+".txt") - os.system("rm "+syspathrs+"unmapped"+str(k)+".sam") - - os.system("wc -l "+syspathrs+"seq"+str(k+1)+".fa > "+syspathrs+"count"+str(k+1)+".txt") - c = read_sp_file(syspathrs+"count"+str(k+1)+".txt") - if c[0][0] == '0': #If no reads is in the sequence file, stop - os.system("rm "+syspathrs+"count"+str(k+1)+".txt") - os.system("rm "+syspathrs+"seq"+str(k+1)+".fa") - break - os.system("rm "+syspathrs+"count"+str(k+1)+".txt") - k = k+1 - if type_input == "fasta": - os.system("bowtie "+s+"-f "+syspathrs+"ref"+" "+syspathrs+"seq"+str(k)+".fa --quiet -S > "+syspathrs+"map"+str(k)+".sam") - if type_input == "fastq": - os.system("bowtie "+s+"-q "+syspathrs+"ref"+" "+syspathrs+"seq"+str(k)+".fa --quiet -S > "+syspathrs+"map"+str(k)+".sam") - - -ss = "" -for i in range(0,k+1): - ss = ss+" "+syspathrs+"mapped"+str(i)+".bam" - - -os.system("samtools merge -f "+output_file+" "+ss) -#print("samtools merge mapped_all.bam"+ss) -os.system("rm "+syspathrs+"mapped*.bam") -os.system("rm "+syspathrs+"ref*") -#os.system("rm -r "+syspathrs) - -
--- a/Iterative_mapping/iterative_map.xml Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,96 +0,0 @@ -<tool id="iterative_map_pipeline" name="Iterative Mapping" version="1.0"> - <description></description> - <command interpreter="python"> - #if $mapping_file.type == "user" - iterative_map.py $file_format.type $file_format.seq_file $reference_file $shift $length $t_end $mapping_file.type $output $mapping_file.param_v $mapping_file.param_five $mapping_file.param_three $mapping_file.param_k $mapping_file.param_a $mapping_file.param_m $mapping_file.param_best - #else - iterative_map.py $file_format.type $file_format.seq_file $reference_file $shift $length $t_end $mapping_file.type $output - #end if - </command> - <requirements> - <requirement type="package" version="1.61">biopython</requirement> - <requirement type="package" version="1.7.1">numpy</requirement> - <requirement type="package" version="0.1.18">samtools</requirement> - <requirement type="package" version="0.12.7">bowtie</requirement> - </requirements> - <inputs> - <conditional name="file_format"> - <param name="type" type="select" label="File format of the reads (Default FASTQ)"> - <option value="fastq">FASTQ</option> - <option value="fasta">FASTA</option> - </param> - <when value="fastq"> - <param name="seq_file" type="data" format="fastq" label="Fastq file"/> - </when> - <when value="fasta"> - <param name="seq_file" type="data" format="fasta" label="Fasta file"/> - </when> - </conditional> - <param name="reference_file" type="data" format="fasta" label="Reference genome/transcriptome"/> - <param name="shift" type="integer" value="1" label="Number of nucleotides trimmed each round"/> - <param name="length" type="integer" value="21" label="Minimum requirement of read length for mapping"/> - <param name="t_end" type="select" label="Trim from 5' or 3' end"> - <option value="five_end">5' end</option> - <option value="three_end">3' end</option> - </param> - - <conditional 
name="mapping_file"> - <param name="type" type="select" label="Bowtie mapping flags (Default -v 0 -a --best --strata)"> - <option value="default">Default</option> - <option value="user">User specified</option> - </param> - <when value="default"/> - <when value="user"> - <param name="param_v" type="integer" value="0" label="Number of mismatches for SOAP-like alignment policy (-v)"/> - <param name="param_five" type="integer" value="0" label="Trim n bases from high-quality (left) end of each read before alignment (-5)"/> - <param name="param_three" type="integer" value="0" label="Trim n bases from high-quality (right) end of each read before alignment (-3)"/> - <param name="param_k" type="integer" value="1" label="Report up to n valid alignments per read (-k)"/> - <param name="param_a" type="boolean" checked="False" truevalue = "1" falsevalue = "0" label="Whether or not to report all valid alignments per read (-a)"/> - <param name="param_m" type="integer" value="-1" label="Suppress all alignments for a read if more than n reportable alignments exist (-m), -1 for unlimited"/> - <param name="param_best" type="boolean" checked="False" truevalue = "1" falsevalue = "0" label="Whether or not to make Bowtie guarantee that reported singleton alignments are 'best' in terms of stratum and in terms of the quality values at the mismatched positions (--best --strata)"/> - </when> - </conditional> - - </inputs> - <outputs> - <data name="output" type="data" format="bam"/> - </outputs> - <tests> - <test> - <param name="file_format.type" value="fasta" /> - <param name="file_format.seq_file" value="sample.fasta" /> - <param name="reference_file" value="rRNA.txt" /> - <param name="shift" value="1" /> - <param name="length" value="21" /> - <param name="mapping_file.type" value="default" /> - <output name="output" file="mapped.out" /> - </test> - </tests> - - <help> - - -**TIPS**: - ------ - -**Input**: - -* 1. Sequence file type (FASTA/FASTQ) -* 2. 
Sequence file (fasta/fastq format) -* 3. Reference file (fasta) used to map the reads to -* 4. “Shift” (The length of the sequence that will be trimmed at the 3’end of the reads before each round of mapping) -* 5. “Length” (The minimum length of the reads for mapping after trimming) -* [Optional] -* 1. Bowtie mapping flags (options) [Default: -v 0 -a --best --strata] (-v flag indicates the number of allowed mismatches. Use -5/-3 flag to trim the nucleotides from 5'/3' end of the reads) - ------ - -**Output**: - -A bam file with all of the reads that are mapped - - - - </help> -</tool>
--- a/Iterative_mapping/log.txt Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,1 +0,0 @@ -[samopen] SAM header is present: 4 sequences.
--- a/Iterative_mapping/map_ex.py Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,31 +0,0 @@ -#!/usr/bin/env python -# -*- coding: utf-8 -*- - -import sys -from read_file import * -from Bio import SeqIO - -map_file = sys.argv[1] -result_file = sys.argv[2] - - -#reads = read_t_file(read_file); - -f = open(map_file); -h = file(result_file, 'w') - -for aline in f.readlines(): - tline = aline.strip(); - tl = tline.split('\t'); - if len(tl)>4: - if int(tl[1].strip())== 0: - h.write(tline) - h.write('\n') - - -f.close(); -h.close() - - - -
--- a/Iterative_mapping/rRNA.txt Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,8 +0,0 @@ ->25s rRNA 3375nts -GCGACCCCAGGTCAGGCGGGATTACCCGCTGAGTTTAAGCATATCAATAAGCGGAGGAAAAGAAACTAACAAGGATTCCCTTAGTAACGGCGAGCGAACCGGGAAGAGCCCAGCTTGAAAATCGGACGTCTTCGGCGTTCGAATTGTAGTCTGGAGAAGCGTCCTCAGCGACGGACCGGGCCTAAGTTCCCTGGAAAGGGGCGCCAGAGAGGGTGAGAGCCCGTCGTGCCCGGACCCTGTCGCACCACGAGGCGCTGTCTACGAGTCGGGTTGTTTGGGAATGCAGCCCCAATCGGGCGGTAAATTCCGTCCAAGGCTAAATACGGGCGAGAGACCGATAGCGAACAAGTACCGCGAGGTAAAGATGAAAAGGACTTTGAAAAGAGAGTCAAAGAGTGCTTGAAATTGTCGGGAGGGAAGCGGATGGGGGCCGGCGATGCGTCCTGGTCGGATGCGGAACGGAGCAATCCGGTCCGCCGATCGATTCGGGGCGTGGACCGACGCGGATTACGGTGGCGGCCTAAGCCCGGGCTTTTGATACGCTTGTGGAGACGTCGCTGCCGTGATCGTGGTCTGCAGCACGCGCCTAACGGCGTGCCTCGGCATCAGCGTGCTCCGGGCGTCGGCCTGTGGGCTCCCCATTCGACCCGTCTTGAAACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAACGGGTGAGTAAACCCGTAAGGCGCAAGGAAGCTGATTGGCGGGATCCTCGCGGGTGCACCGCCGACCGACCTTGATCTTCTGAGAAGGGTTCGAGTGTGAGCATGCCTGTCGGGACCCGAAAGATGGTGAACTATGCCTGAGCGGGGTAAAGCCAGAGGAAACTCTGGTGGAAGCCCGCAGCGATACTGACGTGCAAATCGTTCGTCTGACTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGAGCTCGGACGCGAGTTCTATCGGGTAAAGCCAATGATTAGAGGCATTGGGGGCGCAACGCCTCGACCTATTCTCAAACTTTAAATAGGTAGGACGTGTCGGCTGCTTTGTTGAGCCGTCACACGGAATCGAGAGCTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGGAAGCCGGGTTACGGTGCCCAACTGCGCGCTAACCTAGAACCCACAAAGGGTGTTGGTCGATTAAGACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTTAAGCGCGACCTATACCCGGCCGTCGGGGCAAGAGCCAGGCCTCGATGAGTAGGAGGGCGCGGCGGTCGCTGCAAAACCTAGGGCGCGAGGCGCGGAGCGGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGGCCGAAGAGGGGAAAGGTTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGAGTCGGGGGAAACCCGTCTGATAGCGCTTAAGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCGGAACCGGGACGTGGCGGTTGACGGCAACGTTAGGGAGTCCGGAGACGTCGGCGGGGGCCTCGGGAAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCCTGGAAACGGCTCAGCCGGAGGTAGGGTCCAGCGGCTGGAAGAGCACCGCACGTCGCGTGGTGTCCGGTGCGCCCCCGGGCGCCCTTGAAAATCCGGAGGACCGAGTGCCGCTCACGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGG
TGAACAGCCTCTGGTCGATGGAACAATGTAGGCAAGGGAAGTCGGCAAAATGGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGGCTGGGCTCGGGGGTCCCAGTTCCGAACCCGTCGGCTGTCAGCGGACTGCTCGAGCTGCTTCCGCGGCGAGAGCGGGTCGCCGGCTGCCGGCCGGGGGACGACTGGGAACGGCTCTCTCGGGAGCTTTCCCCGGGCGTCGAACAGTCAGCTCAGAACTGGTACGGACAAGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGTCCCTGCGGATGCTAACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTGTCTACTATCCAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGGATAAGTGGGAGCTTCGGCGCAAGTGAAATACCACTACTTTTAACGTTATTTTACTTACTCCGTGAATCGGAGGCCGGGGTACAACCCCTGTTTTTGGTCCCAAGGCTCGCTTCGGCGGGTCGATCCGGGCGGAGGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGCTCGTTTGATTCTGATTTTCAGTACGAATACGAACCGTGAAAGCGTGGCCTATCGATCCTTTAGACTTCGGAATTTGAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGCCCGCGTCGCGATAGTAATTCAACCTAGTACGAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTGCGCTGGATTATGACTGAACGCCTCTAAGTCAGAATCCGGGCTAGAAGCGACGCATGCGCCCGCCGCCCGATTGCCGACCCTCAGTAGGAGCTTAGGCTCCAAAGGCACGTGTCGTTGGCTAAGTCCGTTCGGCGGAACGGTCGTTCGGACCGCCTTGAATTATAATTACCACCGAGCGGCGGGTAGAATCCTTTGCAGACGACTTAAATACGCGACGGGGTATTGTAAGTGGCAGAGTGGCCTTGCTGCCACGATCCACTGAGATTCAGCCCTTTGTCGCTAAGATTCGA ->gi|20197903:2706-4513 Arabidopsis thaliana chromosome 2 BAC F23H14 genomic sequence, complete sequence 
-TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTGTAAGTATGAACGAATTCAGACTGTGAAACTGCGAATGGCTCATTAAATCAGTTATAGTTTGTTTGATGGTAACTACTACTCGGATAACCGTAGTAATTCTAGAGCTAATACGTGCAACAAACCCCGACTTATGGAAGGGACGCATTTATTAGATAAAAGGTCGACGCGGGCTCTGCCCGTTGCTCTGATGATTCATGATAACTCGACGGATCGCATGGCCTCTGTGCTGGCGACGCATCATTCAAATTTCTGCCCTATCAACTTTCGATGGTAGGATAGTGGCCTACCATGGTGGTAACGGGTGACGGAGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCTGACACGGGGAGGTAGTGACAATAAATAACAATACTGGGCTCTTTCGAGTCTGGTAATTGGAATGAGTACAATCTAAATCCCTTAACGAGGATCCATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTTAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAACCTTGGGATGGGTCGGCCGGTCCGCCTTTGGTGTGCATTGGTCGGCTTGTCCCTTCGGTCGGCGATACGCTCCTGGTCTTAATTGGCCGGGTCGTGCCTCCGGCGCTGTTACTTTGAAGAAATTAGAGTGCTCAAAGCAAGCCTACGCTCTGGATACATTAGCATGGGATAACATCATAGGATTTCGATCCTATTGTGTTGGCCTTCGGGATCGGAGTAATGATTAACAGGGACAGTCGGGGGCATTCGTATTTCATAGTCAGAGGTGAAATTCTTGGATTTATGAAAGACGAACAACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTGGGGGCTCGAAGACGATCAGATACCGTCCTAGTCTCAACCATAAACGATGCCGACCAGGGATCAGCGGATGTTGCTTATAGGACTCCGCTGGCACCTTATGAGAAATCAAAGTTTTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTTACCAGGTCCAGACATAGTAAGGATTGACAGACTGAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGTTAATGAACGAGACCTCAGCCTGCTAACTAGCTACGTGGAGGCATCCCTTCACGGCCGGCTTCTTAGAGGGACTATGGCCGTTTAGGCCAAGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGATGTATTCAACGAGTTCACACCTTGGCCGACAGGCCCGGGTAATCTTTGAAATTTCATCGTGATGGGGATAGATCATTGCAATTGTTGGTCTTCAACGAGGAATTCCTAGTAAGCGCGAGTCATCAGCTCGCGTTGACTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTCCTACCGATTGAATGATCCGGTGAAGTGTTCGGATCGCGGCGACGTGGGTGGTTCGCCGCCCGCGACGTCGCGAGAAGTCCACTAAACCTTATCATTTAGAGGAAGGAGAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTG ->Arabidopsis thaliana 1 -GGATGCGATCATACCAGCACTAATGCACCGGATCCCATCAGAACTCCGCAGTTAAGCGTGCTTGGGCGAGAGTAGTACTAGGATGGGTGACCTCCTGGGAAGTCCTCGTGTTGCATCCCTC ->gi|186498419|ref|NR_022453.1| 
Arabidopsis thaliana (AT2G01020) rRNA -AAAACGACTCTCGGCAACGGATATCTCGGCTCTCGCATCGATGAAGAACGTAGCGAAATGCGATACTTGGTGTGAATTGCAGAATCCCGTGAACCATCGAGTCTTTGAACGCAAGTTGCGCCCCAAGCCTTCTGGCCGAGGGCACGTCTGCCTGGGTGTCACAA \ No newline at end of file
--- a/Iterative_mapping/read_file.py Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,21 +0,0 @@ -#!/usr/bin/env python -# -*- coding: utf-8 -*- - -import sys - - - -def read_t_file(in_file): - f = open(in_file); - result = []; - for aline in f.readlines(): - temp = []; - tline = aline.strip(); - tl = tline.split('\t'); - for i in range(0, len(tl)): - temp.append(tl[i].strip()); - result.append(temp); - f.close(); - return result; - -
--- a/Iterative_mapping/read_s_file.py Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,22 +0,0 @@ -#!/usr/bin/env python -# -*- coding: utf-8 -*- - -import sys - - - -def read_sp_file(in_file): - f = open(in_file); - result = []; - for aline in f.readlines(): - temp = []; - tline = aline.strip(); - tl = tline.split(' '); - for i in range(0, len(tl)): - if len(tl[i].strip())>0: - temp.append(tl[i].strip()); - result.append(temp); - f.close(); - return result; - -
--- a/Iterative_mapping/remove_map.py Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,29 +0,0 @@ -#!/usr/bin/env python -# -*- coding: utf-8 -*- - -import sys -from read_file import * - - -unmap_file = sys.argv[1] -map_file = sys.argv[2] -result_file = sys.argv[3] - - -unmap = read_t_file(unmap_file) -mapped = read_t_file(map_file) -h = file(result_file, 'w') - -maps = set() -for i in range(len(mapped)): - maps.add(mapped[i][0]) - - -for i in range(len(unmap)): - name = unmap[i][0] - if name not in maps: - h.write(name) - h.write('\n') - - -h.close()
--- a/Iterative_mapping/sample.fasta Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,1000 +0,0 @@ ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1415:1662#0/1 -TCATTCATCCATTTCCAGTGCTCAGCTAACCCCAACT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1359:1735#0/1 -TGCTGGCGACGCATCATTCAAATTTCTGCCCTATCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1469:1743#0/1 -TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1750:1642#0/1 -AACCGGGACGTGGCGGTTGACGGCAACGTTAGGGAGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1899:1627#0/1 -AAAAACGACTCTCGGCAACGGATATCTCGGCTCTCGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1859:1668#0/1 -TACGCTCCTGGTCTTAATTGGCCGGGTCGTGCCCCCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1830:1700#0/1 -ATTTCGATCCTATTGTGTTGGCCTTCGGGATCGGAGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2000:1705#0/1 -TTAATGATTAACAGGGACAGTCGGGGGCATTCGTATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2149:1632#0/1 -GATCATACATTACTGACTAAAAGAAGCAAAATCTTGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2052:1637#0/1 -AGAACATGAAACCGTAAGCTCCCAAGCAGTGGGAGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2036:1706#0/1 -AAAACTTAGCTGAGACGACGCAGAAACAGGTGAGATC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2183:1706#0/1 -TTCGAATTGTAGTCTGGAGAAGCGTCCTCAGCGACGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2068:1721#0/1 -AAGTAGCACGTCCCTCAGGAAAGAAGCTCTTCAGATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2162:1740#0/1 -ATTAATCAAGAACGAAAGTTGGGGGCTCGAAGACGGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2339:1628#0/1 -TGACGGCAACGTTAGGGAGTCCGGAGACGTCGGCCGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2338:1670#0/1 -TCGCGCGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2459:1678#0/1 -CCTCGTCGCTGCGTCTCTCTCCCGCAACCTTCGATTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2492:1685#0/1 -AAAACGATGCCGACCAGGGATCAGCGGATGTTGCTTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2286:1687#0/1 -AAGGCGGTGGAGGCCGCCCAGCATTGCCCGCACCTAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2283:1704#0/1 
-ACTCTTGTTACAATGATTGTATGACATTCCTGATGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2475:1719#0/1 -TTATGCAGAAATTGCTATAAGAAGAAACCTAAACTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2299:1733#0/1 -CTGTGAAACTGCGAATGGCTCATTAAATCAGTTATAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2464:1744#0/1 -GTGTTTTTATCCAAATCCGGGGATAAACACATTTTGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2547:1662#0/1 -AGAACGAAAGTTGGGGGCTCGAAGACGATCAGATACC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2512:1664#0/1 -TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2675:1664#0/1 -GTACAGATCGGAAGAGCACACGTCTGAACTCCAGTCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2694:1675#0/1 -ACTACGAGAGGAACCGTTGATTCGCACAATTGGTCAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2558:1692#0/1 -ATCTTTCATATCCAGAGAGAGAGAAAGAGAACAAAAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2587:1709#0/1 -CAACCGTGAAAGCGTGGCCTATCGATCCTTTAGACCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2560:1727#0/1 -TTTCCGAGAGTATGCAGATTTTGTTTTCCAAGAATAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2960:1646#0/1 -CTTGCACATGGGTTAGTCGATCCTAAGAGTCGGGGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2981:1669#0/1 -GATTCATCCCAAAACATTACAAAACGTTACAATGGCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2884:1740#0/1 -TCTCGCGCTTGTACGGCTTTGGCTCGGATTCGTCCGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3172:1696#0/1 -TCGAGTCTGGTAATTGGAATGAGTACAATCTAAATCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3046:1703#0/1 -AGCGTCCTCAGCGACGGACCGGGCCTAAGTTCCCTGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3218:1717#0/1 -TCTCGCGCTTGTACGGCTTTGGCTCGGATTCGTCCGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3140:1732#0/1 -ATAAGAAGGTTATTGATTTGGTTAAAGAATACAATGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3212:1744#0/1 -TCCTGGTCTTAATTGGCCGGGTCGTGGCCCCCGCGCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3277:1654#0/1 -TACTCGGATAACCGTAGTAATTCTAGAGCTAATACGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3373:1695#0/1 -CGTTTAGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3255:1702#0/1 
-ACGCGGGCTCTGCCCGTTGCTCTGATGATTCATGATA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3391:1733#0/1 -AAATAGAAGGGTCAAAAGCTAAGGAAGAAAAGAAAGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3606:1635#0/1 -TTTTCATTAATCAAGAACGAAAGTTGGGGGCTCGAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3710:1652#0/1 -CCCCGTGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3551:1662#0/1 -AGAACATGAAACCGTAAGCTCCCAAGCAGTGGGAGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3696:1663#0/1 -ACGCATTTATTAGATAAAAGGTCGACGCGGGCTCTGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3679:1667#0/1 -ACGGGGGGCAGCAGTGGGGAATCTTGGACAATGGGCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3622:1671#0/1 -TCATCCAATTGGAGACGAATCATATCGAGCGATGGAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3506:1682#0/1 -TGCGTTGTGGAAGTCGAAGAGGTTGATGAATATTGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3540:1687#0/1 -AAATTAAACCTCACCGACGGATTCAATTCTCTCGTTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3627:1725#0/1 -TCATCCAGATCTCAACTTTCTCTCATCTTCAAATTAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3710:1735#0/1 -GCGACCCCAGGTCAGGCGGGATTACCCGCTGAGTTTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3787:1636#0/1 -AGAACGAAAGTTGGGGGCTCGAAGACGATCAGATACC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3996:1694#0/1 -AACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3942:1696#0/1 -TGTGCTGGCGACGCATCATTCAAATTTCTGCCCTATC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4104:1635#0/1 -AGGTCGGCGGTTCCATCACCACAACGCCGGACGACAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4243:1713#0/1 -AGATACTCCTTTGACCGAAGAAACCATAACGGAAGCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4091:1714#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4229:1733#0/1 -GGGCCTGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4060:1745#0/1 -TGACTGTGAAACTGCGAATGGCTCATTAAATCAGTTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4308:1693#0/1 -TCCTCGGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4384:1697#0/1 
-AAAATTTCATCGTGATGGGGATAGATCATTGCAATTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4506:1651#0/1 -GATAATAAAGAGATGGAGATTGTTTTGGAGCAACGGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4535:1654#0/1 -AAAAAGGGTAAAAGCTCGTTTGATTCTGATTTTCAGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4592:1677#0/1 -CTACCTGGTTAATCCTGCCAGTAGTCATATGCTTGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4726:1686#0/1 -TATGTTTTTGTTTGTTCGTAAATTCTTGACATCACTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4544:1694#0/1 -TGGAGCTCCGCTGAATTTTCTTTGCTCCATTTCCGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4604:1707#0/1 -TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4996:1665#0/1 -CTTATTTTACGAAGCTCCCCTCGGTTACAGCATTGAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4860:1668#0/1 -AGCGGCTGGAAGAGCACCGCACGTCGCGTGGTGTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4786:1671#0/1 -TATGAAAGACGAACAACTGCGAAAGCATTTGCCAAGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4889:1691#0/1 -ATGGGGGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4843:1693#0/1 -AGGCAGTCCGATCCAACGGCTAGGCACTTACATGGCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4977:1703#0/1 -ATTAGATAAAAGGTCGACGCGGGCTCTGCCCGTTGCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4791:1723#0/1 -TTGTGTTGGCCTTCGGGATCGGAGTAATGATTAACAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5019:1686#0/1 -ACAATGGAGCAACCACTCCTTCCGGCCTCGTCGCCGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5134:1686#0/1 -TCTGCTGTTGTAGAGCCTTACAACAGTGTGCTTTCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5307:1664#0/1 -ACGTGCGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5278:1674#0/1 -GCATCAAAATCCTCCGACGATGACAACCATAGCTGCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5486:1715#0/1 -TTGTGGTGGCGACGCATCATTCAAATTTCTGCCCTAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5541:1641#0/1 -TTCTCCCCGAAATGCGTTGAGGCGCAGCAGTTGACTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5706:1646#0/1 -ACGAGGATCCATTGGAGGGCAAGTCTGGTGCCTGCAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5593:1651#0/1 
-AAGGGGCTTCTTGTCATTGATGATGAGCTAGCCACCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5503:1695#0/1 -GAGAGGGAACTAATCATAAGAGATGCAATGAGTGTGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5581:1706#0/1 -ATAAAAACCAGAAGAATCCGTATAAATTATCCTAACA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5713:1729#0/1 -TCTCTTGGAGAGTTCGATCCTGGCTCAGGATGAACGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5831:1656#0/1 -TTCACGTGGCTCAAGTCACTAGCAATGCTCTTGCTTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5942:1680#0/1 -TCCGGTGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5772:1711#0/1 -AGCGCGAACTTCGAAAGGGGATCTGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5957:1723#0/1 -TTACAATAAGTCTGCCTATAGTGGGAGAGGTGACAGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5981:1739#0/1 -GAGAAATTTGGAGTTTCGCCGGAATCTTCCTCTGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6231:1644#0/1 -AATTGGAAAAGGTGGAGGAGTTGGCGGTGGCATCGGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6152:1724#0/1 -TGCAATTCTACCACGACCTCATCGACGAGCTCATAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6100:1731#0/1 -TCCTCTGCGTTTTCACGAAACAGAGAACCTTATCGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6174:1733#0/1 -TCGAATTGTAGTCTGGAGAAGCGTCCTCAGCGACGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6310:1648#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6287:1659#0/1 -TCAACGAGTTCACACCTTGGCCGACAGGCCCGGGTAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6332:1666#0/1 -TTTGGGTTCTCTCCTTATAGTTTGATGAACATTGTTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6295:1704#0/1 -AGATAATCGGAACCTTCGTCCTTGTCTACACGGTCTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6590:1655#0/1 -AGAAGCCACCTCCGGTTCCGGTTTACAAGCCCCCGCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6585:1691#0/1 -CTTTTCCCAGAGAAGAAGCAATGACGGTATCTGGGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6722:1719#0/1 -AACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6820:1642#0/1 -AAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7000:1662#0/1 
-GGGAAGCGTTGAGGCTTCACCCTCCACTCATCGTGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6873:1673#0/1 -AGCACTTTAGGATGGCATAGCCTTAAAGTTAAGGGTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6770:1699#0/1 -AACTGTCTACAAAATCATTGAAGATCTACCCAAAAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6782:1735#0/1 -GATCCGTCAAATTCAATTGATCCTCTCTCCAAATCAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7159:1658#0/1 -ACCCACCTCCGGTTCCGGTTTACAAGCCACCGCCAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7183:1660#0/1 -ATTTCATCGTGATGGGGATAGATCATTGCAATTGTTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7167:1679#0/1 -TTCTGCCTCCGGCGCTGTTACTTTGAAGAAATTAGAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7223:1688#0/1 -TTGGACGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7410:1647#0/1 -ACCATGCAGTATCGGTTTATATAACATCCACATTGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7387:1710#0/1 -TCTTCGAGTTTTGCTACTTGTATGGGATGATAAGACT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7397:1741#0/1 -TTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7624:1680#0/1 -AATTGTTGTTGTTATCTTCAACGATAGCGTTGTGCTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7600:1744#0/1 -AGTTGTTGCAGTTAAAAAGCTCGTAGTTGAACCTTGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7789:1676#0/1 -ACCCGTCTGATAGCGCTTAAGCGCGAACTTCGAAAGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7950:1684#0/1 -TGAACGAGACCTCAGCCTGCTAACTAGCTACGTGGAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7926:1706#0/1 -ACGGTATCTGGGGAATAAGCATCGGCTAACTCTGTGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7757:1711#0/1 -TTGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:7970:1747#0/1 -TCGAAAGGGGATCCGGTTAAAATTCCGGAACCGGGAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8054:1672#0/1 -CGAAAGGGGATCCGGTTAAAATTCCGGAACCGGGACG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8245:1672#0/1 -GATATATAATCATAGATTCCAGAATTTGACATTTTCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8088:1710#0/1 -GAAAGTTGGGGGCTCGAAGACGATCAGATACCGTCCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8244:1713#0/1 
-GGGACGCATTTATTAGATAAAAGGTCGACGCGGGCTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8069:1727#0/1 -TCGTCTACACCGTCTACGCCACAGCCGTTGACCCCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8018:1745#0/1 -TTCTCTACTGGATTGCTCAGCTTCTTGGCTCCGTCGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8394:1647#0/1 -CTACAAGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8475:1658#0/1 -ACACTTGATCGGAATAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8367:1664#0/1 -GGGTGAGTAAACCCGTAAGGCGCAAGGAAGCTGATTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8488:1695#0/1 -GCGACCCCAGGTCAGGCGGGATTACCCGCTGAGTTTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8442:1727#0/1 -CGGTCGGCGATACGCTCCTGGTCTTAATTGGCCGGGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8328:1744#0/1 -TTGTCATTCTCTTCGCCGGAATCTAATCTCTCTCGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8520:1660#0/1 -TTGGCCGTTGTTTCCTTCTTCTTCTTCTTCTTCTTTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8563:1665#0/1 -AATTCAAATTTCTGCCCTATCAACTTTCGATGGTAGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8739:1667#0/1 -TCTCTCGGGAGCTTTCCCCGGGCGTCGAACAGTCAGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8596:1682#0/1 -TAGCCCACGAATGCGGTCACAACGCATTCAGCGACTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8643:1688#0/1 -TTGCACGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8727:1745#0/1 -AGGGAGAGCTAATGCTTCTTGGGTATTTAGGTTTGAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8767:1649#0/1 -TCGGTACCAAATCGAGGCAAACTCTGAATACTAGATA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8932:1656#0/1 -GCTGGCGACGCATCATTCAAATTTCTGCCCTATCAAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8841:1666#0/1 -TCAAACGAGGAAAGGCTTACGGTGGATACCTAGGCAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8951:1673#0/1 -TGGTGGAGCTGGAGGAGGATTTGGTGGAGGAGCTGGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8876:1674#0/1 -AACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:8993:1737#0/1 -TTACCGTGCGCTGGATTATGACTGAACGCCTCTAAGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:9241:1664#0/1 
-AAGTCACTCTTTCTTGTTGCCTTACTTGTCGGCTCTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:9095:1710#0/1 -AGAACGAAAGTTGGGGGCTCGAAGACGATAAGATACC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:9231:1716#0/1 -TCGAAAGTTGGGGGCTCGAAGACGATCAGATACCGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:9171:1733#0/1 -AAAATTTCTGCCCTATCAACTTTCGATGGTAGGATAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:9471:1658#0/1 -GACACATACACACATAGCCATGGCCTCTTCTTTCTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:9383:1680#0/1 -TTCAGTGTTGATTCGTCTTCCTTCACGCCGTTCTTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:9627:1730#0/1 -ATTGTTTGTAAAGGGTGAGAGATTATTTTTCAGTGAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:9921:1680#0/1 -ATGGCTTCTCCGGTGAGATACCTGACTCGATTGGTTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:9931:1727#0/1 -AAAGCATCGGCTAACTCTGTGCCAGCAGCCGCGGTAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10235:1668#0/1 -AAAAATCTTGAGTAAAAACAAATTTTCCTGTATCTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10040:1686#0/1 -AAAACCCGTCTGATAGCGCTTAAGCGCGAACTTCGAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10169:1689#0/1 -ACGGATCGCATGGCCTCTGTGCTGGCGACGCATCATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10213:1743#0/1 -GGCGCTTAAGCGCGCGACCTATACCCGGCCGTCGGGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10021:1744#0/1 -CAAAGCAAGCCTACGCTCTGGATACATTAGCATGGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10294:1712#0/1 -TTCTCTCTCTAACATTCTTCAGAGAGGGAGACTTTAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10392:1736#0/1 -TAGAGTGCTCAAAGCAAGCCTACGCTCTGGATACATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10582:1655#0/1 -ACGGTACTGGACAATGTGGAAGCTTCCCTTGTTCGGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10777:1673#0/1 -CACTCTCACCCACAAGTTAGTCATAAAAAAAAAAAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10980:1714#0/1 -GTGGAGAGACTGAAAACCGCGAAGAGGATGTGAATGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:10931:1720#0/1 -TTGTAGTCTGGAGAAGCGTCCTCAGCGACGGACCGGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11171:1717#0/1 -TGTGCTGGCGACGCATCATTCAAATTTCTGCCCTATC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11458:1668#0/1 
-GATCACAAGTTTTAAGCAGTATTTGTAAGAAAATGGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11388:1696#0/1 -TTGTGCTGGCGACGCATCATTCAAATTTCTGCCCTAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11317:1701#0/1 -ACAACTCAAGCTTCCATCAACTTGACCCACACCGAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11403:1706#0/1 -TAGATAACATCAAGACAACAACCGTCGGTCCCGGAAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11291:1739#0/1 -GAAAATCAAATCTTTTCATTTACAATTATCTTTCTTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11593:1673#0/1 -TCCCTTCACGGCCGGCTTCTTAGAGGGACTATGGCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11537:1726#0/1 -CCATCTCCGTATTGTCTTCTACGTAGACAATGTGCCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11709:1733#0/1 -CGAGGCGCTGTCTACGAGTCGGGTTGTTTGGGAATGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11851:1657#0/1 -TAATCAAGATCGAAAGTTGGGGGCTCGAAGACGATCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11822:1687#0/1 -TTGACGGCAACGTTAGGGAGTCCGGAGACGTCGGCGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11950:1691#0/1 -TTATGTTTACAGCTCTCCTCCTCCTCCGGTGAAGTCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11752:1704#0/1 -TGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11895:1708#0/1 -TTTATGAAAGACGAACAACTGCGAAAGCATTTGCCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:11756:1739#0/1 -TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12136:1709#0/1 -ATGCGAAAAGTGTAAAGGTGGGAAGATCGGAATTGCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12070:1715#0/1 -ACGAGCAGCTCCCAACCACAGACTACTGAATTAATCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12204:1724#0/1 -GAAAATTTTCCCCATTAAACAAAAAAAAATCAAATCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12140:1746#0/1 -ACTACTCTCTCCACTAAACAAAAACACTAGAGTTAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12332:1664#0/1 -GCGAAAGCATTTGCCAAGGATGCTTTCATTAATCAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12455:1665#0/1 -ACAAGTCTTGTCTCTCGAGTGTTCTTCAAATGTTAGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12252:1728#0/1 -GGAACTCCATGCGAATATGAAGCGCATGGATACAAGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12315:1747#0/1 
-TGGACCGGTAATTTCATTACATCGCCGGACGGCCGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12640:1665#0/1 -TCTCTTCTACAGTAAACAAAAAATGGCAATGAATGGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12666:1668#0/1 -TTATTCTGCACTTGGAAGAAGAACTAGAAAAAGGAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12735:1728#0/1 -ATCCCTTCACGGCCGGCTTCTTAGAGGGACTATGGCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12751:1677#0/1 -TCCTCCTGTTTACAAGTCCCCACCACCACCGGTTAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12821:1679#0/1 -TCTTCTCCGGTGATTTACTTACTTAACAATCATGGCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12935:1691#0/1 -ACTGCCTTCGGATTTGATTTGGTTCGTGGCACCAAGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:12996:1719#0/1 -TAATCTCTCTGTTTAATCTTATGATCTGCTGTTTTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13223:1661#0/1 -GTTGATGTGTTTATTCCCAGAGATCGAAGGACTGGTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13442:1665#0/1 -TTTAACAGCCTGCCCACCCTGGAAACGGCTCAGCCGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13331:1684#0/1 -GGGGGTCGCAGTGACCAGGCCCGGGCGACTGTTTACC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13451:1685#0/1 -TGCTCAAATTTCTTCTTTAGAAGATTAAAAATCTTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13309:1690#0/1 -TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13312:1742#0/1 -AAAACGATGCCGACCAGGGATCAGCGGATGTTGCTTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13704:1696#0/1 -GACTCGGAGCAGAGATTTAGGGTCTGTAATTTGTATA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13563:1703#0/1 -TATAGTCAGAGGTGAAATTCTTGGATTTATGAAAGAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13735:1728#0/1 -AACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13899:1667#0/1 -CGTTATTTTACTTACTCCGTGAATCGGAGGCGGGGTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13836:1707#0/1 -AACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13886:1718#0/1 -GAACAGAAAATAGAAAGAAGTAACAAAACCAAAGCAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13866:1724#0/1 -TCAATGAGCCATGGGTTTTCTCGCACGCTGGCTATGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:13943:1728#0/1 
-TCGAAGACGATCAGATACCGTCCTAGTCTCAACCATA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:14097:1712#0/1 -CCCTCGACCTATTCTCAAACTTTAAATAGGTAGGACG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:14116:1729#0/1 -GTTCTCACGTTCGAAGACCATTTCTTGTTCTTTGGAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:14699:1669#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:14594:1718#0/1 -AATTTCCTCATGTTGAGAGGTACTTCTGGACTGTGGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:14743:1729#0/1 -AACTCACCTGCCGAATCAACTAGCCCCGAAAATGGAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:14510:1734#0/1 -TTCACCCACCGCAGCTTCACCACCGGCACCTCCGACG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:14821:1705#0/1 -AACTGGCTAACACGTATTGGGTTGAGTATCTCTCTAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:14892:1717#0/1 -CTTTCGGATATTCCACCAGTCTCTCGCAATCTTCGCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:14835:1743#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:15239:1702#0/1 -TCTGACGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:15059:1717#0/1 -TGTGCTGGCGACGCATCATTCAAATTTCTGCCCTATC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:15152:1718#0/1 -GGGCAGGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:15444:1702#0/1 -GATATCTATTTATTCAATAACCCTTACAACACCGAAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:15407:1747#0/1 -TCGGATACGGGTCGGGCTTCTTAGCTGTTTGAAGAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:15681:1670#0/1 -AATTGCCACAACATGGGCGTTCTTCTTAGCAAGAATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:15630:1695#0/1 -TTATTAGATAAAAGGTCGACGCGGGCTCTGCCCGGTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:15506:1715#0/1 -TTTTTCATTAATCAAGAACGAAAGTTGGGGGCTCGAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:15976:1688#0/1 -ATCATCCATCACATCTCCTCTTGCAAACCAACGTAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:15940:1745#0/1 -AACAAGGTAGCCGTACTGGAAGGTGCGGCTGGATCAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16043:1680#0/1 -ACGTATGTGGCAAAATACGGGGATGACTTGTGGCTAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16175:1683#0/1 
-ATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16074:1695#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16238:1700#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16229:1727#0/1 -TCGAAGACGATCAGATACCGTCCTAGTCTCAACCATA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16025:1727#0/1 -CCGGGAAGGACGCACCTCTGGTGTACCAGTTATCGTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16429:1678#0/1 -ACGGATCGCATGGCCTCTGTGCTGGCGACGCATCATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16255:1695#0/1 -CTAAGAAAGTTGATCCACCGCCGGTGCCAGTCCACAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16494:1739#0/1 -AGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16656:1687#0/1 -TTAAATCAGTTATAGTTTGTTTGATGGTAACTACTAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16685:1715#0/1 -TAAAACGTCGTGGACTTTTTGAGTCTGACGCTGCATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16885:1690#0/1 -CTCAGGATCGGAAGAGCACACGTCTGAACTCCAGTCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16994:1709#0/1 -ATAACCGTAGTAATTCTAGAGCTAATACGTGCAACAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16768:1715#0/1 -TCGAAAGTTGGGGGCTCGAAGACGATCAGATACCGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:16899:1742#0/1 -GGTAAACTTCGAGCCTGTCCGACCCAGAAGGCACAAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:17201:1693#0/1 -TCTTTGGATAACAATATCCCAAACTGAAAATGGCTAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:17179:1704#0/1 -TTAAGTCCTCCGCTGCCTTCCCAGCCACCCGCAAGGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:17158:1711#0/1 -ACTAATGTAAAGGAAGCCTGTGCTTGGCTTGGATATA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:17051:1725#0/1 -ATAACGGTCCTAAGGTAGCGAAATTCCTTGTCGGGTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:17448:1685#0/1 -ACAATGACTGGGCCTCCACCTGCCATGGTGATGCCTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:17551:1710#0/1 -GGTTTGTCTTCAAAATCGTCAGAAGAAGAAGAAGAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:17662:1746#0/1 -GCAACACGGGGAAACTTACCAGGTCCAGACATAGTAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:17823:1706#0/1 
-TCCCCCGGTTGGATTGAAGGGTTGAAAAAATTAGACA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:17951:1723#0/1 -TGATCGGAGGATGTTGCGACGGAGCCGTCCTTTGACC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18174:1676#0/1 -ATTAAATCCTAAAATCCATTATTGATTGAATCTTCGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18241:1694#0/1 -CCAAATCTAATAAATCTAAGTGTAGTTTTCGGTGTAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18095:1727#0/1 -ACAAGCAACGGCGGAAGAGTTAACTGCATGCAGGTGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18074:1746#0/1 -ACCACCAAATCGCCGCCATGTTTAAACAAGCTTCTCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18318:1679#0/1 -GAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18410:1680#0/1 -GCAAGCCTACGCTCTGGATACATTAGCATGGGATAAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18290:1681#0/1 -TCAGGCCTTGGAGGACCGAACCCACGTATGTGGCAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18280:1722#0/1 -GAGTTCGATCCTGGCTCAGGATGAACGCTGGCGGCAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18429:1742#0/1 -TAGACTACGGATGGGACACCGCCGGACTTTCAGCTGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18675:1682#0/1 -TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18535:1684#0/1 -CCTTTGTACACACCGCCCGTCGCTCCTACCGATTGAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18657:1722#0/1 -GAGAAGATAAAGAGATAAAGGAAAGACTAACGTTAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18618:1729#0/1 -TGAACACACACAAACACACACACACACAGCCTTTTTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:18823:1701#0/1 -ACCTGACCCAGATAGCGAGAAGTTTCATGGATAAGGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:19063:1699#0/1 -ACGAAAGTTGGGGGCTCGAAGACGATCAGATACCGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:19104:1705#0/1 -AAAAACGACTCTCGGCAACGGATATCTCGGCTCTCGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:19019:1718#0/1 -AGACGATCAGATACCGTCCTGGTCTCAACCATAAACG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:19433:1728#0/1 -AAATAGCGTATATTTAAGTTGTTGCAGTTAAAAAGCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:19355:1731#0/1 -AATCAAGAACGAAAGTTGGGGGCTCGAAGACGATCAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:19500:1683#0/1 
-TTGTAACACGGACCAAGGAGTCTGACATGTGTGCGAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:19657:1698#0/1 -GGGATTGGCTTTGGGCTTTTCCTGCGCAGCTTAGGTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:19640:1749#0/1 -TTTAATTAATAACAATAAATGTTCTTTTTCAGTTTTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:19866:1690#0/1 -AAGCCCGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:19966:1707#0/1 -AAAATGCCAAGACGGACGATCAGGATACGAGGCTTAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20090:1682#0/1 -CAGGTCCCCGAGTGGCTCACACGATATGCTTCACGTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20183:1689#0/1 -GATATCGAGCGATGGATTTGGCAGAACTGTGGGCGAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20206:1747#0/1 -TCGAAAGTTGGGGGCTCGAAGACGATCAGATGCCGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20292:1695#0/1 -AGGAACGGAGACGGCAGGAACGATGAGTTCTATAGTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20306:1713#0/1 -CCGATGGTTGTGGACAACATGTATTATAAGAACATCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20402:1713#0/1 -TTACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20275:1726#0/1 -AACTGCGAATGGCTCATTAAATCAGTTATAGTTTGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20403:1737#0/1 -AAATAAGAAGACATATTTATCAACTTGATCAACTTGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20539:1702#0/1 -CCTTCACGGCCGGCTTCTTAGAGGGACTATGGCCGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20612:1731#0/1 -AGCGTCCTCAGCGACGGACCGGGCCTAAGTTCCCTGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20566:1745#0/1 -AGTTCGGTCTCTCTGCCGGAGTCGGATCATTAAACGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20889:1691#0/1 -CTTTCATTTCAGAGTCTTGGTGTTGTTTATGGTGATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20841:1709#0/1 -TTTGCTGGCATAATGGGAATGGGTTTTCCACCTTACA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:20980:1742#0/1 -TCCACTACTTTTAACGTTATTTTACTTACTCCGTGAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:21184:1708#0/1 -CGATCAGATACCGTCCTAGTCTCAACCATAAACGATG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:21173:1745#0/1 -TCGGTTGCTAATGGTTTGATCAATTTCCTCAACATAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:21427:1722#0/1 
-CGTTAACGAACGAGACCTCAGCCTGCTAACTAGCTAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1449:1766#0/1 -TCAACTGCGAAAGCATTTGCCAAGGATGTTTTCATTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1303:1793#0/1 -TAACCATAAACGATGCCGACCAGGGATCAGCGGATGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1430:1865#0/1 -TCTTCATCCTCGTCTACTGCACCGCCGGTATCTCTGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1450:1892#0/1 -AGCAACTGCCAAAGCACCCGCAACAAAATTATAAAGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1342:1935#0/1 -ATTGATGATGTCTTTACTTCTTCAAGAGGATCTACCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1406:1941#0/1 -AACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1676:1764#0/1 -TGGTGAGACAAAAACGACGATATTTTCCTCTTCCTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1512:1774#0/1 -AAAAACAATAAACGAAAACTGAGAGAGAGATTGAAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1677:1808#0/1 -ATTGGATCACTTTCAATGAGCCATGGGTTTTCTCGCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1579:1824#0/1 -TTTTGTGTTTGTCCACCACCTCCTCCATGTTATTCTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1744:1840#0/1 -GGGTGAGAGCCCCGTTGTGCCCGGACCCTGTCGCACC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1579:1852#0/1 -AGAAGAAGAAGAAGAAAAAGTGGAGCAAGCTTCGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1550:1869#0/1 -AACTCTGTGCCAGCAGCCGCGGTAATACAGAGGATGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1565:1898#0/1 -AGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1738:1918#0/1 -ACATTCCTCACCAAACCCTCTCCAAAACACACCCACA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1547:1922#0/1 -TCGAAAGTTGGGGGCTCGAAGACGATCAGATACCGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1732:1964#0/1 -TCTCGCGCTTGTACGGCTTTGGCTCGGATTCGTCCGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1654:1991#0/1 -GATTATATAAGGGAATGTTCAGTTCCAGTGACTGAGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1518:1992#0/1 -GGTGGAGGTTTACAAACACCACCAATCTTCTCTCTTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1865:1796#0/1 -GATTCATCCCAAAACATTACAAAACGTTACAATGGCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1886:1815#0/1 
-GGGCGTAAAGCGTCTGTAGGTGGCTTTTTAAGTCCGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1855:1840#0/1 -TGGTATCGGTGGACTCGGCGGTGCAGGTGGGCTAGGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1960:1855#0/1 -ACCTCACTGCCGCCGATTAGACTCCGCCGGATGCAAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1808:1879#0/1 -TTACCATAAACGATGCCGACCAGGGATCAGCGGATGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1869:1890#0/1 -TGCTTCTTGGGTATTTAGGTTTGACACAGCTTCACAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1898:1925#0/1 -TCCCATGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:1765:1950#0/1 -AACTCATATCAACCTTCGCCGGAAATAATGGCTTTCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2096:1773#0/1 -ATAGCACCGATAACAATCTACTCTCTTTAAAAGAAAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2186:1774#0/1 -TTGAGAAAATAAACGAGGAGGTGGCTCATCCTGAGAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2019:1774#0/1 -AAGACGATCAGATACCGTCCTAGTCTCAACCATAAAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2236:1797#0/1 -GTGTAGTCTGGAGAAGCGTCCTCAGCGACGGACCGGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2218:1825#0/1 -ACCTATCTCACTCTAAAATCTCTCTCTGCCAATCTCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2067:1830#0/1 -ACATGTCTGTGAAGATGCGGACTACCTGCACCTGGAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2183:1833#0/1 -AGGGCGCGAGCCCGGGCGGAGCGGCCGTCGGTGCAGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2095:1843#0/1 -GACACAACACACCTCAAGCTTTATAACTTCTAAAACA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2184:1923#0/1 -AAGAGTCGGGGGAAACCCGTCTGATAGCGCTTAAGCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2086:1933#0/1 -AAAAACGACTCTCGGCAACGGATATCTCGGCTCTCGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2134:1944#0/1 -AGCGTCCTCAGCGACGGACCGGGCCTAAGTTCCCTGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2220:1966#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2066:1971#0/1 -TGAAGCATTTTCCAAAGAGAAAGAGAGAGAAATGGGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2239:1991#0/1 -ATTATCCATTGGAGGGCAAGTCTGGTGCCAGCAGCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2113:1996#0/1 
-TTTGGTGTGCATTGGTCGGCTTGTCCCTTCGGTCGGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2369:1755#0/1 -TGATCCTTTCGTCTTTTTCTGACTCTTCAATCTCTCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2281:1791#0/1 -TTAATTCCGGAACCGGGACGTGGCGGTTGACGGCAAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2431:1837#0/1 -AAAATTTCATCGTGATGGGGATAGATCATTGCAATTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2272:1843#0/1 -GGGGATCCGGTTAAAATTCCGGAACCGGGACGTGGCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2316:1843#0/1 -TGGCTTGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2451:1850#0/1 -TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2264:1872#0/1 -ATGATAACTCGACGGATCGCATGGCCTCTGTGCTGGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2443:1872#0/1 -ACAGGTCTGTGATGCCCTTAGATGTTCTGGGTCGCAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2297:1890#0/1 -ATAACATCATAGGATTTCGATCCTATTGTGTTGGCCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2472:1986#0/1 -ACTACCACTCTCCACCTCCTCCGGCGAAGTCCCCACC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2564:1768#0/1 -GGGGCCTGATAGGCGGTGGTTTACCCTGTGGCGGATG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2674:1786#0/1 -TAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2648:1802#0/1 -GCGATAATACAGAGGATGCAAGCGTTATCCGGAATGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2691:1831#0/1 -CAGTATAATCAATCAGAAAACAAGTAGAAACTTTAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2560:1839#0/1 -TCGAAGACGATCAGATACCGTCCTAGTCTCGACCATA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2612:1876#0/1 -TCTTGGGCCTTTGCCACCAACTTTGTTCCCGGAAAGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2503:1919#0/1 -TCAGACGAGGAAAGGCTTACGGTGGATACCTAGGCAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2640:1953#0/1 -CACCGGGAGAAAATCCTCCTCCGCTGTCGTGAGAGCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2553:1969#0/1 -GATCATCACCTTCCCCACTAATACTCTATAGTTTGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2669:1987#0/1 -GGATCGTGAGACTCCGATGGTTGTGGACAACATGTAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2782:1800#0/1 
-GACATTTTCTGTTTCCGTCTACAAGAACCACTTTGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2957:1811#0/1 -ATTAATTCACATTTAAACACTTCTCTGCATATATTTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2990:1818#0/1 -TATTTTACTTACTCCGTGAATCGGAGGCGGGGTACAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2806:1852#0/1 -TGAAAATAAGCGTAGATCCGGAGATTCCCGAATAGGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2899:1856#0/1 -ACTGATGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2903:1882#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2913:1931#0/1 -TTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2816:1932#0/1 -GCATCAGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2795:1958#0/1 -TCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:2993:1984#0/1 -GACGATCAGATACCGTCCTAGTCTCAACCATAAACGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3163:1754#0/1 -AGGCAAGAGACAACCTGGCGAACTGAAACATCTTAGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3082:1793#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3054:1825#0/1 -TAGATGTTGAGACTCTAATCCCTAACCACAATGACTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3100:1835#0/1 -CTATCTTAAAACTTCTTACCTAAAATAGAAATTTGAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3199:1865#0/1 -TTTCTTAAAAATTGGATTTTGTGTTGGGTTTTTCTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3032:1907#0/1 -AGAGAGAAGAAGTAGGCAGACAAAGAAGAAGAAGAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3232:1919#0/1 -ATCACAAGCAAACAAGAGAAAACATTTTATTGTTATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3075:1937#0/1 -ACAGACTGTGAAACTGCGAATGGCTCATTAAATCAGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3005:1941#0/1 -TTTTAAGTCCGCCGTCAAATCCCAGGGCTCAACCCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3026:1990#0/1 -AAGAAAGAGATTCCCCCGCCGGTTCCGGTTTACGATC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3131:1992#0/1 -GGCTCTCGCATCGATGAAGAACGTAGCGAAATGCGAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3319:1777#0/1 
-GCGACCCCAGGTCAGGCGGGATTACCCGCTGAGTTTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3337:1789#0/1 -GACGCGGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3416:1846#0/1 -AACAGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3292:1846#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3491:1888#0/1 -ATCTTTTCGAAGAGCGGAAGCTAAGGAGAGGCGAATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3266:1903#0/1 -TATAGAAATGGCCAAAGACGTGGAAGGACCTGAGGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3339:1904#0/1 -GTGAAGACACCAGAGACGCCTAGTTTGGTGGGAAAGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3435:1918#0/1 -AGCGTCCTCAGCGACGGACCGGGCCTAAGTTCCCTGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3478:1938#0/1 -CCGGAGAATAATATCCGATCTGCTAGTGCGGTTAATA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3381:1938#0/1 -ATCAGCGACTCTCCCACTCGCTCGTGTCGTCGAAGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3311:1972#0/1 -ACATTCATCCCAAAACATTACAAAACGTTACAATGGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3471:1996#0/1 -CCCATGTCCACCTAAATACAGTCCTCCTGTGGAGGTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3408:1998#0/1 -AACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3714:1760#0/1 -TGTGCTGGCGACGCATCATTCAAATTTCTGCCCTATC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3734:1790#0/1 -ATACAGCAGCTGAAGCTGTGTATCGGAAAGCTCAATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3699:1795#0/1 -ACAAAAGACAAGTTTTTAAACTGCAGAACCGCATTTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3651:1798#0/1 -TCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3557:1799#0/1 -TGATAGTGCTTAAGCGCGAACTTCGAAAGGGGATCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3531:1811#0/1 -TACAGACACACACGTGGCTCATCACCTGTTCTCGACA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3526:1856#0/1 -TCTTTGAAGAAATTAGAGTGCTCAAAGCAAGCCTACG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3693:1860#0/1 -AAAACAACTCTGCTTCACTCTCTATCTTTCTTAAGTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3616:1916#0/1 
-AGCTTGAAAATCGGACGTCTTCGGCGTTCGAATTGTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3599:1930#0/1 -AGACGATCAGATACCGTCCTAGTCTCAACCATAAACG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3620:1956#0/1 -GAATCTCTCTGTGTTTTTTCTATCTCTCTCTTTCTTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3596:1973#0/1 -TGTAAGAGCTAGGCAGCAGGGATTATGTGTACGCAAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3721:1974#0/1 -AAGCCTGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3507:1998#0/1 -ACAAGGTGCTGGTGCTGGAGGAGGATATGGAGGTGGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3756:1769#0/1 -ACGCCCTCGACCTATTCTCAAACTTTAAATAGGTAGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3901:1846#0/1 -TACAAGTCTCCTCCGCCACCAACTCCGACATATGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3892:1871#0/1 -ATCACCGCCTCCATATTCTTTCGCGTCTTTTGCTTCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3765:1925#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3842:1953#0/1 -TCGAGCATTTTTGACGCCAAGGCTGGAATTGCATTCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3758:1970#0/1 -AACCCCGACTTATGGAAGGGACGCATTTATTAGATAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3931:1972#0/1 -CTCCGTGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:3828:1991#0/1 -CCTTCGGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4152:1771#0/1 -TCCTGAGATTTTTTATATATTTTCTCCAGATCTGCTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4212:1780#0/1 -GACTCAACCAATTTCTTCTCAGGTAATACTCGTAAGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4130:1806#0/1 -TTGTGCTGGCGACGCATCATTCAAATTTCTGCCCTAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4183:1813#0/1 -AAGGCACGTGTCGTTGGCTAAGTCCGTTCGGCGGAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4010:1857#0/1 -ACTCTGCTTCACTCTCTATCTTTCTTAAGTAAACAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4206:1859#0/1 -TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4051:1895#0/1 -TCAAGCGTTATCCGGAATGATTGGGCGTAAAGCGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4226:1939#0/1 
-TGATCATCACTTTCACAATCTTCTTCATCGATTTCTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4381:1809#0/1 -GCAGCATCAGCAACAACAGAGCAGTCCTGGCTTTCTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4456:1814#0/1 -TTCATGGACGTTGATAAGATCTTTCCATTTAGCAGCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4311:1831#0/1 -AAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4464:1844#0/1 -TACGCTTGGGCCTTCGTCGCCAAGACTTCTCAAGTTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4254:1850#0/1 -AAAAGGAGGTAGGGGTGCAGAGACAGCCAGGAGGTTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4286:1883#0/1 -ATTTAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4465:1887#0/1 -AACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4329:1895#0/1 -CCGTTCGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4379:1906#0/1 -ACTACTCTCTCCACTAAACAAAAACACTAGAGTTAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4486:1907#0/1 -TAAGAGCCAAAGGTTGAGAATGTGACTCTTGGACCAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4456:1996#0/1 -GAGGATGCGAAAAGATACATCCGGCAACTTCCCAACT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4674:1782#0/1 -TTTATGACTGAACGCCTCTAAGTCAGAATCCGGGCTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4634:1791#0/1 -GAATCACTTCACTCTCTCTAATCAAAAAGCTTTTAAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4501:1806#0/1 -TCGAAAGTTGGGGGCTCGAAGACGATCAGATACCGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4629:1820#0/1 -TGATCGTTCTTATTGACCCTAGCCGCTACACACTTTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4590:1838#0/1 -ATTCATTTCAATCAATCTTCTTCTTCTTCTTCTTCTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4741:1847#0/1 -AACGACTCTCGGCAACGGATATCTCGGCTCTCGCATC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4708:1892#0/1 -TTGTGCTGGCGACGCATCATTCAAATTTCTGCCCTAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4508:1902#0/1 -TTAGCATGGGATAACATCATAGGATTTCGATCCTATT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4691:1903#0/1 -AGTGAAATACCACTACTTTTTACGTTATTTTACTTAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4648:1966#0/1 
-AAATTTCAAAATCAGATCCAACAAATCTTCTTCTTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4963:1798#0/1 -AGACGTCGGCGGGGGCCTCGGAAAGAGTTATCTTTTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4766:1882#0/1 -CTGTCGCACCACGAGGCGCTGTCTACGAGTCGGGTTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4860:1888#0/1 -ATACTCGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4947:1899#0/1 -CATCAATACTCCTGTGAGAACAAAATGAAGCTTTCTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4982:1926#0/1 -AGACTCGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4879:1942#0/1 -TCGAGTCAGGTAATTGGAATGAGTACAATCTAAATCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:4914:1944#0/1 -GTGCAAAGGTTTCCTCGGGCCGGACGGAGATTGGCCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5091:1754#0/1 -TTTATGTTTCTCATTATTACTGCGGGAATTTCAATTA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5145:1756#0/1 -TATCGGTAGGGGAGCGTTCCGCCTTAGGGGGAAGCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5015:1781#0/1 -TTTTCATTAATCAAGAACGAAAGTTGGGGGCTCGAAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5166:1833#0/1 -TTTATGAAAGACGAACAACTGCGAAAGCATTTGCCAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5035:1836#0/1 -TGGCGACGCATCATTCAAATTTCTGCCCTATCAACTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5195:1862#0/1 -TTCACCCATTTCTTGGCTTACAACAACAAATCTTAAA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5062:1871#0/1 -TTAACTCTGTGCCAGCAGCCGCGGTAATACAGAGGAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5235:1878#0/1 -ACGGAAATGTCTTCATGGGTTCTTCCGAACATGTTCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5231:1897#0/1 -GGAACGAACACACCACCTTCTCTCCAATCTGGATCTG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5168:1901#0/1 -ACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5220:1915#0/1 -CCACCTCCGGTTCCGGTTTACAAGCCCCCGCCAAAGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5013:1950#0/1 -ACTTTCAATGAGCCATGGGTTTTCTCGCACGCTGGCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5175:1985#0/1 -CGTGAAATACCACTACTTTTAACGTTATTTTACTTAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5145:1985#0/1 
-ATTTAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5453:1770#0/1 -CATCAAAACCCAGACGCTGTATGGTTATGGGGAATGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5412:1781#0/1 -ATGTCGGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5412:1816#0/1 -TAGGACTCCGCTGGCACCTTATGAGAAATCAAAGTTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5496:1822#0/1 -AAAAACCTAAAACAAAAAAAATCTCTTTCCTTCTTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5346:1823#0/1 -AAGCCACCACCAAAGGTGGAGCTTCCACCGCCTATTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5333:1831#0/1 -TCGAGTCTGGTAATTGGAATGAGTACAATCTAAATCC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5305:1833#0/1 -AGAACGAAAGTTGGGGGCTCGAAGACGATCAGATACC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5371:1867#0/1 -GTAGCGTCCTCAGCAACGGACCGGGCCTAAGTTCCCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5374:1893#0/1 -ATGTTTTCATTAATCAAGAACGAAAGTTGGGGGCTCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5377:1943#0/1 -TGTTCGGGAAACATTGACGACAAAGGAAAGTTTGGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5313:1973#0/1 -TGTATACAAGTCTCCTCCGCCACCAACTCCGACATAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5620:1756#0/1 -AAAAACTTTCTCTCAATTCTCTCTACCGTGATCAAGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5716:1779#0/1 -TCCCTTCACGGCCGGCTTCTTAGAGGGACTATGGCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5667:1857#0/1 -GTATTCAACGAGTTCACACCTTGGCCGACAGGCCCGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5654:1887#0/1 -GTAACGGGTGACGGAGAATTAGGGTTCGATTCCGGAG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5636:1908#0/1 -TTCTCGCGCTTGTACGGCTTTGGCTCGGATTCGTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5715:1927#0/1 -CCGTCGGGGCAAGAGCCAGGCCTCGATGAGTAGGAGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5610:1936#0/1 -GAAGAAGCAATGACGGTATCTGGGGAATAAGCATCGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5832:1784#0/1 -GCCCGGATCGGAAGAGCACACGTCTGAACTCCAGTCA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5917:1794#0/1 -AGTCGCGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5769:1883#0/1 
-AGCAAAGTTTTATGTAATCAAATCGTACAGTGAAGAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5796:1889#0/1 -TTGTGCTGGCGACGCATCATTCAAATTTCTGCCCTAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5992:1905#0/1 -ATGTGTGTATTAATTTATCTTCTTGTTTTAAAGAGAC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5885:1923#0/1 -AAGAAGAGCCAATGGCGATGAAGACATCACATGTTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5976:1937#0/1 -AGCGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:5957:1978#0/1 -TTAGTTGAACCTTGGGATGGGTCGGCCGGTCCGCCTT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6197:1781#0/1 -ACTTAGGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6180:1789#0/1 -ATTTTGGCTGGTGCTGAATACGGTAGTGGAAGTTCTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6038:1789#0/1 -TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6177:1825#0/1 -TTGATCCCGAGACTGAAGCTATGACCAGGAGAATTGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6159:1830#0/1 -CGGGCCGATCGGAAGAGCACACGTCTGAACTCCAGTC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6151:1878#0/1 -ATACGGTGTATGAATCCGAATTACACAGAGTTCAAGT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6123:1878#0/1 -AGCGCTAACTTCGAAAGGGGATCCGGTTAAAATTCCG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6196:1879#0/1 -ATTTCTGCCCTATCAACTTTCGATGGTAGGATAGTGG ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6237:1895#0/1 -AAGATCCCAGACGAAATGGCTCAGAAAGTGGTGCTGA ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6023:1896#0/1 -ACAACCGCTGAATATTTGGCTTATGAATGTGGAAAGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6123:1904#0/1 -ATGATAACTCGACGGATCGCATGGCCTCTGTGCTGGC ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6125:1922#0/1 -ATGGATCGTTGCACGTCGTCGTTTTTGCTTCCCACAT ->DGM97JN1_120925_0255_AD166MACXX:4:1101:6184:1926#0/1 -GATCATCAAAAAACACCTCAAAGAATTATTCATTCAG
#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""Copy the reads whose ids are listed in a text file to a FASTA file.

Usage: seq_track.py <unmap_file> <reads_file> <result_file> <format>

unmap_file   tab-separated text file; the first column of every line is
             used as a read id.
reads_file   sequence file handed to Bio.SeqIO.parse.
result_file  output path; receives one ">id" line and one sequence line
             per selected read.
format       format name handed to Bio.SeqIO.parse.
"""

import sys
from read_file import *
from Bio import SeqIO

unmap_file = sys.argv[1]
reads_file = sys.argv[2]
result_file = sys.argv[3]
tp = sys.argv[4]

unmap = read_t_file(unmap_file)

# Only the first column is needed; a set keeps the membership test cheap.
um = set(row[0] for row in unmap)

# open() replaces the Python-2-only file() builtin, and the with-block closes
# the output even when parsing the reads fails part-way through.
with open(result_file, 'w') as h:
    for read in SeqIO.parse(reads_file, tp):
        if read.id in um:
            h.write('>')
            h.write(read.id)
            h.write('\n')
            # str(seq) works on old and new Biopython alike, unlike
            # Seq.tostring().
            h.write(str(read.seq))
            h.write('\n')
#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""Cut a fixed number of bases off one end of every FASTA record.

Usage: truncate.py <fasta_file> <shift> <result_file> <length> <t_end>

fasta_file   input FASTA file.
shift        number of bases to remove (integer).
result_file  output FASTA path.
length       minimum number of bases that must remain; shorter records are
             not written at all.
t_end        'three_end' removes the bases from the end of the sequence,
             'five_end' removes them from the start.  Any other value
             writes the header followed by an empty sequence line.
"""

import sys
from Bio import SeqIO

fasta_file = sys.argv[1]
shift_in = sys.argv[2]
result_file = sys.argv[3]
length = sys.argv[4]
t_end = sys.argv[5]

shift = int(shift_in)
# Converted once here instead of once per record.
min_length = int(length)

# Both handles are closed by the with-block, including on errors; open()
# replaces the Python-2-only file() builtin.
with open(fasta_file) as fasta_handle, open(result_file, 'w') as h:
    for seq in SeqIO.parse(fasta_handle, 'fasta'):
        nuc = seq.id
        # str(seq) works on old and new Biopython alike, unlike
        # Seq.tostring().
        sequence = str(seq.seq)
        if (len(sequence) - shift) >= min_length:
            h.write('>' + nuc)
            h.write('\n')
            if t_end == 'three_end':
                h.write(sequence[0:(len(sequence) - shift)])
            if t_end == 'five_end':
                h.write(sequence[shift:len(sequence)])
            h.write('\n')
#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""List the first column of every record whose second column is non-zero.

Usage: unmap.py <map_file> <result_file>

map_file     tab-separated text file.  Lines with four or fewer columns are
             ignored; on the remaining lines the second column must be an
             integer.
             NOTE(review): the column layout looks like SAM (name, flag,
             ...) -- confirm against the caller.
result_file  output path; receives one first-column value per line.
"""

import sys
from read_file import *
from Bio import SeqIO

map_file = sys.argv[1]
result_file = sys.argv[2]

# The with-block closes both files even if a malformed line raises, and
# open() replaces the Python-2-only file() builtin.  Iterating the handle
# avoids loading the whole input into memory.
with open(map_file) as f, open(result_file, 'w') as h:
    for aline in f:
        tl = aline.strip().split('\t')
        if len(tl) > 4 and int(tl[1].strip()) != 0:
            h.write(tl[0].strip())
            h.write('\n')
#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""Count how many alignment records report each reference position.

Usage: get_read.py <fasta_file> <map_file> <result_file>

The output of ``samtools view -F 0xfff <map_file>`` is reduced to its third
and fourth columns and stored as map_info.txt in the current working
directory.  For every record of fasta_file the script then writes the record
id on one line, one tab-terminated count per sequence position on the next
line, and an empty line.
"""

import sys
from Bio import SeqIO
import os
import subprocess
from read_file import *
import random
import string

fasta_file = sys.argv[1]
map_file = sys.argv[2]
result_file = sys.argv[3]

syspathrs = os.getcwd()
# os.getcwd() has no trailing separator, so plain string concatenation would
# create "<cwd>map_info.txt" beside the working directory rather than a file
# inside it.
map_info_file = os.path.join(syspathrs, "map_info.txt")

# Same pipeline as "samtools view -F 0xfff <map_file> | cut -f 3,4", but
# built from argument lists so that a path containing spaces or shell
# metacharacters is passed through unchanged.  As before, the exit status of
# the tools is not checked; a missing executable now raises OSError instead
# of silently producing an empty map_info.txt.
with open(map_info_file, 'w') as map_info:
    view = subprocess.Popen(["samtools", "view", "-F", "0xfff", map_file],
                            stdout=subprocess.PIPE)
    cut = subprocess.Popen(["cut", "-f", "3,4"], stdin=view.stdout,
                           stdout=map_info)
    # Drop our copy of the pipe so samtools sees a closed pipe if cut exits.
    view.stdout.close()
    cut.wait()
    view.wait()

# Sequence length per record id.
length_seq = {}
with open(fasta_file) as fasta_handle:
    for seq in SeqIO.parse(fasta_handle, 'fasta'):
        length_seq[seq.id] = len(seq.seq)

# Reported positions grouped by reference name.  The dict itself answers
# "seen before?" in constant time, so no separate name list is scanned.
mapping = {}
with open(map_info_file) as f:
    for aline in f:
        tl = aline.strip().split('\t')
        if len(tl) < 2:
            continue  # blank or incomplete line: nothing to count
        mapping.setdefault(tl[0].strip(), []).append(tl[1].strip())

# One counter per position of every reference record; positions in
# map_info.txt are treated as 1-based.
distribution = {}
for transcript in length_seq:
    counts = [0] * length_seq[transcript]
    for index in mapping.get(transcript, []):
        counts[int(index) - 1] += 1
    distribution[transcript] = counts

with open(result_file, 'w') as h:
    for transcript in length_seq:
        h.write(transcript)
        h.write('\n')
        # Every count, including the last one, is followed by a tab.
        h.write(''.join(str(count) + '\t'
                        for count in distribution[transcript]))
        h.write('\n')
        h.write('\n')
--- a/get_reads/get_read.xml Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,44 +0,0 @@ -<tool id="get_read_pipeline" name="Get RT Stop Counts" version="1.0"> - <description></description> - <command interpreter="python">get_read.py $lib_file $map_file $output </command> - <requirements> - <requirement type="package" version="1.61">biopython</requirement> - <requirement type="package" version="1.7.1">numpy</requirement> - <requirement type="package" version="0.1.18">samtools</requirement> - </requirements> - <inputs> - <param name="lib_file" type="data" format="fasta" label="Reference genome/transcriptome"/> - <param name="map_file" type="data" format="bam" label="Mapped file"/> - </inputs> - <outputs> - <data name="output" format="txt"/> - </outputs> - <tests> - <test> - <param name="lib_file" value="test.bam" /> - <param name="map_file" value="com_rna.txt" /> - <output name="output" file="get_RT_stop_test.out" /> - </test> - </tests> - <help> - - -**TIPS**: - ------ - -**Input** - -* 1. A mapped (bam) file from Bowtie (or any other mapping program) -* 2. Reference library sequences (fasta) used to map the reads to - ------ - -**Output**: - -A text file with reverse transcription stop counts mapped to each nucleotide (RTSC file) - - - - </help> -</tool>
#!/usr/bin/env python
# -*- coding: utf-8 -*-

import sys


def read_t_file(in_file):
    """Read a tab-separated text file into a list of rows.

    Every line is stripped of surrounding whitespace and split on tab
    characters; each resulting field is stripped again.  A blank line
    therefore yields the single-element row [''].

    in_file -- path of the file to read.

    Returns a list holding one list of field strings per input line.
    """
    # The with-block closes the file even if reading raises.
    with open(in_file) as f:
        return [[field.strip() for field in aline.strip().split('\t')]
                for aline in f]
--- a/predict/id_list_test.txt Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,1 +0,0 @@ -AT3G05880.1
--- a/predict/log.txt Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,3 +0,0 @@ -a /Users/yintang/Project/galaxy/galaxy-dist/tools/pipeline_programs/predict/output_qicbsuLr/AT3G05880.1.ct -a /Users/yintang/Project/galaxy/galaxy-dist/tools/pipeline_programs/predict/output_qicbsuLr/AT3G05880.1.ps -a /Users/yintang/Project/galaxy/galaxy-dist/tools/pipeline_programs/predict/output_qicbsuLr/AT3G05880.1.tif
#parse reactivity file into a dictionary

import sys


def parse_dist(in_file):
    """Parse a file of named value lines into names and a value mapping.

    The file is read line by line; surrounding whitespace is stripped and
    the line is split on tab characters:

    * a line with a single field is a name, unless it contains the text
      'coverage', in which case it is ignored;
    * a line with several fields holds the values of the most recent name
      (a later value line for the same name replaces the earlier one);
    * blank lines are skipped, so they are not recorded as an empty name.

    in_file -- path of the file to read.

    Returns a two-element list [names, distribution]: names is the list of
    name lines in file order, distribution maps a name to its list of value
    strings.

    Raises ValueError if a value line appears before any name line.
    """
    names = []
    distribution = {}
    current_name = None
    # The with-block closes the file even if parsing raises.
    with open(in_file) as f:
        for aline in f:
            line = aline.strip()
            if not line:
                continue
            dist = line.split('\t')
            if len(dist) == 1:
                if 'coverage' not in line:
                    names.append(line)
                    current_name = line
            else:
                if current_name is None:
                    raise ValueError(
                        "values found before any name line in %s" % in_file)
                distribution[current_name] = [value.strip() for value in dist]
    return [names, distribution]
#RNA structure prediction & Output and illustrate reactivities
"""Predict a structure for every listed RNA id and archive the results.

Usage: predict_RNAs.py <id_file> <seq_file> <react_file|None> <output_file>

id_file      tab-separated text file; the first column of each line is an id.
seq_file     FASTA file with the sequences, looked up by record id.
react_file   file parsed with parse_dist, or the literal string 'None' to
             predict without reactivity data.
output_file  path of the uncompressed tar archive that receives every file
             created in ./output_files.

For each id the external programs ``Fold`` and ``draw`` are run
(NOTE(review): presumably the RNAstructure command-line tools -- confirm).
"""

import sys
import shlex
import subprocess
import tarfile
from parse_dis_pac import *
from read_file import *
from Bio import SeqIO
import os
from rtts_plot import *
import random
import string


id_file = sys.argv[1]
seq_file = sys.argv[2]
output_file = sys.argv[4]


flag = False
if sys.argv[3] != 'None':  # input reactivity file if provided
    react_file = sys.argv[3]
    # parse_dist returns [names, values-by-name]; only the mapping is used.
    react = parse_dist(react_file)[1]
    flag = True

syspath = os.getcwd()

ids = read_t_file(id_file)

seqs = {}
for seq in SeqIO.parse(seq_file, 'fasta'):
    # str(seq) works on old and new Biopython alike, unlike Seq.tostring().
    seqs[seq.id] = str(seq.seq)

if len(ids) > 100:  # limit on the number of sequences to be predicted
    print("Number of sequences exceeds limitation!")
    # NOTE(review): exits with status 0 although nothing was produced.
    sys.exit(0)


# predict RNA structures
output_directory = os.path.join(syspath, "output_files")
if not os.path.exists(output_directory):
    os.makedirs(output_directory)

temp_path = os.path.join(syspath, "temp.txt")
constraint_path = os.path.join(syspath, "constraint.txt")

for row in ids:
    id_s = row[0]
    print(id_s)
    if id_s not in seqs:
        print(id_s+" not in the data of sequences!")
        continue

    # Put the RNA sequence into a single-record FASTA file for Fold.
    with open(temp_path, 'w') as fh:
        fh.write('>'+id_s)
        fh.write('\n')
        fh.write(seqs[id_s])

    ct_path = os.path.join(output_directory, '%s.ct' % id_s)
    ps_path = os.path.join(output_directory, '%s.ps' % id_s)

    # Commands are passed as argument lists rather than formatted strings
    # run through shlex.split, so ids and paths containing spaces or quotes
    # reach the programs unchanged.
    if not flag:
        subprocess.call(['Fold', temp_path, ct_path])
    elif id_s in react:
        # make a plot of the distribution of the reactivities of this RNA
        make_plot(react[id_s], id_s, output_directory)
        # One "<1-based position><TAB><value>" line per value that is not NA.
        with open(constraint_path, 'w') as fh:
            for j, value in enumerate(react[id_s]):
                if value != 'NA':
                    fh.write(str(j+1))
                    fh.write('\t')
                    fh.write(str(value))
                    fh.write('\n')
        subprocess.call(['Fold', temp_path, '-sh', constraint_path, ct_path])
    else:
        print(id_s+" not in the data of react!")
        # Fold was not run, so there is no .ct file for draw to read.
        continue

    subprocess.call(['draw', ct_path, ps_path])

# Collect everything from the output directory in one tar archive; the
# with-block closes the archive even if adding a file fails.
with tarfile.open(output_file, 'w:') as tarball:
    for filename in os.listdir(output_directory):
        filepath = os.path.join(output_directory, filename)
        print(filepath)
        tarball.add(filepath, arcname=filename)
    print(os.listdir(syspath))
    print(os.listdir(output_directory))
--- a/predict/predict_RNAs.xml Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,59 +0,0 @@ -<tool id="predict_pipeline" name="RNA Structure Prediction" version="1.0"> - <description></description> - <command interpreter="python">predict_RNAs.py $rna_list $reference_file $reactivity_file $output </command> - <requirements> - <requirement type="package" version="1.61">biopython</requirement> - <requirement type="package" version="1.7.1">numpy</requirement> - <requirement type="package" version="1.2.1">matplotlib</requirement> - </requirements> - <inputs> - <param name="rna_list" type="data" format="txt" label="List of RNA ids to predict"/> - <param name="reference_file" type="data" format="fasta" label="Reference genome/transcriptome"/> - <param name="reactivity_file" type="data" optional = "true" label="Reactivity file"/> - - </inputs> - <outputs> - <data name="output" format=".tgz"/> - </outputs> - <tests> - <test> - <param name="rna_list" value="id_list_test.txt" /> - <param name="reference_file" value="cdna.txt" /> - <param name="reactivity_file" value="mRNA_react_test2.txt" /> - <output name="output" file="structures.out" /> - </test> - </tests> - <help> - - -**TIPS**: - ------ - -**Input**: - -* 1. A file with transcript IDs (max. 20), one ID per line -* 2. Reference file (fasta) used to map the reads to -* [Optional]: -* 1. A reactivity file with structural reactivity for each nucleotide on the sequence provided - ------ - -**Output**: - -* 1. .ct files with predicted RNA structures [transcriptID.ct] -* 2. .ps files which depict the predicted RNA structures [transcriptID.ps] -* [Optional] -* 3. .tif files that show the distribution of the reactivity of each nucleotide on the transcripts of interest. [transcriptID.tif] -* 4. A .txt file that includes the reactivities of all the nucleotides on the transcripts of interest. 
[transcriptID.txt] - ------ - -**Attention** - -Make sure that none of the transcript IDs contains "|" or a space! - - - - </help> -</tool>
--- a/predict/rRNA.txt Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,8 +0,0 @@ ->25s rRNA 3375nts -GCGACCCCAGGTCAGGCGGGATTACCCGCTGAGTTTAAGCATATCAATAAGCGGAGGAAAAGAAACTAACAAGGATTCCCTTAGTAACGGCGAGCGAACCGGGAAGAGCCCAGCTTGAAAATCGGACGTCTTCGGCGTTCGAATTGTAGTCTGGAGAAGCGTCCTCAGCGACGGACCGGGCCTAAGTTCCCTGGAAAGGGGCGCCAGAGAGGGTGAGAGCCCGTCGTGCCCGGACCCTGTCGCACCACGAGGCGCTGTCTACGAGTCGGGTTGTTTGGGAATGCAGCCCCAATCGGGCGGTAAATTCCGTCCAAGGCTAAATACGGGCGAGAGACCGATAGCGAACAAGTACCGCGAGGTAAAGATGAAAAGGACTTTGAAAAGAGAGTCAAAGAGTGCTTGAAATTGTCGGGAGGGAAGCGGATGGGGGCCGGCGATGCGTCCTGGTCGGATGCGGAACGGAGCAATCCGGTCCGCCGATCGATTCGGGGCGTGGACCGACGCGGATTACGGTGGCGGCCTAAGCCCGGGCTTTTGATACGCTTGTGGAGACGTCGCTGCCGTGATCGTGGTCTGCAGCACGCGCCTAACGGCGTGCCTCGGCATCAGCGTGCTCCGGGCGTCGGCCTGTGGGCTCCCCATTCGACCCGTCTTGAAACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAACGGGTGAGTAAACCCGTAAGGCGCAAGGAAGCTGATTGGCGGGATCCTCGCGGGTGCACCGCCGACCGACCTTGATCTTCTGAGAAGGGTTCGAGTGTGAGCATGCCTGTCGGGACCCGAAAGATGGTGAACTATGCCTGAGCGGGGTAAAGCCAGAGGAAACTCTGGTGGAAGCCCGCAGCGATACTGACGTGCAAATCGTTCGTCTGACTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGAGCTCGGACGCGAGTTCTATCGGGTAAAGCCAATGATTAGAGGCATTGGGGGCGCAACGCCTCGACCTATTCTCAAACTTTAAATAGGTAGGACGTGTCGGCTGCTTTGTTGAGCCGTCACACGGAATCGAGAGCTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGGAAGCCGGGTTACGGTGCCCAACTGCGCGCTAACCTAGAACCCACAAAGGGTGTTGGTCGATTAAGACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTTAAGCGCGACCTATACCCGGCCGTCGGGGCAAGAGCCAGGCCTCGATGAGTAGGAGGGCGCGGCGGTCGCTGCAAAACCTAGGGCGCGAGGCGCGGAGCGGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGGCCGAAGAGGGGAAAGGTTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGAGTCGGGGGAAACCCGTCTGATAGCGCTTAAGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCGGAACCGGGACGTGGCGGTTGACGGCAACGTTAGGGAGTCCGGAGACGTCGGCGGGGGCCTCGGGAAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCCTGGAAACGGCTCAGCCGGAGGTAGGGTCCAGCGGCTGGAAGAGCACCGCACGTCGCGTGGTGTCCGGTGCGCCCCCGGGCGCCCTTGAAAATCCGGAGGACCGAGTGCCGCTCACGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGGTGAACAGCCT
CTGGTCGATGGAACAATGTAGGCAAGGGAAGTCGGCAAAATGGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGGCTGGGCTCGGGGGTCCCAGTTCCGAACCCGTCGGCTGTCAGCGGACTGCTCGAGCTGCTTCCGCGGCGAGAGCGGGTCGCCGGCTGCCGGCCGGGGGACGACTGGGAACGGCTCTCTCGGGAGCTTTCCCCGGGCGTCGAACAGTCAGCTCAGAACTGGTACGGACAAGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGTCCCTGCGGATGCTAACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTGTCTACTATCCAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGGATAAGTGGGAGCTTCGGCGCAAGTGAAATACCACTACTTTTAACGTTATTTTACTTACTCCGTGAATCGGAGGCCGGGGTACAACCCCTGTTTTTGGTCCCAAGGCTCGCTTCGGCGGGTCGATCCGGGCGGAGGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGCTCGTTTGATTCTGATTTTCAGTACGAATACGAACCGTGAAAGCGTGGCCTATCGATCCTTTAGACTTCGGAATTTGAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGCCCGCGTCGCGATAGTAATTCAACCTAGTACGAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTGCGCTGGATTATGACTGAACGCCTCTAAGTCAGAATCCGGGCTAGAAGCGACGCATGCGCCCGCCGCCCGATTGCCGACCCTCAGTAGGAGCTTAGGCTCCAAAGGCACGTGTCGTTGGCTAAGTCCGTTCGGCGGAACGGTCGTTCGGACCGCCTTGAATTATAATTACCACCGAGCGGCGGGTAGAATCCTTTGCAGACGACTTAAATACGCGACGGGGTATTGTAAGTGGCAGAGTGGCCTTGCTGCCACGATCCACTGAGATTCAGCCCTTTGTCGCTAAGATTCGA ->gi|20197903:2706-4513 Arabidopsis thaliana chromosome 2 BAC F23H14 genomic sequence, complete sequence 
-TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTGTAAGTATGAACGAATTCAGACTGTGAAACTGCGAATGGCTCATTAAATCAGTTATAGTTTGTTTGATGGTAACTACTACTCGGATAACCGTAGTAATTCTAGAGCTAATACGTGCAACAAACCCCGACTTATGGAAGGGACGCATTTATTAGATAAAAGGTCGACGCGGGCTCTGCCCGTTGCTCTGATGATTCATGATAACTCGACGGATCGCATGGCCTCTGTGCTGGCGACGCATCATTCAAATTTCTGCCCTATCAACTTTCGATGGTAGGATAGTGGCCTACCATGGTGGTAACGGGTGACGGAGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCTGACACGGGGAGGTAGTGACAATAAATAACAATACTGGGCTCTTTCGAGTCTGGTAATTGGAATGAGTACAATCTAAATCCCTTAACGAGGATCCATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTTAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAACCTTGGGATGGGTCGGCCGGTCCGCCTTTGGTGTGCATTGGTCGGCTTGTCCCTTCGGTCGGCGATACGCTCCTGGTCTTAATTGGCCGGGTCGTGCCTCCGGCGCTGTTACTTTGAAGAAATTAGAGTGCTCAAAGCAAGCCTACGCTCTGGATACATTAGCATGGGATAACATCATAGGATTTCGATCCTATTGTGTTGGCCTTCGGGATCGGAGTAATGATTAACAGGGACAGTCGGGGGCATTCGTATTTCATAGTCAGAGGTGAAATTCTTGGATTTATGAAAGACGAACAACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTGGGGGCTCGAAGACGATCAGATACCGTCCTAGTCTCAACCATAAACGATGCCGACCAGGGATCAGCGGATGTTGCTTATAGGACTCCGCTGGCACCTTATGAGAAATCAAAGTTTTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTTACCAGGTCCAGACATAGTAAGGATTGACAGACTGAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGTTAATGAACGAGACCTCAGCCTGCTAACTAGCTACGTGGAGGCATCCCTTCACGGCCGGCTTCTTAGAGGGACTATGGCCGTTTAGGCCAAGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGATGTATTCAACGAGTTCACACCTTGGCCGACAGGCCCGGGTAATCTTTGAAATTTCATCGTGATGGGGATAGATCATTGCAATTGTTGGTCTTCAACGAGGAATTCCTAGTAAGCGCGAGTCATCAGCTCGCGTTGACTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTCCTACCGATTGAATGATCCGGTGAAGTGTTCGGATCGCGGCGACGTGGGTGGTTCGCCGCCCGCGACGTCGCGAGAAGTCCACTAAACCTTATCATTTAGAGGAAGGAGAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTG ->Arabidopsis thaliana 1 -GGATGCGATCATACCAGCACTAATGCACCGGATCCCATCAGAACTCCGCAGTTAAGCGTGCTTGGGCGAGAGTAGTACTAGGATGGGTGACCTCCTGGGAAGTCCTCGTGTTGCATCCCTC ->gi|186498419|ref|NR_022453.1| 
Arabidopsis thaliana (AT2G01020) rRNA -AAAACGACTCTCGGCAACGGATATCTCGGCTCTCGCATCGATGAAGAACGTAGCGAAATGCGATACTTGGTGTGAATTGCAGAATCCCGTGAACCATCGAGTCTTTGAACGCAAGTTGCGCCCCAAGCCTTCTGGCCGAGGGCACGTCTGCCTGGGTGTCACAA \ No newline at end of file
#!/usr/bin/env python
# -*- coding: utf-8 -*-

import sys


def read_t_file(in_file):
    """Return the rows of a tab-separated text file as lists of strings.

    Each line has its surrounding whitespace removed and is split on tab
    characters, after which every field is stripped as well.  A blank line
    produces the row [''].

    in_file -- path of the file to read.

    Returns a list with one list of fields per line of the file.
    """
    result = []
    # The with-block guarantees the handle is closed, also on errors.
    with open(in_file) as f:
        for aline in f:
            fields = aline.strip().split('\t')
            result.append([field.strip() for field in fields])
    return result
#!/usr/bin/env python
#Make a plot of reactivity distribution

import sys
import os
import numpy as np
import matplotlib
from pylab import *
import math


#Convert the reactivities (Make NA to 0)
def convert_react(a):
    """Return the entries of a as floats, with the string 'NA' mapped to 0.0.

    a -- sequence of values accepted by float(), or the string 'NA'.
    """
    return [float(0) if value == 'NA' else float(value) for value in a]


#Make a plot of the distribution
def make_plot(ar, id_s, path):
    """Save a bar chart of the reactivities in ar as <path>/<id_s>.tif.

    ar   -- sequence of reactivity values; 'NA' entries are drawn as 0.
    id_s -- identifier used in the plot title and the file name.
    path -- directory that receives the image.

    The number of values, the tick interval and the tick positions are
    printed to standard output.  An empty ar raises ValueError, because the
    tick spacing is derived from math.log(len(ar), 10).
    """
    N = len(ar)
    a = convert_react(ar)
    w = 1
    ind = np.arange(N)

    # Tick spacing: a multiple of the power of ten one order of magnitude
    # below N, chosen so that about five intervals cover the axis.
    mag = int(math.log(N, 10)) - 1
    tail = 10**mag
    intervel = int(math.ceil(float(N)/tail/5))
    print(N)
    print(intervel)
    upmax = int(math.ceil(float(N)/intervel/tail)*intervel*tail) + 1
    ticks = np.arange(0, upmax, intervel*tail)
    print(ticks)

    # subplots() already creates the figure; a separate figure() call would
    # only leave an extra, empty figure behind on every call.
    fig, ax = subplots()
    try:
        ax.bar(ind+w, a, width=w, color='r', edgecolor='r')
        ax.set_ylabel('Structural Reactivity')
        ax.set_xlabel('Nucleotide Index')
        ax.set_xticks(ticks)
        ax.set_xticklabels(ticks)
        ax.set_title(id_s+" reactivity distribution")
        fig.savefig(os.path.join(path, id_s+'.tif'))
    finally:
        # Release the figure so repeated calls do not accumulate open ones.
        close(fig)
--- a/predict/test_reactivity.txt Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,2 +0,0 @@ -AT3G05880.1 -0.943887685769 0.421815158787 NA 1.01455360981 NA NA NA NA 0.503726666615 NA 0.562759466181 0.53286496306 NA 0.452307806554 NA NA NA NA 0.234006609126 NA 0.356521303582 0.3345952334 NA 0.938455477986 0.961629159648 0.58445845106 0.277563382428 NA NA NA 0.381285618597 0.510385809404 0.263300197836 0.351983737127 NA 0.478451311944 NA 0.0 NA NA 0.249061701962 NA 0.602014314955 0.768409570219 0.479108914417 0.609654847688 0.395147907741 NA NA 0.316409963987 NA NA 1.01642560569 0.178529288881 1.1258499175 NA 0.102264245055 NA 0.588862283199 0.675885983569 NA NA NA 0.0 NA NA NA NA 0.8152009763 NA 0.730574123452 NA NA 0.196012732449 NA NA 0.748188202713 NA 0.0 NA 0.925269643553 0.0 0.506395998703 NA 0.511028818599 0.354285255052 NA 1.01563235674 NA NA NA 0.602118316823 0.486534824365 NA 0.266635693932 0.176995791343 0.887089878761 0.654802870139 NA 0.24940376078 NA NA NA NA NA 0.835049477972 NA NA NA 0.230188979227 NA 0.145932219541 0.510982455489 NA 0.70545494854 NA NA NA NA NA NA NA NA 0.0 NA NA NA NA NA NA NA 0.0607994838688 NA NA NA NA NA NA NA 0.0 NA 0.510982455489 NA NA NA NA NA NA NA NA NA NA NA NA 0.805809423851 0.214474701586 NA 0.320112197187 NA 0.886851602907 0.0 NA NA NA NA NA NA 0.173824155265 NA 0.499351609605 NA NA 0.119452482914 0.0 NA NA NA NA 0.985352919102 NA 0.0 0.0 NA 0.925509063242 NA 0.54084940725 0.0 NA 0.622064968928 0.285526636999 0.373974554632 NA NA NA 0.0 NA NA NA 0.0 0.369187155673 NA 0.644843692277 0.0 0.0 0.0 0.0 0.155248951804 0.0 NA NA 0.0 NA NA NA 0.0 0.0 0.0464264694222 0.0 NA 0.0 NA 0.250790026642 NA 0.11120052998 0.0299680537584 NA 0.0723351276735 0.0 NA 0.069968383925 NA 0.394969636508 0.0 NA NA NA 0.270970925021 0.0436999866019 0.0 0.172881011784 NA 1.24794080936 NA NA NA NA 0.0 0.0 NA NA 0.241516034212 NA NA NA NA NA 0.19903265234 NA 0.289893769912 0.835049477972 NA 0.83678872047 NA 
0.769301566905 NA NA NA NA NA NA 0.486001309495 1.00671172955 NA NA 0.392970275151 NA NA 0.369187155673 0.0330308799953 NA 0.0 NA NA NA NA 0.322006332632 NA NA NA NA NA 1.10146992643 NA NA NA 0.602394928175 0.052285391313 NA 0.0 0.474447727012 NA 0.258266798648 NA NA NA NA NA NA 0.173824155265 NA NA NA NA NA 0.435796833817 0.341824194398 0.0 NA NA 0.971161850563 0.0 NA NA NA 0.594354216766 0.0 NA NA 0.0 0.0666024493389 NA 0.36331086056 0.0 NA 0.838839492047 0.078362328999 0.54084940725 NA NA NA NA NA NA NA NA NA NA NA 0.0 0.0 NA NA NA NA NA 0.454308208169 NA 0.0 NA 0.0 0.653920441757 0.369187155673 NA NA NA NA NA NA NA NA NA NA 0.0 NA 0.0 NA 0.0 0.0 0.602118316823 0.0 NA 0.0 0.0 NA 0.0 NA 0.0 NA 0.0 NA NA NA NA NA NA NA NA NA NA 0.0 0.0 NA NA NA NA NA NA NA NA 0.0 0.0 NA 0.0 NA NA NA NA NA NA 0.0 0.0 0.0 0.0 0.0 NA 0.0 NA 0.0 NA NA NA NA NA NA NA NA 0.0 NA NA 0.0 0.0 0.465862322301 0.0 NA 0.0 0.0 0.0 NA NA NA NA 0.0 0.0 0.0 NA NA NA NA NA NA NA NA 0.0 0.0 NA NA NA NA NA NA NA 0.0 NA 0.0 0.0 0.0 0.0 NA NA 0.0 0.0 0.0 0.0 0.0 0.0 0.0 NA NA 0.0 0.0 0.0 0.0 0.0 NA
--- a/predict/test_reference.fa Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,8 +0,0 @@ ->AT3G05880.1 | Symbols: RCI2A | Low temperature and salt responsive protein family | chr3:1755497-1756540 REVERSE LENGTH=495 -AAGCTTTTATAATATTTTCTCAGAAACTTTCAAAGAGCTTAGAAAAATGAGTACAGCTACTTTCGTTGATATTATTATCG -CCATCCTCTTGCCTCCACTCGGTGTCTTTCTCAGATTTGGTTGCGGGGTTGAGTTTTGGATATGTTTGGTTTTGACGCTA -CTTGGGTATATTCCTGGGATCATATACGCCATTTATGTCCTCACCAAATGATTTACCATCTATCATCATCTCCTTGAACA -GCTGTTCCGTCGTGTTCTCCTATCTTTGTGACTGATTCAGCGTTTCTTTTTCTTTCATCAGAGTTTTTATGTTTCAAGTA -ATTTAATTAATCATCACTGTTGTGTTTGCATTGTTATATAAATGTTGTGTTGATATAAAAGAAGAGAGCGTTGGTTTGTA -CTTTGTGTGAAGATTTTTTAAAAATATAGTTGGTTTATTACAATAAATTGGAAATTGTGTTGCCTTGGTGGATCACAGGA -CCACCATTAACCATT
--- a/reactivity_cal/dis_f_N1Am_rrna.txt Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,12 +0,0 @@ -gi|186498419|ref|NR_022453.1| -146241 38142 180120 134243 5639 6848 2492 1596 695 104 1741 160 1505 3009 210 1349 2366 197 353 97 3173 453 4575 656 218 3344 196 19655 540 360 303 351 1377 300 2479 445 3882 2244 293 272 3155 540 218 1849 1902 292 1037 15050 641 989 470 770 949 177 907 927 748 2819 796 490 117 237 272 723 994 173 162 157 86 147 65 296 86 342 115 1694 380 83 205 159 332 357 255 1017 697 80 599 217 474 673 246 170 327 468 47 818 403 25 100 57 84 527 158 349 409 220 94 111 177 27 207 64 770 309 108 92 47 63 17 6 25 10 33 4 117 35 64 27 1 69 42 43 163 12 9 133 81 44 213 125 136 106 26 1349 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 -coverage:3826.28048781 -25s -881535 25444 3717 6666 4105 1066 5312 343 7553 1085 1543 5253 1667 4505 459 1269 413 1261 730 607 10420 1646 3144 15184 1253 844 238 933 1794 175 404 2754 1743 7660 4387 6957 6100 2702 2614 1344 34079 3185 11237 6583 14826 17602 9766 3553 2416 1976 1029 924 1317 493 2836 2337 7838 5981 4087 7747 4284 3160 1343 5529 7297 2897 1831 9203 24331 4407 27066 6161 1895 2462 9713 1400 500 535 2222 2026 2424 6289 6223 9688 4505 5981 11264 1102 514 2659 945 2177 4547 2493 3746 1433 2051 6678 3942 2867 3626 2142 2436 9252 5393 2318 3421 1770 3056 5925 598 13029 3780 4258 22078 9323 25339 10247 42891 7507 23054 20111 3098 1782 418 28408 873 3285 15629 4864 8369 23169 1872 5569 7312 3476 2407 9044 29647 4041 17941 5740 24376 140713 22800 9594 21798 14222 23929 13867 3985 8217 5057 5324 16195 13884 10203 186562 14369 2116 967 15121 3910 2528 19370 3819 4080 134820 2777 1441 13904 1835 779 318 10123 5901 1159 989 279 5817 4101 2100 5160 21152 11194 3346 5936 5458 1245 1072 646 3531 3013 7250 6407 10119 15469 2266 578 462 3143 507 1729 2757 4586 110 23 20 0 2 187 4 1 0 1 11 2431 788 424 226 1770 949 1003 12533 2294 1752 615 629 549 299 517 518 329 3892 2430 599 3623 558 2222 2591 751 
1693 881 40147 3941 4139 185549 11408 5121 3102 2862 1508 2045 583 2113 1398 10303 202204 3622 3050 12547 2119 1551 981 944 3969 275 2145 1086 476 2576 1110 1499 1140 500 431 575 447 366 1653 2580 787 692 1220 1000 72 134 170 392 2413 754 2470 1029 415 456 203 262 169 1348 1142 1750 1301 818 3021 1232 2038 1909 210 176 1567 525 304 1196 79 123 359 173 606 776 1023 386 316 1540 98 83 49 278 129 251 335 487 194 68 644 148 240 81 2390 319 600 624 71 181 749 2860 256 4145 540 258 183 903 183 115 295 41 50 331 141 412 795 108 1191 3252 125 792 288 555 2688 962 337 369 36 104 615 897 136 148 526 585 967 663 956 620 313 132 226 180 348 1070 341 574 584 391 190 401 116 266 436 302 436 101 289 392 244 507 548 76 55 714 14 365 224 47 183 536 160 101 194 342 1200 145 131 54 811 115 77 204 564 1395 338 538 76 197 622 116 196 1803 627 965 31 79 259 177 63 305 61 98 622 67 39 89 1080 526 146 100 284 73 124 1039 109 134 29 279 340 573 2185 3550 2405 91 152 124 91 243 140 28 12 89 277 127 1296 4515 315 428 739 473 709 233 264 97 119 400 271 498 489 170 65 509 505 8 145 979 125 206 128 232 64 1530 91 130 839 91 100 227 85 89 219 39 27 100 300 344 1329 1666 1800 141 135 48 47 26 67 752 1616 608 361 657 520 484 1332 704 1705 160 151 61 164 92 156 153 118 113 45 22 1134 18 46 92 47 29 60 23 4 179 32 936 133 2 191 370 51 19 51 46 70 226 47 251 123 36 308 45 37 328 11 19 0 25 29 133 189 171 2865 183 53 84 43 2 17 13 35 3 101 46 288 151 21 402 259 24 100 98 210 2 9 19 2 26 1 23 56 52 192 58 28 41 4 0 11 74 235 191 15 19 62 35 4 0 14 1 45 56 225 10 156 236 13 4 13 7 160 10 200 74 76 3377 294 2508 3920 701635 17382 4008 16108 3395 387 274 1543 742 163 2534 764 204 1105 673 467 1137 628 318 286 5461 203 12872 442 805 613 182 473 1075 172 500 492 403 4364 532 7276 4864 240 535 202 498 310 1165 2788 1473 6240 2749 1484 6599 311 1998 1414 2399 1160 2224 851 3635 514 156 960 757 3193 1210 519 376 693 572 0 0 0 0 0 2 0 0 3 1 237 5 712 406 367 54 215 2451 2120 13909 1135 1526 485 377 795 935 100 
1703 893 95 101 761 90 32 704 678 28 120 2392 292 443 975 551 172 2966 10624 444 934 2095 704 1639 526 1703 743 1979 3742 727 960 245 1113 6843 294 723 1212 1322 814 594 677 167 1324 879 403 4692 122 361 139 479 294 496 1894 243 1355 281 400 626 128 301 190 1866 2018 6127 6314 424 1715 216 576 617 373 356 1380 7208 1759 729 5065 185 421 369 389 403 146 1025 906 352 142 298 222 1246 2757 716 1375 510 457 332 265 622 147 696 566 2292 1014 15081 8878 7033 3273 439 587 151 350 1512 157 119 734 286 40 86 288 115 895 397 252 478 307 637 719 1100 1862 652 274 178 3315 2155 1053 450 517 695 3772 591 1731 1861 401 332 221 1214 46 280 1227 732 82 174 1609 472 411 54 472 496 970 1142 1221 306 718 589 130 360 872 307 568 274 1251 166 399 2354 189 2909 444 2266 2441 525 227 596 1266 741 85 4900 726 177 2269 1958 1182 350 1957 570 180 612 1103 251 121 74 211 327 34 1411 563 328 303 1862 1044 2108 946 225 141 210 334 464 2672 399 2743 822 908 4185 805 3000 969 607 1012 559 106 1241 271 147 1012 720 194 503 6541 1403 6636 860 1169 3860 938 3076 1174 608 709 3117 1851 270 687 708 1813 5048 2130 1318 652 476 1684 6117 1627 2989 766 1736 7241 3872 2282 1703 851 1320 1963 1841 575 147 16 0 0 0 0 0 0 1 15 99 89643 5883 1671 2969 1064 710 7147 505 215 7254 1012 1856 3127 2333 1853 1271 959 5795 5912 952 2700 6021 1959 4209 2842 2506 13855 3762 3321 1732 31128 2827 1291 1431 3650 997 170 8627 951 5781 495 314 3554 102 630 643 386 942 897 1418 581 3460 1630 2323 2373 1278 904 627 169 1157 127 1038 1646 715 4994 544 8701 535 1083 2287 626 3386 3746 420 1112 3243 288 1256 309 190 920 1437 194 6532 1729 674 643 265 177 250 1130 155 5891 3418 2612 1696 1619 1869 985 706 1629 2682 1991 2234 771 4649 440 1587 1559 719 437 490 1133 88 739 1767 538 991 196 913 812 198 5311 1290 1080 395 1879 324 662 484 395 1410 1587 526 1268 219 1381 625 2733 935 853 4610 199 492 452 132 504 377 4520 1193 4787 3028 197 827 929 431 352 423 420 844 445 476 3419 335 867 1654 2721 652 1305 857 618 388 682 16131 8438 
2014 3340 715 940 324 1054 1353 1387 584 761 237 511 1895 204 1340 8353 4498 2056 5609 8653 908 12519 883 4480 39771 941 4475 432 264 2588 669 507 276 370 512 553 5417 965 12947 1546 1042 394 4780 5063 4441 12265 1156 3809 4986 2651 1057 2359 415 630 1161 618 1769 3594 3054 798 1153 1204 1411 515 1372 2945 5705 4063 7862 53609 4064 21774 24325 1750 3532 486 4491 754 532 535 949 1874 684 2732 2257 7631 13668 443 9914 9458 2248 1342 949 949 485 372 1779 2176 5474 5065 7304 2403 10023 3567 22185 2920 87159 31 0 0 1 0 2 48 4555 1854 1127 2614 585 17990 768 299 9449 1107 1953 7179 12336 3232 2854 576 1670 965 1755 985 31331 1199 1026 7084 395 801 532 3625 4148 1864 8345 4157 1994 6956 22918 6714 4236 10599 1538 5603 785 679 3979 822 785 6173 944 2095 4165 2027 3125 7796 1618 718 2343 484 1183 1296 1567 20771 616 728 980 820 208 546 2744 272 923 499 2348 3783 11308 6232 1271 1847 24 2 0 0 0 0 0 0 0 0 0 0 89 351 300 288 535 110 626 156 786 1092 50 298 121 2875 159 782 3165 173 1966 1142 1261 2122 2596 8551 240 9115 3643 368 2669 2014 880 1423 3378 880 609 8414 5844 4706 3602 7001 11501 12022 13679 10476 23836 10074 18582 5676 19445 3902 14070 7599 15154 2121 3513 6813 660 10245 8800 1932 14556 9167 5257 2119 4239 3906 543 1612 3336 1401 984 7956 17650 28824 6810 1928 1904 2059 8619 9682 3260 6091 5340 1575 3606 4469 1964 708 32185 2953 3689 7683 2417 10341 29009 2138 9499 5668 4387 64377 10067 6360 5021 3530 2408 96306 4508 54595 2345 5773 6140 4749 12010 19459 4768 2410 20651 2802 4126 4573 8447 3004 5393 16449 33261 8840 11096 4911 3010 14364 1486 2601 1586 6591 10130 29606 16771 14509 19592 4231 7699 748 18213 25767 19 0 0 19 0 0 0 2 2 106 75958 1669958 97659 24232 106371 33825 6463 63558 113856 11992 26904 139901 12300 18514 9374 20104 16368 8938 4227 3220 5052 16174 6583 1259 10946 26334 34393 118377 51455 33413 36320 14123 105334 5480 6410 3394 2884 5449 2323 5835 10053 4526 1633 34245 1519 1125 42849 3545 6084 6963 1783 3680 4631 5594 9651 101194 9719 4729 68124 
3916 9185 16656 5965 5896 23260 2361 5478 5453 4941 6890 4002 668 3113 2763 2649 5164 1178 1464 1723 4459 2436 917 37184 8455 1646 7487 421 787 1733 791 2170 1758 883 212 2891 1048 949 7401 670 2527 1527 1339 11105 3050 2546 5543 3210 11959 2827 18338 14858 4205 5478 2753 2779 2873 1383 2014 4145 10799 10980 6751 14549 11772 2384 2135 712 629 660 668 673 3561 1629 813 907 405 528 574 904 782 3258 1146 1767 15269 1393 1936 405 414 2816 1284 760 445 731 572 276 320 3325 7010 941 1325 867 1339 265 275 1850 2634 518 2729 2637 363 526 376 239 862 389 687 2026 1220 298 1306 694 61 1277 288 438 434 215 6225 2357 1361 3662 416 7488 743 746 485 249 366 210 97 331 84 190 376 150 404 211 67 23 59 21 9 189 78 145 380 12 3 17 97 266 136 1011 371 850 345 610 217 205 189 30 54 138 46 760 35 79 327 1057 67 290 307 5139 2297 8529 547 117 188 233 147 36 566 37 39 39 37 335 23 82 1565 257 49 192 589 84 862 130 4209 195 253 313 74 344 281 32 981 1193 71 1660 83 160 47 24 162 87 178 386 287 129 173 268 54 581 1061 713 299 108 113 61 133 40 321 149 19 566 124 104 983 294 293 60 838 2816 1781 305 1237 576 463 325 125 205 543 589 1120 382 337 333 33 1738 345 91 1641 185 358 1188 4629 3364 2637 1178 2596 455 790 560 960 335 409 488 1877 784 2693 3142 354 765 2282 223 590 524 3005 3024 1016 1894 1990 1733 811 3949 1603 273 1344 292 405 1112 297 762 409 1519 449 688 362 716 370 292 1189 600 581 2013 288 370 382 899 334 537 4576 468 421 352 1790 750 395 1111 344 535 162 686 15966 1584 1396 277 303 4401 182 667 259 728 433 520 12626 997 3152 1536 474 85 236 1867 146 594 298 332 1529 151 226 771 4171 223 1378 653 520 104 2532 3701 1666 1825 274 409 825 164 144 1333 2166 444 545 224 7301 179 663 2659 138 1230 805 329 0 1 0 1 1 0 0 0 1 3 1 142 200 72 98 1160 1050 104 111 1370 226 132 773 1882 712 1192 7761 689 2853 369 282 234 303 414 116 1887 415 2774 566 81 778 693 873 939 1093 1615 230 123 253 156 1 27 824 208 1686 5087 1382 860 4543 7350 2482 2873 743 2996 149 1325 2715 581 1511 208 1659 233 
1199 1763 369 568 1920 556 363 1911 3636 248 508 5458 1960 3502 1676 673 315 1004 2845 1404 762 1160 1109 104 600 1065 538 690 2119 2507 2120 1750 1881 3465 3830 3768 1541 571 1341 5618 3599 1903 714 623 499 257 3354 339 72 520 77 152 673 346 144 130 182 55 311 123 151 565 409 315 229 192 350 497 1361 422 433 1674 266 449 919 39 1471 144 453 585 254 3505 406 387 323 332 136 106 420 476 61 1484 1086 503 123 146 446 224 590 769 490 5915 815 433 2607 2716 744 1538 974 1822 304 608 2051 2013 2283 1409 1845 2559 670 3516 378 838 1723 366 1165 2334 779 630 251 1022 374 918 150 489 2756 299 123 1086 184 141 497 172 456 40 461 943 649 393 3455 9512 3623 3138 13746 597 2652 2875 1148 179 490 4042 1253 2920 3073 1873 1147 831 1096 1192 244 413 846 1439 2691 1286 2657 358 1039 215 439 1239 161 441 7350 28 4257 1728 143 1973 2777 5188 2349 2634 1536 1710 268 278 1705 50 473 241 1265 232 7867 774 1727 1644 944 471 783 709 3086 2582 4045 885 19507 1069 1472 3112 2132 2758 2162 440 377 433 456 1629 989 266 620 383 3298 3134 1830 369 385 2491 47 1446 2313 633 378 2058 682 1503 209 773 1157 428 890 2023 192 7210 1563 2425 32109 1892 10465 1207 840 680 2859 901 554 851 176 3037 4944 270 577 701 647 331 698 234 362 707 958 2128 1034 1431 3016 2860 302 6284 738 274 203 955 1419 2004 1370 3673 9598 765 6901 11602 456 2508 2622 141 847 1223 1904 7081 1511 296 1716 1789 613 8853 414 801 5372 1461 3507 464 3118 2826 548 2162 2759 303 1181 6000 1904 3554 6528 1379 2379 2758 2683 8105 2662 9700 601 863 7023 1678 1915 581 2901 2528 653 2972 876 1987 4498 3446 860 2689 4054 1803 25217 8111 10173 3781 1572 944 1417 1228 587 8564 3238 2548 1040 3595 932 5971 1897 3007 7696 2903 38995 21340 31470 3068 4031 10895 8550 20036 17508 12619 1616 1348 17528 762 3552 28634 4541 5892 6047 13672 1584 6897 17395 3338 7007 6943 3467 13132 8107 4118 1225 3170 6059 1810 1080 1541 2157 159 427 162 9 1 0 0 0 5 1 0 14 80 110 366 248 753 223 254 163 202 181 1081 14294 2402 5225 31062 1281 737 390 652 1043 2075 
2079 1041 656 478 295 250 151 320 134 367 255 914 414 294 107 68 54 61 157 100 51 488 152 170 134 43 277 92 40 656 109 56 267 338 77 161 67 85 132 100 27 62 409 52 134 2132 717 787 266 138 126 977 35 2295 105 61 85 164 159 46 188 1019 416 232 144 38 419 173 48 75 175 139 45 603 92 217 238 113 3152 108 2152 1077 62 154 338 1375 981 1032 277 309 880 352 3016 230 632 872 150 458 80 1401 614 225 105 32 7518 203 177 330 829 395 102 1574 203 34 343 127 256 634 160 1878 3338 71 91 423 223 736 1975 441 4934 675 1420 655 2009 2015 255 1184 183 658 48 224 110 201 52 695 2739 3226 991 225 792 274 342 242 1101 3375 1349 615 307 506 284 118 571 67 463 367 1136 895 528 1495 458 473 195 401 155 2547 821 641 773 3203 192 1967 547 310 3089 239 979 2227 435 337 7724 407 372 341 762 532 81 538 840 1001 443 444 561 372 204 508 130 124 377 217 376 369 9 5 0 0 0 0 0 0 2 125 39 123 1176 1041 265 240 1029 206 241 747 1290 3205 1842 1714 535 588 402 716 256 175 449 970 623 1385 109 2189 606 946 2854 413 6218 2909 1602 269 1480 1387 1911 837 200 2638 464 535 5487 418 3451 1159 1492 537 3699 1351 2751 1973 731 950 776 576 183 1552 477 673 195 372 663 595 1185 555 1032 136 776 250 1910 393 368 1594 8778 684 10221 1571 996 6691 602 270 5658 455 805 568 1840 886 1314 2585 2045 2385 1707 612 516 872 1354 801 136 851 2593 1221 405 6194 331 587 1549 156 811 133 307 1678 400 155 1201 364 965 187 3068 4439 1601 15657 1316 803 970 273 501 814 411 791 1407 3896 1035 2249 2427 2207 869 184 1617 487 487 2515 493 11642 694 706 890 469 188 264 1724 410 525 287 1804 1951 295 392 270 235 73 1145 101 1050 2496 6971 480 1251 672 939 180 116 3268 175 747 987 121 4347 9976 736 1235 740 897 17387 36155 97860 6230 1808 2216 3012 1205 178 126 3421 152 1559 319 708 1187 700 8075 272 5300 2935 1951 1034 1787 5461 2144 7541 5725 2993 861 2410 350 1519 261 2335 5529 1393 1916 973 5156 560 343 579 951 433 3374 164 1035 1384 251 1731 1434 1545 6242 13046 3997 2158 4740 3898 4140 2744 6003 2040 709 2574 680 227 1789 3921 
881 696 4904 419 2183 4713 5727 8957 2600 777 741 1430 2317 2730 9235 3564 1146 2497 1540 1176 2237 604 1318 562 15311 4047 5112 6831 2689 1817 903 531 4965 211 10519 874 325 419 258 357 269 375 952 998 742 6080 2333 2486 1526 822 1872 7156 746 360 641 1827 1497 154 1090 392 393 4726 401 330 869 1184 1429 651 253 1677 758 686 355 394 300 333 596 589 595 562 1148 8644 5295 901 6555 811 1132 4710 998 2525 421 1928 5434 355 1612 267 2751 4048 1828 1094 4299 1362 910 3308 302 2409 1639 874 1702 853 805 463 483 1445 675 770 4616 2689 1329 2285 14951 5151 277 600 3685 2095 7211 3099 7803 4609 1289 237 333 314 689 142 656 1333 704 886 738 1094 1577 1751 8486 4665 882 942 4077 1357 982 1967 1361 817 1370 6514 1484 15293 2222 2384 3915 4 0 1 0 3 0 2 88 569 288 408 296 1776 2817 455 1517 1116 1350 814 122 11881 772 2562 586 208 2711 449 1150 777 243 543 315 241 200 614 645 128 77 12 22 18 22 118 3 11 26 31 5 19 51 37 136 68 22 52 9 9 44 21 4 2 0 22 17 2 8 3 22 163 25 19 49 69 146 69 114 57 107 115 32 29 53 156 8 91 21 1 2 0 10 0 0 3 0 269 20 51 151 26 26 8 1 14 0 1 5 15 0 2 29 3 2 17 2 1 74 15 19 44 38 8 17 4 60 0 55 0 7 303 18 7 3 14 35 64 215 191 62 97 330 92 33 38 6 5 17 24 73 18 16 4 8 2 13 1 1 7 34 86 306 256 70 3 15 17 1 1 2 8 0 0 1 0 0 2 0 0 16 18 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 -coverage:3967.112 -Arabidopsis -3576 59 260 50 109 47 4 158 108 38 202 49 126 56 11 88 6 7 123 13 81 27 273 29 127 9 191 47 19 52 39 89 83 3 8 19 37 90 3 20 1 19 67 2 25 0 0 0 1 4 33 10 2 12 3 12 4 0 2 0 2 0 0 1 0 31 0 5 0 0 0 0 0 17 11 0 1 0 0 1 33 1 2 1 0 17 1 0 0 27 0 3 0 0 0 8 1 0 33 0 8 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 -coverage:55.6776859504 -gi|20197903:2706-4513 -664844 19584 4512 8188 8869 807 1179 1838 1586 921 607 1482 290 699 1111 1305 635 1275 5971 1179 4954 1240 1531 6628 1388 27681 3268 6430 4637 1469 2014 3018 748 2327 1924 1076 8566 2026 2590 5458 6251 3000 29511 8288 3592 3814 2097 1650 2200 2406 6471 1220 4400 1142 22480 693 4580 2842 3536 1989 8994 
4179 2077 3824 17310 8031 1121 2926 12754 1692 2944 12550 39746 82946 103909 35885 9457 9934 16206 3476 4979 6430 3370 6737 1616 13661 7418 887 1298 2649 1170 9062 1515 11022 907 1687 1151 864 6742 2720 34680 9511 7118 15779 5712 10571 4170 1341 7539 3114 10598 13699 11500 3081 6725 5103 1940 1993 2048 2275 1567 7186 1901 2083 5306 2537 2261 5461 2635 7179 18457 2027 11585 90440 3816 15265 5042 2611 13193 933 1674 2093 29483 3178 1315 4260 2904 2233 957 7267 5625 3740 8214 7715 9121 6022 7373 2831 4289 7253 997 5268 5199 2267 8245 14334 7108 1785 13819 1244 2162 2539 6363 1071 15654 29440 17948 12642 9103 13633 877 1166 3673 368 1350 12855 9487 10620 8071 39600 14068 4994 2977 4056 5970 41418 1299 1239 15876 2006 8971 3516 41725 10930 12997 8058 18683 6234 5983 9932 5611 31845 342908 112205 14220 12651 13688 4426 2215 22024 1068 1862 18098 2251 2601 2067 1823 9482 1109 2781 11972 19528 12623 2655 1159 4393 3154 22317 10622 7090 3766 16259 8754 13582 21038 2308 37832 4403 3558 20759 7681 16935 1935 31800 64462 4552 20884 2409 15769 4583 744 15590 1678 3356 15092 3458 4406 777 13401 66912 2520 3482 1625 15533 3057 640 3028 940 3159 28004 344212 214281 42282 148322 15460 16340 9728 8684 14160 598 1611 11418 1615 11035 2250 31897 18582 7879 19658 10420 36192 29084 17723 9600 20741 8246 7233 5613 2394 1883 887 1639 1053 1766 3104 12503 33150 2237 13088 8880 4069 3305 2482 13206 2144 1701 4600 1293 883 734 552 1293 1578 432 8626 3588 3282 3207 622 214 1037 1353 323 320 3070 1178 360 3458 648 485 336 486 470 1593 650 2059 3987 156 1066 181 689 558 429 4770 343 265 533 1270 1183 3431 6261 2038 1896 1338 1526 1465 779 1252 3207 408 1327 3972 338 1400 502 398 299 264 614 505 961 1075 1052 254 52 211 259 332 337 409 831 1915 609 914 8376 160 1324 793 251 157 2753 208 256 5222 209 2465 2013 883 427 5929 4381 2020 692 1344 1345 1068 898 309 2363 721 1152 1553 496 94 315 694 449 1761 651 13976 10935 7836 1980 507 2405 491 699 880 1760 554 967 175 791 262 823 3946 1066 12897 680 
1191 828 120 153 1291 535 897 1786 774 1254 377 403 9594 1370 3962 9192 4206 9554 2167 9910 1258 3750 10106 3045 6387 1813 874 2302 529 344 88 555 153 239 983 874 17160 36573 440626 12682 13300 8366 5816 2874 1231 2949 403 904 3168 2219 35730 27479 5426 1530 1906 3166 6493 524 967 5143 1814 2394 13203 5245 6919 7640 7142 1933 4778 5909 2238 2250 732 441 1043 879 4700 1055 4024 28436 1290 818 6324 3923 1581 7174 16715 2892 6104 27838 4195 1729 2361 1444 2128 2720 3114 5545 603 20528 2917 1446 4450 1042 1545 1916 1683 340 1115 1915 1505 4843 4265 2738 1528 1835 1107 1498 883 1945 8718 5116 7390 21865 13665 2598 10052 5750 1173 6885 1179 1058 3757 1590 16889 17482 25590 10363 1814 7732 3469 4304 11242 20846 12543 206888 30140 20555 5083 23778 11712 3836 13382 3148 3452 6940 2250 3093 3095 18212 9127 21513 15736 28391 31012 8063 4515 8365 1748 1311 16363 3564 2104 14771 12754 3593 14205 12076 3760 1286 11426 4762 7344 4553 1567 7522 7594 2545 8636 1538 18103 2667 1654 8824 1022 1914 2478 1963 3725 2503 1937 5444 5399 668 2276 5734 6230 20711 12826 13399 12489 11736 4466 3694 4814 31552 16213 68719 6544 8953 3954 1915 5200 585 6225 5832 5120 64944 3869 2336 3941 2128 18719 9654 13437 6721 14526 11861 5504 16169 1599 5772 7011 7185 19109 8869 12053 35372 5364 1835 2053 35541 4586 3268 7467 3093 16799 135282 7492 8490 35564 26985 122709 27102 10252 6491 2495 1014 569 35051 1725 2304 146622 3965 5681 2029 6419 3092 1801 4838 5681 1353 9116 5566 2967 4630 27222 36971 16499 1821 8357 20475 4172 10081 10468 9828 1771 17474 9233 7044 15969 17181 32298 8821 14480 10649 4068 8906 3394 3564 1486 4256 40799 34618 5777 10405 7947 26370 12510 22031 2509 14303 8987 4719 34257 73258 9721 2550 2154 5237 1202 12015 3441 4884 30129 5130 92243 11309 82439 25721 8193 11232 16084 4389 77025 4587 3101 4353 2055 35287 5054 8028 30793 1882 23537 40334 5311 17780 17307 7010 9830 4570 40768 5520 4769 12705 1860 2095 8289 5302 995 1429 10420 14674 9100 1971 7869 10580 12761 11475 2077 1253 2663 
3338 2080 6933 26858 7540 25514 14264 998 17039 12078 1760 1579 4691 11199 10762 31838 6990 72150 30655 9333 73128 39521 15581 24584 54402 15465 12320 10409 3667 3912 30971 14474 8626 3910 22307 2319 3167 2799 2783 5397 28612 29905 34939 7630 28768 2819 9438 22698 34915 3824 6286 33361 14469 38288 19161 11188 8439 34170 4546 22868 2460 9456 4218 9343 9126 26929 31871 19970 14362 19537 21187 5832 12562 6312 4898 5788 59726 20518 17851 20273 61446 15708 13619 8455 34807 3887 3132 85705 5958 5021 37196 150956 6976 37456 37148 5704 6902 19600 8376 19456 25363 21697 13905 15276 7275 63037 17528 9280 3988 14370 40614 10653 66891 39572 14272 3823 132462 24073 35227 63510 20084 11101 66418 10769 147577 45703 42097 29466 83254 48962 8076 64662 185605 17800 11836 505929 68907 31508 21129 56762 28777 18922 19761 4103 5013 6966 1436 11706 3561 14687 164845 9477 8591 55886 37650 22474 92985 8417 3062 43393 27607 15292 41719 19221 26992 4894 25987 19248 6765 2461 58729 14552 4541 31251 10509 14202 26568 5099 73898 19781 16738 31415 15382 20421 107908 86035 27870 17288 61677 6051 7074 22804 10797 3336 14022 1787 1905 38007 8645 6530 21764 5691 3712 2378 22041 25834 2171 6764 2764 1136 1224 815 25524 2618 4681 3069 1625 2110 2242 15920 12001 68089 29332 12018 5145 2081 6627 438 2302 660 609 703 969 1708 1777 1684 179 8048 815 504 3452 1788 6154 484 564 1069 581 983 392 1212 1502 1215 568 2044 913 928 2185 1096 521 249 54 135 327 142 110 435 102 56 83 71 190 258 136 508 801 477 532 409 1117 71 129 315 103 393 138 770 227 164 114 318 112 404 164 475 1089 200 1123 1570 543 649 1083 3060 611 564 753 1148 253 90 1390 219 399 268 737 828 162 379 133 42 373 83 12 373 72 77 486 151 123 532 206 124 160 67 51 119 48 38 441 346 12 269 625 382 892 1806 960 1498 655 702 289 787 2651 5539 113880 87284 6002 5671 1997 11349 548 190 433 316 1383 274 1208 2291 912 366 240 5390 2279 186 6122 386 412 2025 1251 1426 569 815 9874 3104 5782 2530 5808 2491 1176 1695 3187 7538 569 2392 1322 707 417 4272 
1007 596 443 2206 439 563 467 1936 460 2450 535 3704 47219 1393 1521 3606 3698 1146 2176 550 3103 1904 1991 3758 459 2536 1431 664 6732 1074 478 1392 1161 440 2922 2052 848 5417 3711 785 26047 1056 719 585 1719 1354 352 9201 4149 1823 863 5013 4140 1012 997 1165 3135 774 714 940 1269 642 1532 646 1767 12456 6933 5326 1112 2604 4358 343 4361 6205 4815 9839 19013 6906 7165 2050 3029 2070 3562 3082 17744 1465 9525 12001 3158 3422 3596 48310 1976 6145 3100 1095 10107 699 963 9350 3643 2831 1830 2341 586 3926 2996 3169 2039 9574 10042 3331 2034 4768 4877 1358 1472 23895 4192 3601 2608 943 1318 3942 4524 9164 6857 82241 67542 32820 11002 1544 8654 4139 625 18461 980 1112 2882 10559 1903 5415 2082 1058 4076 24523 3904 10790 7816 4672 3290 3631 3155 358 3431 41867 8588 3107 18282 3822 1542 897 2563 1736 11816 23153 25312 9509 7488 4296 3117 5434 1284 6696 8269 4647 1083 14955 6786 14167 171751 172871 7227 5767 8462 6969 6007 21838 31757 46315 16731 27427 36246 2670 81174 9126 7668 10516 3961 5267 7784 3707 4923 13191 2113 1178 3105 5142 3910 5987 27511 13176 5570 34542 6277 3342 17860 8058 3250 6706 3920 1047 2720 2352 12670 2945 4647 67084 5025 7032 3923 6095 2556 9447 1552 10554 38393 5899 44231 6108 8287 2618 46807 3952 10152 13759 24063 10133 51288 4343 18775 28580 2182 6278 17574 5287 25614 17408 19796 120363 6585 81013 12888 2659 3959 1759 490 250 1963 1463 1791 21634 3834 6960 11880 1166 415 1636 770 2447 2160 7540 8943 3339 17768 14512 6606 7994 12307 5877 9936 13451 9254 28653 8081 7425 21963 2041 10890 7362 1481 2686 2354 1397 14777 4637 1984 1402 2639 3108 12492 6124 6092 1011 6926 7711 1599 17933 2649 1778 2591 4517 13666 5636 8725 2332 2001 892 673 343 497 2018 535 1268 5157 235 4114 3191 383 443 2401 19630 5818 5322 1750 763 2090 703 123 720 863 262 710 339 301 106 32 172 22 519 233 1913 787 55 1369 544 53 883 20 57 75 16 429 135 195 418 30 11 320 23 104 642 39 22 26 50 21 29 61 16 114 73 169 214 465 427 110 302 506 121 583 70 649 106 74 55 53 2575 71 74 259 
28 48 5 259 268 783 443 2699 1043 1060 1764 21130 7175 8395 6374 3451 8792 1893 1191 2094 2591 1385 2204 1853 907 222 231 1141 631 268 216 129 258 258 29 136 37 744 2427 56 295 38 34 118 7 6 290 44 6 39 59 10 14 32 80 46 71 162 11 44 73 29 2 13 0 0 3 3 0 164 1 13 23 0 35 13 72 16 6 32 53 9 19 1 14 131 12 41 3 60 105 39 0 23 4 82 61 20 60 148 56 33 3 5 11 28 2 3 29 74 3 67 6 68 22 8 109 5 16 21 98 172 113 18 43 35 16 12 0 7 24 0 3 10 0 11 44 52 63 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 -coverage:10529.2378319
--- a/reactivity_cal/dis_f_N1Ap_rrna.txt Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,12 +0,0 @@ -gi|186498419|ref|NR_022453.1| -120950 30299 169046 110541 5621 6575 2125 2733 591 78 681 257 1074 2477 161 1445 2282 224 589 156 2244 822 3768 1088 175 2330 246 32371 797 555 234 396 867 146 1141 349 2490 2039 111 259 2632 434 257 2169 2418 271 1574 16513 624 504 309 402 1100 102 714 765 857 8624 861 446 75 144 255 863 432 143 133 31 23 84 131 130 159 341 148 4789 473 108 132 123 236 438 183 1011 881 229 617 194 632 338 81 115 547 725 43 453 636 21 210 34 329 1140 189 439 115 228 62 204 221 14 67 15 476 590 514 11 16 26 10 13 11 2 3 8 177 382 104 8 11 9 2 185 61 14 12 30 19 15 130 575 59 16 23 963 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 -coverage:3510.65853658 -25s -3160472 70217 7776 5133 2982 754 2925 902 6259 1264 1816 2767 752 4406 732 1556 536 1391 399 364 5590 2101 1495 7419 931 550 195 570 2390 211 1195 976 1957 4087 2585 4950 2485 2586 2338 418 11451 4182 4426 4128 7610 9905 7473 4201 2120 1600 1698 1540 613 335 2455 1234 7537 3443 2798 5504 4177 3390 1792 4855 5692 1855 1313 5978 14121 2649 14494 31539 2416 2286 6855 1012 360 710 1230 586 1483 2938 5425 20760 3031 3671 5551 464 594 1156 1019 1372 2671 2558 3369 1180 1270 4844 1916 1616 3996 1607 1949 6636 3503 3180 4028 1974 1435 3331 427 7963 2308 3851 54392 7103 14598 9361 89394 24134 11950 9382 1848 900 1222 12808 182 1305 7616 3497 4268 8371 2210 8622 5111 2192 2002 8630 18071 2313 12842 6275 27446 598639 83151 6938 18353 15860 44948 6369 2027 6487 4230 4869 13733 26704 14133 485231 23075 2747 2397 11888 2352 4795 16159 1940 2289 297883 6325 2594 13678 3575 885 467 10460 21099 1263 1126 675 4599 6013 3097 8008 17044 14240 2873 3927 3576 1049 1236 522 2346 1780 5999 10767 29170 14153 2746 377 628 1881 337 3319 2947 4670 88 167 16 3 0 576 27 2 1 10 56 1428 823 282 147 1197 1238 1796 24396 2938 2290 825 712 346 257 454 854 531 3883 7407 1477 3695 651 2092 3870 1461 3114 
2016 102489 11072 16810 207605 13610 12019 4675 4935 1109 944 427 2311 1178 6596 164355 2934 2141 12380 2889 1557 1271 839 2364 357 1309 625 290 2384 1474 1853 833 388 233 647 844 540 2704 6103 4785 603 584 1099 91 168 189 355 2672 2190 2028 1627 704 2064 203 182 142 1676 1652 1938 2149 3039 13586 3390 3994 980 381 100 1389 583 81 1475 287 413 461 150 445 1460 1491 680 214 1433 97 297 242 130 79 123 346 678 157 57 1030 324 147 73 1301 232 282 303 76 143 606 11413 197 2083 888 251 188 425 70 51 175 90 82 365 218 439 670 213 5206 22665 477 976 293 1048 12454 11327 762 715 99 155 1647 2565 135 134 189 762 2633 3133 3890 2256 576 351 370 294 796 751 284 1124 2099 313 324 287 41 136 453 225 157 71 147 521 400 645 407 202 47 1151 43 363 93 44 169 1050 90 141 244 344 3183 61 137 146 427 92 90 69 294 1627 253 183 82 125 285 149 549 588 2202 518 43 40 155 72 21 262 21 91 161 49 43 363 1058 1455 169 142 147 30 170 1744 96 127 141 422 793 1572 5683 6573 2958 80 198 138 106 134 364 30 104 108 197 92 1082 5153 314 627 942 495 779 143 194 69 106 501 114 169 210 126 27 513 473 43 143 559 105 316 122 129 205 959 147 180 606 138 62 133 99 109 588 75 57 255 306 872 2317 2851 5736 409 129 153 43 17 96 695 835 694 413 906 629 436 2016 1535 1929 705 215 110 180 59 112 72 49 121 84 153 578 86 73 144 15 37 169 17 33 39 0 261 172 3 179 172 8 134 29 16 26 204 27 465 103 19 286 26 36 98 11 12 0 20 4 70 235 347 3917 272 81 266 14 18 1 27 17 13 136 100 427 218 38 497 470 33 68 101 26 2 33 11 14 47 12 144 36 15 24 5 7 27 8 2 9 110 103 9 20 17 52 17 23 1 37 3 1 24 77 40 23 8 10 9 16 19 17 1 61 52 25 1433 183 1527 3104 507034 13115 2403 11156 3091 228 166 1095 765 361 1608 1180 186 718 254 423 1031 213 236 933 3246 160 6528 228 528 336 110 304 879 159 361 502 537 5311 332 3824 45927 1222 1596 474 470 384 1762 4474 2659 6586 3747 2533 86064 1475 3914 14159 13563 4279 5489 6824 25438 1313 352 1511 1082 8377 2873 904 787 1354 1286 7 0 0 0 6 1 1 0 8 2 305 35 681 1067 186 173 214 3678 1729 16159 1238 
3106 317 439 617 621 64 1548 3591 119 309 394 148 125 288 842 68 19 1289 455 375 691 508 154 3183 72776 2388 2739 4683 4296 9881 1508 4633 3913 5154 21439 1755 1314 654 1669 7229 457 940 1267 2905 1246 303 739 415 1416 723 284 4660 113 369 503 866 444 534 1397 188 1573 371 301 1121 93 174 164 2696 2111 6846 15540 456 1165 516 708 611 372 358 1036 8042 1791 484 3670 74 373 178 674 308 35 1175 1353 221 250 166 486 1073 2776 825 7360 3272 1179 123 353 614 154 1265 964 2517 1619 30015 8097 18838 1509 217 891 132 378 1546 71 401 617 550 366 157 251 44 890 595 241 867 165 1026 999 4122 1708 1275 518 307 4091 10249 3674 755 1009 1109 16250 6904 15392 6434 790 482 118 1454 51 998 3656 702 185 320 3121 658 422 65 325 987 926 1268 807 703 1064 670 195 416 1112 466 481 432 2362 804 857 1854 750 2605 235 2560 4128 780 257 685 2311 922 77 3224 1439 457 1804 1613 989 719 2468 891 70 488 534 162 105 157 139 253 52 1113 249 320 360 1323 1361 2396 783 271 121 287 333 623 1835 371 3183 1486 662 3085 831 2999 742 420 695 596 60 1577 192 310 616 515 190 1183 5599 4359 6022 693 1128 3997 1085 2654 951 437 583 1834 1428 206 697 507 2121 3664 1844 2022 1078 710 1073 5000 1586 4369 1484 1718 6133 4395 1992 1492 1006 1363 2877 1804 512 208 23 4 5 8 1 2 3 7 54 173 65288 4763 972 1827 471 644 5053 370 180 5532 1194 581 1502 2066 2866 889 697 2619 3612 878 3281 4948 1269 2071 1700 1747 9068 3947 2861 3836 25599 2219 969 774 1882 814 209 3383 1504 8313 611 217 1874 109 242 459 91 301 469 832 478 1867 1392 1853 1576 650 514 455 184 745 82 789 737 672 2152 398 2255 757 1873 1545 582 2434 2431 151 451 1795 351 981 127 131 507 629 201 2616 821 280 144 120 150 83 358 103 2498 1027 1636 1246 616 996 575 254 1135 2139 1880 2611 643 2219 352 787 1585 857 432 264 1175 63 258 1001 618 1301 357 1624 359 338 2809 747 786 327 1237 209 560 511 164 1060 5813 480 224 359 1008 342 1689 303 252 1749 194 276 378 150 792 312 1649 791 2560 1633 136 419 303 87 130 238 155 587 331 407 3031 815 1038 2540 2502 428 338 
977 742 122 1413 10329 9529 1398 11833 1333 948 181 939 1676 1477 763 1153 347 331 2795 941 2683 10238 5552 2100 9658 113576 3141 13973 1376 8661 297556 5134 6052 2271 1716 1814 1036 657 259 875 909 1392 4499 713 8604 3543 1283 1035 8788 40049 18645 17080 9901 10591 9064 9247 3055 3852 161 1167 1538 655 1548 4547 9202 1917 1703 1411 2171 1212 3956 5528 16982 9275 18861 487491 18157 69822 144097 7900 4868 1124 3177 2556 687 637 1124 2217 834 4561 2915 9158 23401 877 13556 32475 3687 2221 1020 1333 359 401 1520 1841 5619 6552 22847 5786 16753 7239 17545 2472 42506 46 1 0 1 8 0 163 5839 2439 1791 2199 605 13763 421 425 11142 1585 2249 7419 11081 3924 1901 415 871 770 1588 759 14006 904 845 4384 410 869 420 1610 4948 2303 6636 7248 2001 9413 28171 6110 4417 12212 2191 5024 849 557 2872 485 1061 5742 1640 2312 4370 2864 2906 6964 2628 1090 1909 1677 2054 828 1389 13934 658 998 588 926 223 2159 6205 157 746 713 2627 3098 13609 25716 3496 7880 33 2 0 0 0 0 0 0 0 0 0 2 75 367 266 210 538 107 632 121 602 1200 347 203 441 1907 102 422 3394 214 1442 843 707 2292 2047 6033 2064 8211 5508 451 2672 1627 779 1221 3679 1635 998 5851 4609 4448 2553 6848 12922 7943 9396 13161 28683 14377 13190 6924 9891 3432 10803 12518 18312 5647 5469 8617 1661 10296 17593 4302 15343 6273 4521 2414 3148 6604 1802 2319 2548 1059 848 4336 34260 26791 5869 4048 2155 1775 7643 7946 11333 19871 8545 1072 2264 2645 1230 584 14483 5267 3448 8473 2570 15416 350181 10644 19662 6422 5570 205826 79123 30956 5990 3283 3071 65633 6340 26438 2668 6403 7173 7248 15695 15678 3775 3963 16322 2381 2796 4328 8573 2452 2962 12401 20436 14814 14379 3791 4406 8783 1307 3190 1351 5120 10832 30780 20818 21966 42888 19268 3136 1900 15381 12057 18 8 2 94 6 1 19 0 14 82 29178 1537402 154384 25671 53736 26917 5254 40974 306473 20984 28256 62025 9982 17188 8747 33620 31590 16776 5449 4884 8264 11900 7839 1094 6551 15535 25616 144487 95336 76982 100883 22690 926579 23942 7415 8152 6064 5299 2423 4923 17367 7371 2245 25656 1891 
2504 65222 4861 10338 11619 2198 5366 5167 6502 10101 78663 10651 4257 57027 3155 8599 14624 4392 4156 20607 2322 4843 5209 4444 6195 6809 1135 5736 3385 6272 4170 618 1627 3526 5352 2357 1138 59786 14708 1787 6419 467 674 2443 509 2032 1653 524 280 1895 747 645 3479 675 2902 1474 1268 9649 7729 2240 5452 4036 9431 2816 15525 24052 5170 5377 2488 3433 2484 913 2689 3730 8775 10795 6995 15727 13549 2151 2214 729 485 481 1041 763 7173 1466 775 621 186 579 458 890 911 3408 2175 1525 52543 2221 1998 456 397 3503 1292 737 310 450 384 113 367 3571 12068 677 1134 714 2285 448 171 1900 1990 437 1930 5171 170 506 148 158 914 293 504 1889 1424 226 1189 557 82 685 400 512 607 378 5884 3303 1380 2561 494 5727 675 667 547 190 696 118 32 227 48 208 203 117 318 175 188 51 30 8 13 124 49 114 315 32 13 38 52 71 93 825 570 750 284 529 369 267 178 32 82 26 22 401 74 10 290 4528 110 425 267 3854 1696 6510 738 108 65 144 139 39 285 105 18 13 43 376 12 54 818 149 53 205 294 86 358 331 2968 251 136 810 311 743 581 263 8755 16380 497 1558 1393 187 37 20 94 35 198 263 434 318 420 164 49 764 1379 398 134 260 32 22 404 22 316 40 44 359 179 311 771 3078 326 42 766 4734 1524 426 1390 4721 684 333 601 665 471 467 598 1060 983 185 56 1239 1044 67 941 116 447 801 7383 4548 2549 1427 5010 1023 822 418 812 341 423 664 1534 1242 1819 5296 278 702 1107 156 1720 587 3655 11652 5076 4351 13937 12898 782 3517 1200 215 1630 267 171 735 343 875 232 1197 719 626 505 404 292 257 1240 191 221 1019 95 225 245 582 176 925 3174 819 250 467 1481 1294 219 456 240 606 254 1063 77562 4222 1026 738 820 4285 100 640 128 659 293 401 8725 595 3196 3253 492 172 500 1660 358 426 300 226 2034 162 138 798 13925 294 1217 835 524 187 2828 4384 2329 3875 308 643 1222 155 316 1365 9469 613 932 304 11778 531 593 1700 106 686 380 152 0 8 0 0 2 4 0 0 5 1 8 139 169 368 114 1467 5642 184 161 1606 377 176 1368 6094 3675 3854 18621 1643 8970 463 322 158 272 774 171 4555 1108 8622 1129 118 1117 1284 643 968 842 1460 142 119 255 69 14 
170 1194 472 1746 8194 5742 2594 9161 26159 12020 2616 2397 4471 214 2687 10382 1234 1206 487 1646 735 3761 2337 570 840 2334 733 888 5406 13700 868 618 5200 1745 5654 4129 869 382 1627 5101 2970 2530 2425 903 133 620 1022 1020 453 2171 1821 2899 1837 2608 7062 5140 4630 2064 1836 1804 5177 3837 1068 943 747 907 137 3000 465 69 278 174 97 382 298 53 199 93 18 89 75 242 408 464 1032 354 1738 389 1022 2881 1620 260 2051 546 722 569 90 913 182 445 605 163 4852 507 453 262 170 48 307 424 247 58 4394 5172 409 64 346 408 318 367 873 1032 11527 1595 696 4121 1534 479 1632 2501 7686 1055 1383 2488 5116 5866 3456 11651 3146 1056 2062 252 811 2135 546 916 2071 1134 397 237 561 95 506 127 435 1916 341 145 668 160 85 158 94 586 20 571 780 1089 311 2306 8669 25195 15288 7826 976 1538 3036 1129 272 481 5685 1505 3889 2638 906 2833 1383 967 572 458 914 773 891 4075 8191 8811 921 550 856 596 1180 254 992 7579 191 3584 1616 576 1234 1877 4880 1918 1231 1000 2206 84 73 884 95 712 537 1755 680 48062 1985 1096 1212 937 932 1218 274 2262 3394 2932 443 13519 576 1150 1762 2784 3052 1838 137 324 236 103 896 1493 188 256 379 1711 2908 1031 193 319 1787 32 615 843 282 104 832 986 711 283 520 1043 374 594 1175 1291 89476 2818 2262 13420 1453 7048 1479 1019 356 2025 1044 2973 753 125 2392 4004 222 362 419 327 186 314 226 266 503 662 1892 6392 1281 5489 2667 263 4233 522 369 199 682 1353 1470 1505 10217 131899 5353 28255 177502 3990 9196 14586 976 818 1384 2277 11565 2843 249 2561 1728 738 5854 1218 936 5442 1665 2945 491 2292 1726 384 1943 1666 282 1006 5470 2276 1860 5077 1376 2308 2986 2734 9890 3971 15139 647 724 7827 1642 1868 423 2430 3178 995 4260 1611 2788 4185 2882 877 2009 4663 1812 17862 13636 8091 4300 1551 859 1431 1413 482 5868 2672 1735 787 2973 1086 11358 2559 3376 9141 5016 87757 68150 82320 5003 3940 14233 17321 39992 55967 11173 2008 2124 21935 760 3840 40615 4191 5698 4603 11610 1579 6718 36719 5363 16460 9673 3149 12763 11395 3109 1324 2289 4908 2465 976 1328 2228 94 385 
132 3 1 0 0 0 6 1 0 6 152 267 676 314 628 252 255 146 235 515 1636 32184 5558 7355 37593 1459 793 476 778 1282 1594 2591 778 439 656 277 175 140 251 451 1675 211 1561 516 670 35 94 22 16 282 78 32 252 79 468 297 47 509 73 78 690 38 36 249 2738 112 151 309 133 92 466 43 108 718 43 359 1083 1447 428 224 87 59 566 23 1579 126 25 49 110 89 15 153 417 345 74 33 15 653 14 24 75 133 69 169 323 107 1627 222 310 4537 1007 4143 9816 248 257 396 1169 870 1019 381 882 1008 429 2206 149 595 764 83 277 171 1061 727 200 154 16 6602 329 145 317 962 558 164 892 432 40 233 237 53 688 133 1543 51682 764 222 1725 813 767 1295 7413 52303 2396 3868 11139 16721 23459 437 1757 361 957 59 361 229 195 614 1031 2981 3884 2162 363 1007 425 387 178 1544 6060 7005 3820 825 1213 1012 104 615 299 391 626 1236 1113 405 1578 646 622 297 463 362 3426 1452 296 492 2856 362 2608 790 616 1521 798 698 3052 1002 680 6059 461 414 222 1235 565 215 748 948 1197 469 563 802 581 132 382 191 37 252 86 340 372 2 8 0 0 0 1 18 12 10 131 55 150 1047 2731 351 109 831 166 218 418 527 5838 1211 1227 451 200 204 850 510 357 268 935 592 835 109 1379 207 270 1221 225 3231 1916 1004 172 1207 818 1261 346 48 1190 535 179 1034 118 755 726 819 383 1611 3069 1526 1854 444 780 370 361 129 359 91 92 167 137 208 170 698 427 285 41 457 229 7222 262 175 477 1943 406 3183 1271 481 23697 507 154 1468 513 271 383 665 562 932 846 979 821 664 236 454 404 698 283 79 478 522 250 235 3631 918 219 377 95 652 44 82 563 179 54 413 146 368 100 463 1441 407 3066 574 336 439 63 89 323 282 254 332 1182 346 905 7118 1451 173 44 369 147 173 766 511 4570 276 180 310 96 136 67 610 225 309 519 980 490 56 263 113 40 67 342 109 495 966 2220 142 924 410 226 50 43 1387 221 1348 316 174 41150 139269 2836 1430 1283 1873 23095 48834 119183 5769 4067 2610 1673 1580 99 121 2152 125 1507 579 500 1515 1416 7771 555 4300 13322 1502 542 645 4436 3790 4889 5713 2034 506 1931 1240 786 128 1937 3905 1270 1468 1308 2864 478 358 342 1269 777 9281 207 1267 985 307 
1809 946 2390 5013 121475 5193 4599 5166 3358 4790 3287 4257 1932 1002 3876 1395 375 2840 5012 1839 1156 4408 675 1710 3286 8687 6027 5844 1477 861 3990 8955 8261 16777 4152 1096 2974 1247 1023 1728 1166 779 608 6974 3706 4827 27271 2298 1809 933 470 3133 87 6463 907 261 282 250 469 202 144 452 589 573 4498 1743 2354 1224 852 5204 36242 2114 310 414 2114 1365 142 981 215 348 2159 111 315 310 1110 1619 911 102 776 988 533 533 232 80 313 233 313 354 657 920 5498 15877 953 3723 2547 539 2418 738 1796 267 1283 11297 857 1474 340 11479 10067 1473 763 2684 2079 755 1460 268 1484 2382 615 4436 1198 479 281 242 924 607 478 3481 1222 1099 1786 48351 14317 406 651 3860 1672 5628 2051 6211 12893 1024 383 394 262 421 70 407 749 437 676 436 861 1024 1710 6525 4102 638 788 3317 688 660 1226 1225 811 992 4113 1432 11115 2354 1906 3151 8 3 0 0 0 1 6 70 442 149 212 133 934 1983 308 864 873 2505 752 126 4610 888 4907 572 147 1616 253 973 654 181 521 185 295 134 488 1766 227 63 33 38 9 31 70 4 10 68 22 5 23 49 75 226 39 7 17 3 27 48 23 4 4 11 17 22 1 8 28 9 33 15 28 34 278 710 66 160 215 34 181 25 15 22 139 9 72 26 9 4 0 16 3 1 1 12 260 77 83 138 44 145 10 38 9 4 7 27 1 0 1 43 13 7 7 8 0 45 18 21 30 48 21 30 86 6 5 18 7 2 91 18 17 5 36 34 48 133 147 74 133 421 155 37 60 15 7 3 11 46 22 11 3 0 0 2 8 2 0 161 43 97 72 80 4 0 9 1 3 1 3 1 0 0 0 0 21 0 2 3 0 0 0 1 5 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 -coverage:6327.99377778 -Arabidopsis -2309 150 152 44 94 20 31 66 129 49 181 10 86 26 10 36 96 5 158 13 45 27 145 13 85 1 70 41 1 16 21 44 28 21 7 6 27 263 8 43 2 24 108 7 0 9 0 0 1 3 14 33 1 12 3 5 8 2 13 13 1 9 2 1 3 17 5 0 1 0 4 7 22 1 4 15 16 0 0 6 26 4 5 0 14 39 38 18 1 26 9 0 0 0 0 0 18 33 5 35 6 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 -coverage:43.1900826446 -gi|20197903:2706-4513 -918451 43069 4973 6069 5424 764 1308 1439 883 907 987 3034 389 406 952 935 228 1164 4117 891 3486 1385 2729 4818 1258 26713 4029 5575 4375 1242 1070 2107 920 1244 1091 1165 4373 1897 5508 17168 30987 
6744 39793 35181 2869 4645 4692 3044 1437 1272 3410 3227 3218 950 11595 1582 3975 4126 3534 2904 9622 9201 2662 5093 17776 53180 1503 5034 36896 3073 2696 12752 92843 89306 51420 20625 12112 19628 14536 7588 16552 7625 2887 5143 2395 77142 8914 1213 1504 2871 807 9425 1820 12549 1146 1756 873 702 4748 1983 28475 12593 4907 15539 18662 26723 5381 1232 6179 7188 7257 11050 8482 3815 5990 5082 1806 1922 2605 1940 1266 5733 1528 1833 4406 5121 2372 5536 3055 7605 63077 12644 78932 88354 15542 70445 7243 6242 120346 2540 1657 3245 25109 5755 1160 8889 5851 2503 876 7493 5714 9802 13634 8462 14457 8287 7986 2320 4129 8613 1888 5304 4607 2516 6019 15661 9337 2463 7209 1824 3285 2368 4304 947 36403 95330 40526 20022 54545 77764 3922 2515 3015 414 1370 14283 58088 11847 6695 24021 59631 6958 3539 4469 16242 340311 7244 1837 18429 8372 18021 5639 41746 21583 14255 9732 18318 11221 6535 10615 10301 40428 533599 326270 55341 36178 28527 8780 4316 27359 1402 2267 21704 3585 2449 2389 1205 6044 1632 2498 21387 25280 15320 4162 1764 3727 2635 19546 22097 8739 4664 21700 11278 21131 48044 2632 42293 5936 3669 21387 10312 18637 1858 25311 159741 5693 23447 3845 15343 7781 1209 18376 1883 2889 15421 5395 5221 589 16571 255673 5036 4649 4379 14806 6242 1153 6334 1207 2127 15500 269146 206619 25198 83043 13150 15591 7979 9163 13341 1153 2181 21654 3397 11882 2120 25839 34277 8235 17713 14707 33769 34611 23409 16045 46807 10245 7192 5440 2570 1530 629 5093 2209 1933 4632 13485 118398 3529 13894 12849 5579 3313 3197 12455 2575 1353 4839 1286 818 418 463 855 938 549 6614 4199 3176 3182 462 311 873 513 175 195 2569 689 217 3286 1004 486 365 683 978 2539 987 1931 14123 358 1065 201 1443 638 861 7076 735 494 607 1394 4512 5974 12877 3584 1718 2029 6966 1725 717 1255 2196 587 1166 3496 589 737 859 614 434 174 582 691 588 2404 1393 481 165 413 280 186 191 350 783 1657 971 1473 6521 258 1769 575 323 224 1775 321 167 3255 221 2023 11024 1286 569 4550 17400 11662 718 1234 4560 3160 642 257 2328 
529 894 1211 579 256 506 909 688 2805 882 12678 27229 9905 8194 690 1257 786 734 852 2316 1227 1305 203 1235 585 1289 6637 6275 7344 596 2993 1093 199 81 784 866 959 1940 527 2090 452 362 7523 6256 18337 9647 5141 8828 3798 17697 2009 2458 9177 2905 5062 4758 1977 2374 922 306 215 1332 239 332 783 875 5373 16505 153966 10369 17786 5145 3987 2840 388 2542 1062 2393 3988 10780 46495 35443 5441 2750 3089 7490 44543 4522 7389 30017 41341 6083 16256 11272 14499 17752 12640 4905 12457 10533 8046 11038 3131 1047 9235 2518 7924 2114 8155 786504 20595 4724 18877 16816 3257 20972 174536 10915 10591 53044 9521 3903 5021 2460 3040 4609 4420 5187 966 207182 10038 4869 7684 1525 3982 2569 2485 342 1094 2782 1929 8190 6125 3783 3835 3938 1472 2345 1122 3299 13563 7847 15191 53606 151932 10494 12925 6127 1369 14734 2286 1409 4612 2395 20399 21833 37032 17626 2744 15445 6995 5652 15687 23622 24690 300234 38628 20789 7096 26987 63959 6745 13800 4071 5326 10434 3218 2338 5241 24342 17104 31725 24079 54301 80045 16097 14430 19838 3836 1915 20476 5640 2057 19218 17512 9583 19429 14930 4053 2368 36692 28478 17960 12763 3211 15723 17455 4262 15836 5574 17075 2971 1549 11262 1816 2481 3031 1711 2245 3302 2239 5581 5436 898 3189 6402 7369 19431 10181 13982 19518 19378 6052 3397 7060 48792 49466 166394 16294 11481 7588 2631 9634 818 7222 8071 5098 50033 3363 2907 3316 2831 28201 23752 15257 6539 31273 20417 8330 18882 2784 7312 11264 5719 37305 11156 34369 28532 7521 2088 5106 136216 6760 3184 8826 4505 17420 89725 5786 9835 47563 42284 228449 23151 10905 9629 2291 852 539 21600 1595 1643 83308 3168 9230 1691 5252 3309 1515 5225 4626 1267 7645 10913 3289 11718 160149 96128 20051 4231 10627 21149 6156 9864 8341 10069 2123 20394 14350 9726 19497 27938 98863 14126 12365 11455 5934 8883 3699 2200 1856 2930 29028 20229 4265 13036 10997 123690 13292 23786 7293 26281 10459 4324 80443 74236 29597 4360 3106 7668 2936 50151 6032 8456 41215 30315 72582 22633 82098 56991 7444 11502 18815 3986 51306 
4799 3007 3601 2699 32496 8227 8523 51338 3731 23833 383982 16734 54704 181869 15780 44891 8843 61934 8722 3511 9541 2014 2082 9791 12879 1256 1769 16492 23018 25711 3425 5757 7748 6637 8538 2421 1180 2306 3558 2511 6676 15736 2895 16995 12150 784 15694 19837 2235 2291 6787 14289 13577 33423 7455 104407 25193 11741 76444 149786 13133 19339 38730 9696 10093 11742 2843 2973 16682 8778 4261 3432 9341 2088 3519 5195 2142 3650 23502 21304 29334 11102 24475 3829 8448 25057 29207 4072 4295 15963 7557 13441 16457 6903 7517 18114 2888 15355 2912 9314 10223 7355 6996 23929 34758 32336 23582 18784 13062 4052 11500 5164 4390 4450 43219 15862 13078 12019 32352 11400 10789 7759 44295 10190 3755 43157 4945 3789 27000 728401 15353 25752 37886 6521 5833 10411 4997 13530 17532 19474 11376 13583 5615 59799 19137 5037 2415 10195 20867 7197 43957 40619 11990 3397 65413 14393 17403 45882 12444 17080 25725 6268 53375 26086 21210 13030 129383 28084 5386 30859 1007498 36810 9120 149119 20793 14276 9005 28255 24819 10532 6806 1929 2209 3994 923 4758 1557 5077 62586 3615 4418 25161 37477 29847 26458 4883 1416 16824 23999 7771 24194 18853 15112 7284 9706 25453 5458 1093 20049 5547 1700 13748 5212 7528 10561 2127 30562 9086 10290 22396 13044 7444 39588 38983 13299 10989 29106 3213 2719 7463 12171 1211 5657 907 946 25627 3807 2467 8638 3158 2323 1169 8655 20054 1144 2165 1022 473 515 318 9968 1982 1785 1586 645 932 1326 18572 6003 23624 24494 5382 4548 1073 2357 145 748 93 132 194 310 543 519 435 90 4330 484 165 904 623 1328 564 238 536 221 273 205 600 900 308 221 1905 591 606 861 459 142 100 18 42 102 37 51 143 25 28 49 15 80 85 30 219 395 310 209 208 2609 58 17 91 62 113 104 170 238 117 203 99 25 65 33 650 499 93 524 459 207 420 1906 39597 754 479 1113 1080 101 56 540 249 224 131 465 759 185 233 72 27 138 32 13 211 60 50 402 134 122 149 95 32 86 45 34 117 55 57 138 80 13 328 510 195 680 1400 373 2025 336 525 103 352 946 3106 48146 65443 4484 25973 1591 6249 333 394 949 267 1063 365 1543 2689 
578 477 144 2523 847 129 3781 777 386 968 721 2034 314 9986 7600 6795 2312 2609 3265 3657 1206 1537 34719 81640 1937 1853 3224 4988 714 3826 2129 1135 1260 2243 2459 1314 1287 3252 1490 5798 1287 33839 828802 15071 6467 17694 11929 2470 5783 499 5132 4324 4576 4040 1232 2842 2115 1433 15255 2204 1353 4861 1205 444 2760 1524 838 8666 3804 902 55166 2046 981 760 1848 1086 590 13977 5962 3093 1474 4197 3879 1882 1310 1314 3970 1193 448 1349 1551 886 2579 855 2295 13815 6410 5875 1631 2855 2952 549 8320 6165 4995 9738 15798 9726 13766 3409 3604 1852 4391 4035 19978 1370 11897 15640 4216 4196 5271 98189 3141 6442 2689 1344 10728 1082 1077 9202 4433 4742 3403 2571 684 4671 4971 2838 4010 8424 12091 3648 2359 5308 6442 1811 1627 19424 12480 4202 2763 1678 1400 6800 7776 10122 9578 190337 91025 34402 23174 2379 8401 3013 1489 10760 1976 1679 3867 13143 2621 11394 3139 1164 4008 23586 6376 9367 8775 6496 5845 9468 6204 465 3811 43823 12209 3920 20046 8528 2284 1178 3011 1706 18792 25150 38254 9642 7318 9454 4337 5776 1202 7027 18078 11395 1937 29155 13898 14404 135641 161207 7066 4404 11155 8655 6772 18892 24799 128909 26431 30188 46143 3328 87384 25884 8823 8085 3989 4756 7137 3970 8207 14751 3275 1486 3042 5599 2671 4629 21374 10866 7013 34532 9214 2570 12047 5339 2723 5135 3375 1212 1891 2006 9614 2371 3466 30358 5952 3412 2603 3365 2028 5615 444 6723 21353 4983 25946 6977 8179 2315 24559 2797 6644 7684 13108 9082 26909 3560 15175 27961 3236 5753 15358 9662 43960 13939 28670 208831 16478 275147 37432 3074 4436 1782 536 352 1036 1415 2556 21366 5609 8805 32111 1025 830 1367 477 2793 3119 8611 10826 3384 28549 21014 6481 9057 11687 5277 9019 15543 10283 27900 7132 4644 16608 2018 7261 6962 979 1551 2580 1025 9650 6228 1202 1888 2288 2266 8281 11051 5152 776 6184 6588 1243 11157 2088 1143 1834 3611 10885 7167 16069 1712 2014 709 563 509 343 1480 626 1128 3365 329 5016 2783 345 220 1965 14235 4296 5956 2167 887 1004 456 74 810 994 254 825 255 394 125 31 151 35 868 519 2423 
435 80 919 675 18 1111 56 52 59 14 411 133 337 198 19 27 240 9 53 543 15 33 6 10 23 46 36 22 205 72 34 175 166 274 120 228 251 173 562 24 821 202 140 46 30 2102 39 16 40 22 24 0 172 191 512 370 1253 727 423 874 10347 3877 3532 3094 1517 4942 848 334 965 910 546 1048 774 276 104 112 559 997 136 190 61 66 85 20 35 6 489 2961 58 128 29 98 51 3 13 389 51 11 5 12 9 0 68 45 88 29 110 14 72 44 1 3 3 1 0 4 2 1 101 11 0 4 0 59 10 275 38 7 29 272 47 20 0 17 13 8 10 0 122 799 32 17 25 3 10 35 2 149 21 81 19 5 0 31 167 22 4 114 64 12 24 0 44 61 38 37 19 61 19 164 673 51 6 203 88 44 8 0 6 2 4 0 7 12 0 2 5 16 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 -coverage:14437.7997788
#!/usr/bin/env python
# -*- coding: utf-8 -*-
# Source: reactivity_cal/parse_dis_react.py (listed as a deleted file in this changeset).
import sys


def parse_dist(in_file):
    """Parse a name/row text file into names and their tab-separated values.

    The file is read line by line (each line is stripped first):

    * a line with a single tab-separated field is a record name, unless it
      contains the text ``coverage``, in which case it is ignored;
    * a line with two or more tab-separated fields is the data row of the
      most recently seen name;
    * blank lines are ignored.

    A name that is not followed by a data row is mapped to the string
    ``'null'``.

    NOTE: a data row holding exactly one value cannot be told apart from a
    name and is therefore treated as a name.

    Args:
        in_file: path of the text file to read.

    Returns:
        A two-element list ``[names, distribution]`` where ``names`` is the
        list of record names in file order and ``distribution`` maps each
        name to its list of stripped string fields, or to ``'null'``.

    Raises:
        ValueError: if a data row appears before any name line.
    """
    names = []
    distribution = {}
    current = None      # most recently seen name
    pending = False     # True while `current` has not received a data row

    # `with` guarantees the handle is closed even if parsing fails.
    with open(in_file) as handle:
        for raw in handle:
            line = raw.strip()
            if not line:
                # A blank line would otherwise be recorded as a name ''.
                continue

            fields = [field.strip() for field in line.split('\t')]

            if len(fields) == 1:
                if 'coverage' in fields[0]:
                    continue
                if pending:
                    # The previous name never got a data row.
                    distribution[current] = 'null'
                names.append(line)
                current = line
                pending = True
            else:
                if current is None:
                    raise ValueError(
                        "data row found before any name line in %s" % in_file)
                distribution[current] = fields
                pending = False

    # A trailing name without data gets the same marker as any other
    # data-less name instead of being left out of the mapping.
    if pending:
        distribution[current] = 'null'

    return [names, distribution]
--- a/reactivity_cal/rRNA.txt Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,8 +0,0 @@ ->25s rRNA 3375nts -GCGACCCCAGGTCAGGCGGGATTACCCGCTGAGTTTAAGCATATCAATAAGCGGAGGAAAAGAAACTAACAAGGATTCCCTTAGTAACGGCGAGCGAACCGGGAAGAGCCCAGCTTGAAAATCGGACGTCTTCGGCGTTCGAATTGTAGTCTGGAGAAGCGTCCTCAGCGACGGACCGGGCCTAAGTTCCCTGGAAAGGGGCGCCAGAGAGGGTGAGAGCCCGTCGTGCCCGGACCCTGTCGCACCACGAGGCGCTGTCTACGAGTCGGGTTGTTTGGGAATGCAGCCCCAATCGGGCGGTAAATTCCGTCCAAGGCTAAATACGGGCGAGAGACCGATAGCGAACAAGTACCGCGAGGTAAAGATGAAAAGGACTTTGAAAAGAGAGTCAAAGAGTGCTTGAAATTGTCGGGAGGGAAGCGGATGGGGGCCGGCGATGCGTCCTGGTCGGATGCGGAACGGAGCAATCCGGTCCGCCGATCGATTCGGGGCGTGGACCGACGCGGATTACGGTGGCGGCCTAAGCCCGGGCTTTTGATACGCTTGTGGAGACGTCGCTGCCGTGATCGTGGTCTGCAGCACGCGCCTAACGGCGTGCCTCGGCATCAGCGTGCTCCGGGCGTCGGCCTGTGGGCTCCCCATTCGACCCGTCTTGAAACACGGACCAAGGAGTCTGACATGTGTGCGAGTCAACGGGTGAGTAAACCCGTAAGGCGCAAGGAAGCTGATTGGCGGGATCCTCGCGGGTGCACCGCCGACCGACCTTGATCTTCTGAGAAGGGTTCGAGTGTGAGCATGCCTGTCGGGACCCGAAAGATGGTGAACTATGCCTGAGCGGGGTAAAGCCAGAGGAAACTCTGGTGGAAGCCCGCAGCGATACTGACGTGCAAATCGTTCGTCTGACTTGGGTATAGGGGCGAAAGACTAATCGAACCATCTAGTAGCTGGTTCCCTCCGAAGTTTCCCTCAGGATAGCTGGAGCTCGGACGCGAGTTCTATCGGGTAAAGCCAATGATTAGAGGCATTGGGGGCGCAACGCCTCGACCTATTCTCAAACTTTAAATAGGTAGGACGTGTCGGCTGCTTTGTTGAGCCGTCACACGGAATCGAGAGCTCCAAGTGGGCCATTTTTGGTAAGCAGAACTGGCGATGCGGGATGAACCGGAAGCCGGGTTACGGTGCCCAACTGCGCGCTAACCTAGAACCCACAAAGGGTGTTGGTCGATTAAGACAGCAGGACGGTGGTCATGGAAGTCGAAATCCGCTAAGGAGTGTGTAACAACTCACCTGCCGAATCAACTAGCCCCGAAAATGGATGGCGCTTAAGCGCGACCTATACCCGGCCGTCGGGGCAAGAGCCAGGCCTCGATGAGTAGGAGGGCGCGGCGGTCGCTGCAAAACCTAGGGCGCGAGGCGCGGAGCGGCCGTCGGTGCAGATCTTGGTGGTAGTAGCAAATATTCAAATGAGAACTTTGAAGGCCGAAGAGGGGAAAGGTTCCATGTGAACGGCACTTGCACATGGGTTAGTCGATCCTAAGAGTCGGGGGAAACCCGTCTGATAGCGCTTAAGCGAACTTCGAAAGGGGATCCGGTTAAAATTCCGGAACCGGGACGTGGCGGTTGACGGCAACGTTAGGGAGTCCGGAGACGTCGGCGGGGGCCTCGGGAAGAGTTATCTTTTCTGTTTAACAGCCTGCCCACCCTGGAAACGGCTCAGCCGGAGGTAGGGTCCAGCGGCTGGAAGAGCACCGCACGTCGCGTGGTGTCCGGTGCGCCCCCGGGCGCCCTTGAAAATCCGGAGGACCGAGTGCCGCTCACGCCCGGTCGTACTCATAACCGCATCAGGTCTCCAAGGTGA
ACAGCCTCTGGTCGATGGAACAATGTAGGCAAGGGAAGTCGGCAAAATGGATCCGTAACTTCGGGAAAAGGATTGGCTCTGAGGGCTGGGCTCGGGGGTCCCAGTTCCGAACCCGTCGGCTGTCAGCGGACTGCTCGAGCTGCTTCCGCGGCGAGAGCGGGTCGCCGGCTGCCGGCCGGGGGACGACTGGGAACGGCTCTCTCGGGAGCTTTCCCCGGGCGTCGAACAGTCAGCTCAGAACTGGTACGGACAAGGGGAATCCGACTGTTTAATTAAAACAAAGCATTGCGATGGTCCCTGCGGATGCTAACGCAATGTGATTTCTGCCCAGTGCTCTGAATGTCAAAGTGAAGAAATTCAACCAAGCGCGGGTAAACGGCGGGAGTAACTATGACTCTCTTAAGGTAGCCAAATGCCTCGTCATCTAATTAGTGACGCGCATGAATGGATTAACGAGATTCCCACTGTCCCTGTCTACTATCCAGCGAAACCACAGCCAAGGGAACGGGCTTGGCAGAATCAGCGGGGAAAGAAGACCCTGTTGAGCTTGACTCTAGTCCGACTTTGTGAAATGACTTGAGAGGTGTAGGATAAGTGGGAGCTTCGGCGCAAGTGAAATACCACTACTTTTAACGTTATTTTACTTACTCCGTGAATCGGAGGCCGGGGTACAACCCCTGTTTTTGGTCCCAAGGCTCGCTTCGGCGGGTCGATCCGGGCGGAGGACATTGTCAGGTGGGGAGTTTGGCTGGGGCGGCACATCTGTTAAAAGATAACGCAGGTGTCCTAAGATGAGCTCAACGAGAACAGAAATCTCGTGTGGAACAAAAGGGTAAAAGCTCGTTTGATTCTGATTTTCAGTACGAATACGAACCGTGAAAGCGTGGCCTATCGATCCTTTAGACTTCGGAATTTGAAGCTAGAGGTGTCAGAAAAGTTACCACAGGGATAACTGGCTTGTGGCAGCCAAGCGTTCATAGCGACGTTGCTTTTTGATCCTTCGATGTCGGCTCTTCCTATCATTGTGAAGCAGAATTCACCAAGTGTTGGATTGTTCACCCACCAATAGGGAACGTGAGCTGGGTTTAGACCGTCGTGAGACAGGTTAGTTTTACCCTACTGATGCCCGCGTCGCGATAGTAATTCAACCTAGTACGAGAGGAACCGTTGATTCGCACAATTGGTCATCGCGCTTGGTTGAAAAGCCAGTGGCGCGAAGCTACCGTGCGCTGGATTATGACTGAACGCCTCTAAGTCAGAATCCGGGCTAGAAGCGACGCATGCGCCCGCCGCCCGATTGCCGACCCTCAGTAGGAGCTTAGGCTCCAAAGGCACGTGTCGTTGGCTAAGTCCGTTCGGCGGAACGGTCGTTCGGACCGCCTTGAATTATAATTACCACCGAGCGGCGGGTAGAATCCTTTGCAGACGACTTAAATACGCGACGGGGTATTGTAAGTGGCAGAGTGGCCTTGCTGCCACGATCCACTGAGATTCAGCCCTTTGTCGCTAAGATTCGA ->gi|20197903:2706-4513 Arabidopsis thaliana chromosome 2 BAC F23H14 genomic sequence, complete sequence 
-TACCTGGTTGATCCTGCCAGTAGTCATATGCTTGTCTCAAAGATTAAGCCATGCATGTGTAAGTATGAACGAATTCAGACTGTGAAACTGCGAATGGCTCATTAAATCAGTTATAGTTTGTTTGATGGTAACTACTACTCGGATAACCGTAGTAATTCTAGAGCTAATACGTGCAACAAACCCCGACTTATGGAAGGGACGCATTTATTAGATAAAAGGTCGACGCGGGCTCTGCCCGTTGCTCTGATGATTCATGATAACTCGACGGATCGCATGGCCTCTGTGCTGGCGACGCATCATTCAAATTTCTGCCCTATCAACTTTCGATGGTAGGATAGTGGCCTACCATGGTGGTAACGGGTGACGGAGAATTAGGGTTCGATTCCGGAGAGGGAGCCTGAGAAACGGCTACCACATCCAAGGAAGGCAGCAGGCGCGCAAATTACCCAATCCTGACACGGGGAGGTAGTGACAATAAATAACAATACTGGGCTCTTTCGAGTCTGGTAATTGGAATGAGTACAATCTAAATCCCTTAACGAGGATCCATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTTAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGAACCTTGGGATGGGTCGGCCGGTCCGCCTTTGGTGTGCATTGGTCGGCTTGTCCCTTCGGTCGGCGATACGCTCCTGGTCTTAATTGGCCGGGTCGTGCCTCCGGCGCTGTTACTTTGAAGAAATTAGAGTGCTCAAAGCAAGCCTACGCTCTGGATACATTAGCATGGGATAACATCATAGGATTTCGATCCTATTGTGTTGGCCTTCGGGATCGGAGTAATGATTAACAGGGACAGTCGGGGGCATTCGTATTTCATAGTCAGAGGTGAAATTCTTGGATTTATGAAAGACGAACAACTGCGAAAGCATTTGCCAAGGATGTTTTCATTAATCAAGAACGAAAGTTGGGGGCTCGAAGACGATCAGATACCGTCCTAGTCTCAACCATAAACGATGCCGACCAGGGATCAGCGGATGTTGCTTATAGGACTCCGCTGGCACCTTATGAGAAATCAAAGTTTTTGGGTTCCGGGGGGAGTATGGTCGCAAGGCTGAAACTTAAAGGAATTGACGGAAGGGCACCACCAGGAGTGGAGCCTGCGGCTTAATTTGACTCAACACGGGGAAACTTACCAGGTCCAGACATAGTAAGGATTGACAGACTGAGAGCTCTTTCTTGATTCTATGGGTGGTGGTGCATGGCCGTTCTTAGTTGGTGGAGCGATTTGTCTGGTTAATTCCGTTAATGAACGAGACCTCAGCCTGCTAACTAGCTACGTGGAGGCATCCCTTCACGGCCGGCTTCTTAGAGGGACTATGGCCGTTTAGGCCAAGGAAGTTTGAGGCAATAACAGGTCTGTGATGCCCTTAGATGTTCTGGGCCGCACGCGCGCTACACTGATGTATTCAACGAGTTCACACCTTGGCCGACAGGCCCGGGTAATCTTTGAAATTTCATCGTGATGGGGATAGATCATTGCAATTGTTGGTCTTCAACGAGGAATTCCTAGTAAGCGCGAGTCATCAGCTCGCGTTGACTACGTCCCTGCCCTTTGTACACACCGCCCGTCGCTCCTACCGATTGAATGATCCGGTGAAGTGTTCGGATCGCGGCGACGTGGGTGGTTCGCCGCCCGCGACGTCGCGAGAAGTCCACTAAACCTTATCATTTAGAGGAAGGAGAAGTCGTAACAAGGTTTCCGTAGGTGAACCTGCGGAAGGATCATTG ->Arabidopsis thaliana 1 -GGATGCGATCATACCAGCACTAATGCACCGGATCCCATCAGAACTCCGCAGTTAAGCGTGCTTGGGCGAGAGTAGTACTAGGATGGGTGACCTCCTGGGAAGTCCTCGTGTTGCATCCCTC ->gi|186498419|ref|NR_022453.1| 
Arabidopsis thaliana (AT2G01020) rRNA -AAAACGACTCTCGGCAACGGATATCTCGGCTCTCGCATCGATGAAGAACGTAGCGAAATGCGATACTTGGTGTGAATTGCAGAATCCCGTGAACCATCGAGTCTTTGAACGCAAGTTGCGCCCCAAGCCTTCTGGCCGAGGGCACGTCTGCCTGGGTGTCACAA \ No newline at end of file
#!/usr/bin/env python
# -*- coding: utf-8 -*-
# Source: reactivity_cal/react_cal.py (listed as a deleted file in this changeset).
#
# Usage:
#   react_cal.py <plus_rtsc> <minus_rtsc> <reference_fasta> <nt_spec>
#                <normalize 0|1> <cap_threshold> <output_file>
#
# For every sequence in the reference FASTA the script log-transforms the
# counts of the (+) and (-) libraries, scales each library by its mean, takes
# the (+) minus (-) difference floored at 0, and writes one name line plus one
# tab-separated value line per transcript.  Positions whose nucleotide is not
# in <nt_spec> are written as 'NA'.
import sys
from Bio import SeqIO
import math
from parse_dis_react import *
from react_norm_function import *
import os
import random
import string


dist_file1 = sys.argv[1]        # plus library
dist_file2 = sys.argv[2]        # minus library
seq_file = sys.argv[3]          # reference library (genome/cDNA)
nt_spec = sys.argv[4]           # only show reactivity for these nucleotides (e.g. AC or ATCG)
flag_in = int(sys.argv[5])      # perform 2-8% normalization (1) or not (0)
threshold = float(sys.argv[6])  # threshold to cap the reactivities
output_file = sys.argv[7]

# parse_dist returns [names, {name: fields}]; only the mapping is needed here.
distri_p = parse_dist(dist_file1)[1]
distri_m = parse_dist(dist_file2)[1]

# Intermediate, un-normalized reactivities.  os.path.join is required:
# os.getcwd() has no trailing separator, so plain string concatenation would
# create the file next to (not inside) the working directory.
react_path = os.path.join(os.getcwd(), "react.txt")

nt_s = set(nt_spec)

trans = []          # sequence ids in FASTA order
transcripts = {}    # sequence id -> sequence string
with open(seq_file) as fasta:
    for seq in SeqIO.parse(fasta, 'fasta'):
        trans.append(seq.id)
        # str() works on every Biopython release; Seq.tostring() is deprecated.
        transcripts[seq.id] = str(seq.seq)

try:
    with open(react_path, 'w') as h:
        for name in trans:
            h.write(name)
            h.write('\n')

            # log(count + 1) for both libraries
            plus = [math.log(int(c) + 1, math.e) for c in distri_p[name]]
            minus = [math.log(int(c) + 1, math.e) for c in distri_m[name]]
            s_p = sum(plus)
            s_m = sum(minus)
            if s_p == 0 or s_m == 0:
                # One library has no counts at all: only the name is written.
                continue

            length = len(plus)
            r = []
            for j in range(length):
                f_p = plus[j] / float(s_p) * length
                f_m = minus[j] / float(s_m) * length
                r.append(max(0, f_p - f_m))

            # The value at index k is reported for nucleotide k-1, so r[0]
            # is never written and the row has len(r) - 1 columns.
            sequence = transcripts[name]
            cells = []
            for k in range(1, len(r)):
                if sequence[k - 1] in nt_s:
                    cells.append(str(r[k]))
                else:
                    cells.append('NA')

            # A row needs at least two columns: parse_dist reads any line
            # with a single field as a name, not as data.
            if len(cells) >= 2:
                h.write('\t'.join(cells))
                h.write('\n')

    if flag_in:
        react_norm(react_path, output_file, threshold)
    else:
        # No normalization requested: copy the raw values, stripping each line.
        with open(react_path) as f_i:
            with open(output_file, 'w') as h_o:
                for aline in f_i:
                    h_o.write(aline.strip())
                    h_o.write('\n')
finally:
    # Remove the intermediate file without going through a shell.
    if os.path.exists(react_path):
        os.remove(react_path)
#!/usr/bin/env python
# -*- coding: utf-8 -*-
# Source: reactivity_cal/react_norm_function.py (listed as a deleted file in this changeset).
import sys
from Bio import SeqIO
import math
from parse_dis_react import *


def cap(a, value):
    """Return ``a`` limited to at most ``value``.

    When ``a`` is greater than or equal to ``value`` the ``value`` object
    itself is returned, so its type decides how the capped number prints.
    """
    if a >= value:
        return value
    return a


def react_norm(react_file, result_file, capped_value):
    """Normalize a reactivity file and write the capped result.

    All non-'NA' values of ``react_file`` are sorted in descending order; the
    mean of the slice between the top 2% and the top 10% is the normalization
    factor.  Every value is divided by that factor and capped at
    ``capped_value``.  Records without data are written as a name line only.

    Args:
        react_file: path of the reactivity file (read with ``parse_dist``).
        result_file: path of the normalized output file.
        capped_value: upper bound applied to each normalized value.  A whole
            number is kept as an int, so capped entries print as e.g. ``7``;
            a fractional threshold is honoured instead of being truncated.

    Raises:
        ValueError: if there are too few values to form the 2%-10% window or
            the window averages to zero, so no normalization factor exists.
    """
    print("Normalizing.....")
    react = parse_dist(react_file)[1]

    threshold = float(capped_value)
    # Keep integral thresholds as int so capped output is formatted as before.
    if threshold == int(threshold):
        capped = int(threshold)
    else:
        capped = threshold

    all_react = []
    for t in react:
        if react[t] != 'null':
            for value in react[t]:
                if value != 'NA':
                    all_react.append(float(value))
    all_react.sort(reverse=True)

    eight = all_react[int(len(all_react) * 0.02):int(len(all_react) * 0.1)]
    # Validate before opening the output so a failure does not leave a
    # truncated result file behind.
    if not eight:
        raise ValueError(
            "cannot normalize %s: too few reactivity values (%d)"
            % (react_file, len(all_react)))
    meight = sum(eight) / len(eight)
    if meight == 0:
        raise ValueError(
            "cannot normalize %s: the 2%%-10%% window averages to zero"
            % react_file)

    with open(result_file, 'w') as h:
        for t in react:
            h.write(t)
            h.write('\n')
            if react[t] != 'null':
                cells = []
                for value in react[t]:
                    if value != 'NA':
                        cells.append(str(cap(float(value) / meight, capped)))
                    else:
                        cells.append('NA')
                h.write('\t'.join(cells))
                h.write('\n')
--- a/reactivity_cal/reactivity_calculation.xml Mon Nov 24 18:21:30 2014 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,60 +0,0 @@ -<tool id="react_cal_pipeline" name="Reactivity Calculation" version="1.0"> - <description></description> - <command interpreter="python">react_cal.py $dist_file1 $dist_file2 $seq_file $nt_spec $flag_in $threshold $output </command> - <requirements> - <requirement type="package" version="1.61">biopython</requirement> - <requirement type="package" version="1.7.1">numpy</requirement> - </requirements> - <inputs> - <param name="dist_file1" type="data" format="txt" label="RTSC file for (+) library"/> - <param name="dist_file2" type="data" format="txt" label="RTSC file for (-) library"/> - <param name="seq_file" type="data" format="fasta" label="Reference genome/transcriptome"/> - <param name="nt_spec" type="select" label="Nucleotide specificity"> - <option value="AC">AC</option> - <option value="ATCG">AUCG</option> - </param> - <param name="flag_in" type="boolean" checked="true" truevalue = "1" falsevalue = "0" label="Normalization is performed if checked"/> - <param name="threshold" type="float" value = "7" optional = "true" label="Threshold to cap the reactivities"/> - </inputs> - <outputs> - <data name="output" format="txt"/> - </outputs> - <tests> - <test> - <param name="dist_file1" value="dis_f_N1Ap_rrna.txt" /> - <param name="dist_file2" value="dis_f_N1Am_rrna.txt" /> - <param name="seq_file" value="rRNA.txt" /> - <param name="nt_spec" value="AC" /> - <param name="flag_in" value="1" /> - <param name="threshold" value="7" /> - <output name="output" file="DMS_reactivities.out" /> - - </test> - </tests> - - <help> - - -**TIPS**: - ------ - -**Input**: - -* 1. RTSC files (Output of Get RT Stop Counts) for (+) and (-) library -* 2. Reference file (fasta) used to map the reads to -* 3. Nucleotide Specificity (Type of nucleotides to have reactivity, e.g. AC for DMS and ACTG for SHAPE) -* [Optional]: -* 1. 
A threshold to cap the structural reactivities. {Default: 7} -* 2. Flag that determines whether to perform 2%-8% normalization {Default: Yes} - ------ - -**Output**: - -A text file with structural reactivity for each nucleotide (Reactivity file) - - - - </help> -</tool>
#!/usr/bin/env python
# -*- coding: utf-8 -*-
# Source: reactivity_cal/read_file.py (listed as a deleted file in this changeset).

import sys


def read_t_file(in_file):
    """Read a tab-separated text file into a list of rows.

    Each line is stripped of surrounding whitespace *before* it is split on
    tabs, so leading or trailing empty columns are dropped; every field is
    then stripped as well.  A blank line yields the row ``['']``.

    Args:
        in_file: path of the file to read.

    Returns:
        A list with one list of string fields per line, in file order.
    """
    # `with` closes the handle even if reading fails part-way through.
    with open(in_file) as handle:
        return [
            [field.strip() for field in line.strip().split('\t')]
            for line in handle
        ]