# HG changeset patch # User xuebing # Date 1331920756 14400 # Node ID 7cc64021dc90907ef918d03e6434b429a34d81e6 # Parent 8e101f0cac2ff81d6d4533094b76daaa16f861ed Uploaded diff -r 8e101f0cac2f -r 7cc64021dc90 mytools/match.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/mytools/match.xml Fri Mar 16 13:59:16 2012 -0400 @@ -0,0 +1,56 @@ + + find short motif occurrences + ./match $motif $seq $output $nmismatch $rc $bed > $log + + + + + + + + + + + + + + +**What it does** + +This tool searches for occurrences of short nucleotide sequences (allowing mismatches) in a set of longer sequences. + +Example motif file:: + + >motif1 + CAGGTAAGT + >motif2 + GTTTGGGGGCC + +Example sequence file:: + + >hg18_chr6_122208322_122209078_+ + CGTCGTAGCTACTAGCTACGTACGTACGTAGCTAGCATGCATGCTACGTA + CGTAGCTAGCTAAAAAAAAAAAAAAACTGCGGCTAGCTAGCTAGCTACGT + CGATCGTAGCTAC... + >hg18_chr6_1208322_122209023_+ + CGATGCTAGCTAGCTAGCTACGTAGCTAGCTAGTCGATGCTAGCTAGCTA + ATGCTAGCTAGC.... + +Output (bed):: + + chr11 72790893 72790902 ACTTAACTG 1 - antisense 5ss,G4T:CAGTTAAGT-rc hg18_chr11_727 +90846_72791902_+ 47 + chr11 72791880 72791889 CAGGTAAGA 1 + sense 5ss,T9A:CAGGTAAGA hg18_chr11_72790846_72 +791902_+ 1034 + + +Output (tab):: + + Tmod4 802 5ss:CAGGTAAGT-rc ACTTACCTG + Atp7b 77 5ss:CAGGTAAGT CAGGTAAGT + Fnta 665 5ss:CAGGTAAGT CAGGTAAGT + + + + +