# HG changeset patch # User xuebing # Date 1331928679 14400 # Node ID 5a93fe53194d500247b5f683173ee7e42ff87c58 # Parent 7b8a5b55ee1535568e6020a86c921a5fa11ec612 Uploaded diff -r 7b8a5b55ee15 -r 5a93fe53194d mytools/match.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/mytools/match.xml Fri Mar 16 16:11:19 2012 -0400 @@ -0,0 +1,54 @@ + + find short motif occurrences + match $motif $seq $output $nmismatch $rc $bed > $log + + + + + + + + + + + + + + +**What it does** + +This tool searches for occurrences of short nucleotide sequences (allowing mismatches) in a set of longer sequences. + +Example motif file:: + + >motif1 + CAGGTAAGT + >motif2 + GTTTGGGGGCC + +Example sequence file:: + + >hg18_chr6_122208322_122209078_+ + CGTCGTAGCTACTAGCTACGTACGTACGTAGCTAGCATGCATGCTACGTA + CGTAGCTAGCTAAAAAAAAAAAAAAACTGCGGCTAGCTAGCTAGCTACGT + CGATCGTAGCTAC... + >hg18_chr6_1208322_122209023_+ + CGATGCTAGCTAGCTAGCTACGTAGCTAGCTAGTCGATGCTAGCTAGCTA + ATGCTAGCTAGC.... + +Output (bed):: + + chr11 72790893 72790902 ACTTAACTG 1 - antisense 5ss,G4T:CAGTTAAGT-rc hg18_chr11_72790846_72791902_+ 47 + chr11 72791880 72791889 CAGGTAAGA 1 + sense 5ss,T9A:CAGGTAAGA hg18_chr11_72790846_72791902_+ 1034 + + +Output (tab):: + + Tmod4 802 5ss:CAGGTAAGT-rc ACTTACCTG + Atp7b 77 5ss:CAGGTAAGT CAGGTAAGT + Fnta 665 5ss:CAGGTAAGT CAGGTAAGT + + + + +