Mercurial > repos > abims-sbr > pairwise
annotate scripts/S03_run_second_blast.py @ 0:90b57ab0bd1d draft default tip
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
| author | abims-sbr | 
|---|---|
| date | Fri, 01 Feb 2019 10:23:16 -0500 | 
| parents | |
| children | 
| rev | line source | 
|---|---|
| 0 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 1 #!/usr/bin/env python | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 2 # coding: utf-8 | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 3 # Author : Victor Mataigne | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 4 | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 5 import itertools, argparse, os | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 6 | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 7 def main(): | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 8 parser = argparse.ArgumentParser() | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 9 parser.add_argument('query_file', help='fasta file (to translate) for query') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 10 parser.add_argument('db_file', help='fasta files (already translated) for db') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 11 parser.add_argument('file_subname', help='keyword for output file name') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 12 parser.add_argument('evalue', help='evalue for blast') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 13 parser.add_argument('method', choices=['tblastx', 'diamond'], help='alignment tool (tblastx or diamond)') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 14 args = parser.parse_args() | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 15 | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 16 if args.method == 'diamond': | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 17 from Bio.Seq import Seq | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 18 from Bio.Alphabet import IUPAC | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 19 # Traduire les best hits | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 20 f_name = 'translated_{}'.format(args.query_file) | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 21 translated_file = open(f_name, 'w') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 22 with open(args.query_file, 'r') as file: | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 23 for name, seq in itertools.izip_longest(*[file]*2): | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 24 s = Seq(seq.strip('\n').upper(), IUPAC.ambiguous_dna) | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 25 translated_file.write(name.strip('\n')+'_orf_1\n') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 26 translated_file.write(s.translate()._data+'\n') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 27 translated_file.write(name.strip('\n')+'_orf_2\n') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 28 translated_file.write(s[1:].translate()._data+'\n') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 29 translated_file.write(name.strip('\n')+'_orf_3\n') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 30 translated_file.write(s[2:].translate()._data+'\n') | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 31 translated_file.close() | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 32 | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 33 os.system('diamond makedb --in %s -d %s >> log_diamond.log' %(args.db_file, args.db_file.split('_')[1])) | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 34 os.system('diamond blastp -q %s -d %s --max-target-seqs 1 -o matches_blast2_%s -e %s --more-sensitive >> log_diamond.log' %(f_name, args.db_file.split('_')[1], args.file_subname, args.evalue)) | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 35 | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 36 elif args.method == 'tblastx': | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 37 os.system('formatdb -i %s -p F -o T >> log_tblastx.log' %(args.db_file)) | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 38 os.system('blastall -p tblastx -d %s -i %s -o matches_blast2_%s -T F -e %s -F "mS" -b1 -v1 -K 1 -m 8 >> log_tblastx.log' %(args.db_file, args.query_file, args.file_subname, args.evalue)) | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 39 | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 40 else : | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 41 print 'Mispecified alignment tool' | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 42 exit() | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 43 | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 44 if __name__ == "__main__": | 
| 
90b57ab0bd1d
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
 abims-sbr parents: diff
changeset | 45 main() | 
