annotate cmpb2016/top10_CDR3_exact_pairing.py @ 9:f4edb9437b95 draft

Deleted selected files
author chmaramis
date Sun, 18 Mar 2018 07:06:56 -0400
parents 8be019b173e6
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
1 # -*- coding: utf-8 -*-
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
2 """
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
3 Created on Mon Apr 18 09:48:00 2016
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
4
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
5 @author: chmaramis
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
6 """
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
7
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
8 import pandas as pd
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
9 import numpy as np
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
10 import sys
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
11
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
12
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
def _find_gene_column(columns):
    """Return the first column name that ends with 'GENE' (case-insensitive).

    Raises:
        ValueError: if no column name ends with 'GENE'.
    """
    gene_col = next(
        (col for col in columns if str(col).upper().endswith('GENE')), None)
    if gene_col is None:
        raise ValueError("input table has no column ending in 'GENE'")
    return gene_col


def _pair_top_cdr3(clonotypes, top_n=10):
    """Tabulate, per gene, the reads and frequency of the top CDR3 junctions.

    The first ``top_n`` rows of ``clonotypes`` (fewer if the table is
    shorter) are the junctions of interest.  For each of them, every row of
    the whole table with exactly the same 'AA JUNCTION' value contributes its
    'Reads' and 'Frequency %' to the row of the gene it is paired with.

    Args:
        clonotypes: DataFrame with 'AA JUNCTION', 'Reads', 'Frequency %' and
            one column whose name ends with 'GENE'.
        top_n: maximum number of leading rows to use as junctions.

    Returns:
        DataFrame indexed by the sorted unique gene names, with two columns
        per junction: '<junction> Reads' and '<junction> Freq. %'.
    """
    gene_col = _find_gene_column(clonotypes.columns)

    # Work on plain arrays and address rows by position, so the result does
    # not depend on the table's index being exactly 1..N.
    junctions = np.asarray(clonotypes['AA JUNCTION'])
    genes = np.asarray(clonotypes[gene_col])
    reads = np.asarray(clonotypes['Reads'])
    freqs = np.asarray(clonotypes['Frequency %'])

    unique_genes = np.unique(genes)
    # Built once instead of searching unique_genes for every matching row.
    gene_row = dict((gene, row) for row, gene in enumerate(unique_genes))

    # Size the table from the rows actually available rather than a fixed 10.
    n_top = min(top_n, len(junctions))
    table = np.zeros((len(unique_genes), 2 * n_top))
    columns = []

    for i in range(n_top):
        junction = junctions[i]
        matches = np.flatnonzero(junctions == junction)

        # The first row carrying this junction is expected to be the top
        # clonotype itself; warn when it is paired with a different gene.
        if genes[matches[0]] != genes[i]:
            print('We have a problem here!')

        for pos in matches:
            row = gene_row[genes[pos]]
            table[row, 2 * i] += reads[pos]
            table[row, 2 * i + 1] += freqs[pos]

        columns.append('{} Reads'.format(junction))
        columns.append('{} Freq. %'.format(junction))

    return pd.DataFrame(table, columns=columns, index=unique_genes)


def main(argv=None):
    """Read a tab-separated clonotype table and write the pairing table.

    Args:
        argv: ``[input_path, output_path]``; defaults to ``sys.argv[1:]``.

    Returns:
        0 on success, 2 when the argument count is wrong.
    """
    args = sys.argv[1:] if argv is None else list(argv)
    if len(args) != 2:
        sys.stderr.write(
            'usage: top10_CDR3_exact_pairing.py <clonotypes.tsv> <output.tsv>\n')
        return 2

    clonos_fn, out_fn = args
    clonotypes = pd.read_csv(clonos_fn, sep='\t', index_col=0)
    _pair_top_cdr3(clonotypes).to_csv(out_fn, sep='\t')
    return 0


if __name__ == "__main__":
    sys.exit(main())
8be019b173e6 Uploaded included tools
chmaramis
parents:
diff changeset
56