Mercurial > repos > proteore > proteore_build_protein_interaction_maps
annotate build_protein_interaction_maps.py @ 5:ba96ca3496a2 draft default tip
"planemo upload commit c9a32e920aae2bc186183611bc0abb2040e106f3"
author | proteore |
---|---|
date | Thu, 06 Feb 2020 08:28:04 -0500 |
parents | 0a85d709c4ae |
children |
rev | line source |
---|---|
0
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
1 # -*- coding: utf-8 -*- |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
2 import csv, json, argparse, re |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
3 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
4 def get_args() : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
5 parser = argparse.ArgumentParser() |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
6 parser.add_argument("--species") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
7 parser.add_argument("--database", help="Humap, Bioplex or Biogrid", required=True) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
8 parser.add_argument("--dict_path", required=True) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
9 parser.add_argument("--input_type", help="type of input (list of id or filename)",required=True) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
10 parser.add_argument("--input", required=True) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
11 parser.add_argument("--header") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
12 parser.add_argument("--ncol") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
13 parser.add_argument("--id_type") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
14 parser.add_argument("--network_output") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
15 parser.add_argument("--nodes_output") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
16 args = parser.parse_args() |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
17 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
18 if args.input_type=="file" : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
19 args.ncol = nb_col_to_int(args.ncol) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
20 args.header = str2bool(args.header) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
21 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
22 return args |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
23 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
24 #Turn string into boolean |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
25 def str2bool(v): |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
26 if v.lower() in ('yes', 'true', 't', 'y', '1'): |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
27 return True |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
28 elif v.lower() in ('no', 'false', 'f', 'n', '0'): |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
29 return False |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
30 else: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
31 raise argparse.ArgumentTypeError('Boolean value expected.') |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
32 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
33 #return the column number in int format |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
34 def nb_col_to_int(nb_col): |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
35 try : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
36 nb_col = int(nb_col.replace("c", "")) - 1 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
37 return nb_col |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
38 except : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
39 sys.exit("Please specify the column where you would like to apply the filter with valid format") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
40 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
41 #return list of (unique) ids from string |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
42 def get_input_ids_from_string(input) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
43 ids_list = list(set(re.split(r'\s+',input.replace(";"," ").replace("\r","").replace("\n"," ").replace("\t"," ")))) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
44 if "" in ids_list : ids_list.remove("") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
45 #if "NA" in ids_list : ids_list.remove("NA") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
46 return ids_list |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
47 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
48 #return input_file and list of unique ids from input file path |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
49 def get_input_ids_from_file(input,nb_col,header) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
50 with open(input, "r") as csv_file : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
51 input_file= list(csv.reader(csv_file, delimiter='\t')) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
52 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
53 input_file, ids_list = one_id_one_line(input_file,nb_col,header) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
54 if "" in ids_list : ids_list.remove("") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
55 #if "NA" in ids_list : ids_list.remove("NA") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
56 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
57 return input_file, ids_list |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
58 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
59 #return input file by adding lines when there are more than one id per line |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
60 def one_id_one_line(input_file,nb_col,header) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
61 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
62 if header : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
63 new_file = [input_file[0]] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
64 input_file = input_file[1:] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
65 else : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
66 new_file=[] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
67 ids_list=[] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
68 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
69 for line in input_file : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
70 if line != [] and set(line) != {''}: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
71 line[nb_col] = re.sub(r"\s+","",line[nb_col]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
72 if ";" in line[nb_col] : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
73 ids = line[nb_col].split(";") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
74 for id in ids : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
75 new_file.append(line[:nb_col]+[id]+line[nb_col+1:]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
76 ids_list.append(id) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
77 else : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
78 new_file.append(line) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
79 ids_list.append(line[nb_col]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
80 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
81 ids_list= list(set(ids_list)) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
82 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
83 return new_file, ids_list |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
84 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
85 #replace all blank cells to NA |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
86 def blank_to_NA(csv_file) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
87 tmp=[] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
88 for line in csv_file : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
89 line = ["NA" if cell=="" or cell==" " or cell=="NaN" or cell=="-" else cell for cell in line] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
90 tmp.append(line) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
91 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
92 return tmp |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
93 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
94 def biogrid_output_files(ids,species) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
95 network_file=[["Entrez Gene Interactor A","Entrez Gene Interactor B","Gene symbol Interactor A","Gene symbol Interactor B","Experimental System","Experimental Type","Pubmed ID","Interaction Score","Phenotypes"]] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
96 ids_set= set(ids) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
97 ids_not_found=set([]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
98 for id in ids : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
99 if id in ppi_dict['network'] : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
100 network_file.extend(ppi_dict['network'][id]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
101 ids_set.update([interact[1] for interact in ppi_dict['network'][id]]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
102 else : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
103 ids_not_found.add(id) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
104 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
105 nodes_file = [["Entrez gene ID","Official Symbol Interactor","Present in user input ids","ID present in Biogrid "+species,"Pathway"]] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
106 for id in ids_set: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
107 #get pathway |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
108 if id in ppi_dict['nodes']: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
109 description_pathway=";".join(ppi_dict['nodes'][id]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
110 else : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
111 description_pathway="NA" |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
112 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
113 #get gene name |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
114 if id in ppi_dict['network']: gene_name = ppi_dict['network'][id][0][2] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
115 else : gene_name="NA" |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
116 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
117 #make line |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
118 nodes_file.append([id]+[gene_name]+[id in ids]+[id not in ids_not_found]+[description_pathway]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
119 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
120 return network_file,nodes_file |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
121 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
122 def bioplex_output_files(ids,id_type,species) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
123 network_file=[[id_type+" Interactor A",id_type+" Interactor B","Gene symbol Interactor A","Gene symbol Interactor B","Interaction Score"]] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
124 ids_set= set(ids) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
125 ids_not_found=set([]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
126 for id in ids : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
127 if id in ppi_dict['network'][id_type] : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
128 network_file.extend(ppi_dict['network'][id_type][id]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
129 ids_set.update([interact[1] for interact in ppi_dict['network'][id_type][id]]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
130 else : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
131 ids_not_found.add(id) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
132 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
133 if id_type=="UniProt-AC" : nodes_file=[[id_type,"Present in user input ids","ID present in Human Bioplex","Pathway"]] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
134 else: nodes_file=[[id_type,"Official symbol Interactor","Present in user input ids","Present in interactome","Pathway"]] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
135 for id in ids_set: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
136 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
137 if id in ppi_dict['nodes'][id_type]: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
138 description_pathway=";".join(ppi_dict['nodes'][id_type][id]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
139 else : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
140 description_pathway="NA" |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
141 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
142 #make line |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
143 if id_type=="UniProt-AC": |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
144 nodes_file.append([id]+[id in ids]+[id not in ids_not_found]+[description_pathway]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
145 elif id_type=="GeneID": |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
146 #get gene_name |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
147 if id in ppi_dict['network'][id_type]: gene_name = ppi_dict['network'][id_type][id][0][2] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
148 else : gene_name="NA" |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
149 nodes_file.append([id]+[gene_name]+[id in ids]+[id not in ids_not_found]+[description_pathway]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
150 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
151 return network_file,nodes_file |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
152 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
153 def humap_output_files(ids,species) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
154 network_file=[["Entrez Gene Interactor A","Entrez Gene Interactor B","Gene symbol Interactor A","Gene symbol Interactor B","Interaction Score"]] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
155 ids_set= set(ids) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
156 ids_not_found=set([]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
157 for id in ids : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
158 if id in ppi_dict['network'] : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
159 network_file.extend(ppi_dict['network'][id]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
160 ids_set.update([interact[1] for interact in ppi_dict['network'][id]]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
161 else : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
162 ids_not_found.add(id) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
163 |
1
0a85d709c4ae
planemo upload commit 567ba7934c0ca55529dfeb5e7ca0935ace260ad7-dirty
proteore
parents:
0
diff
changeset
|
164 nodes_file = [["Entrez gene ID","Official Symbol Interactor","Present in user input ids","ID present in Hu.MAP","Protein name","Pathway"]] |
0
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
165 for id in ids_set: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
166 if id in ppi_dict['nodes']: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
167 description_pathway=";".join(ppi_dict['nodes'][id]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
168 else : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
169 description_pathway="NA" |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
170 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
171 #get gene name |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
172 if id in ppi_dict['gene_name']: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
173 gene_name = ppi_dict['gene_name'][id] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
174 else : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
175 gene_name = "NA" |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
176 |
1
0a85d709c4ae
planemo upload commit 567ba7934c0ca55529dfeb5e7ca0935ace260ad7-dirty
proteore
parents:
0
diff
changeset
|
177 #get protein name |
0a85d709c4ae
planemo upload commit 567ba7934c0ca55529dfeb5e7ca0935ace260ad7-dirty
proteore
parents:
0
diff
changeset
|
178 if id in ppi_dict['protein_name']: |
0a85d709c4ae
planemo upload commit 567ba7934c0ca55529dfeb5e7ca0935ace260ad7-dirty
proteore
parents:
0
diff
changeset
|
179 protein_name = ppi_dict['protein_name'][id] |
0a85d709c4ae
planemo upload commit 567ba7934c0ca55529dfeb5e7ca0935ace260ad7-dirty
proteore
parents:
0
diff
changeset
|
180 else : |
0a85d709c4ae
planemo upload commit 567ba7934c0ca55529dfeb5e7ca0935ace260ad7-dirty
proteore
parents:
0
diff
changeset
|
181 protein_name = "NA" |
0a85d709c4ae
planemo upload commit 567ba7934c0ca55529dfeb5e7ca0935ace260ad7-dirty
proteore
parents:
0
diff
changeset
|
182 |
0
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
183 #make line |
1
0a85d709c4ae
planemo upload commit 567ba7934c0ca55529dfeb5e7ca0935ace260ad7-dirty
proteore
parents:
0
diff
changeset
|
184 nodes_file.append([id]+[gene_name]+[id in ids]+[id not in ids_not_found]+[protein_name]+[description_pathway]) |
0
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
185 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
186 return network_file,nodes_file |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
187 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
188 #function to sort the csv_file by value in a specific column |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
189 def sort_by_column(tab,sort_col,reverse,header): |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
190 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
191 if len(tab) > 1 : #if there's more than just a header or 1 row |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
192 if header : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
193 head=tab[0] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
194 tab=tab[1:] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
195 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
196 #list of empty cells in the column to sort |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
197 unsortable_lines = [i for i,line in enumerate(tab) if (line[sort_col]=='' or line[sort_col] == 'NA')] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
198 unsorted_tab=[ tab[i] for i in unsortable_lines] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
199 tab= [line for i,line in enumerate(tab) if i not in unsortable_lines] |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
200 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
201 if only_number(tab,sort_col) and any_float(tab,sort_col) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
202 tab = sorted(tab, key=lambda row: float(row[sort_col]), reverse=reverse) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
203 elif only_number(tab,sort_col): |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
204 tab = sorted(tab, key=lambda row: int(row[sort_col]), reverse=reverse) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
205 else : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
206 tab = sorted(tab, key=lambda row: row[sort_col], reverse=reverse) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
207 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
208 tab.extend(unsorted_tab) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
209 if header is True : tab = [head]+tab |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
210 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
211 return tab |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
212 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
213 def only_number(tab,col) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
214 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
215 for line in tab : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
216 if not (is_number("float",line[col].replace(",",".")) or is_number("int",line[col].replace(",","."))) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
217 return False |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
218 return True |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
219 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
220 #Check if a variable is a float or an integer |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
221 def is_number(number_format, n): |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
222 float_format = re.compile(r"^[-]?[0-9][0-9]*.?[0-9]+$") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
223 int_format = re.compile(r"^[-]?[0-9][0-9]*$") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
224 test = "" |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
225 if number_format == "int": |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
226 test = re.match(int_format, n) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
227 elif number_format == "float": |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
228 test = re.match(float_format, n) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
229 if test: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
230 return True |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
231 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
232 #return True is there is at least one float in the column |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
233 def any_float(tab,col) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
234 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
235 for line in tab : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
236 if is_number("float",line[col].replace(",",".")) : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
237 return True |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
238 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
239 return False |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
240 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
241 def main() : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
242 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
243 #Get args from command line |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
244 global args |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
245 args = get_args() |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
246 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
247 #get PPI dictionary |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
248 with open(args.dict_path, 'r') as handle: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
249 global ppi_dict |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
250 ppi_dict = json.load(handle) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
251 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
252 #Get file and/or ids from input |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
253 if args.input_type == "text" : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
254 ids = get_input_ids_from_string(args.input) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
255 elif args.input_type == "file" : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
256 input_file, ids = get_input_ids_from_file(args.input,args.ncol,args.header) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
257 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
258 #create output files |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
259 if args.database=="biogrid": |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
260 network_file, nodes_file = biogrid_output_files(ids,args.species) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
261 elif args.database=="bioplex": |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
262 network_file, nodes_file = bioplex_output_files(ids,args.id_type,args.species) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
263 elif args.database=="humap": |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
264 network_file, nodes_file = humap_output_files(ids,args.species) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
265 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
266 #convert blank to NA and sort files |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
267 network_file = blank_to_NA(network_file) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
268 network_file = sort_by_column(network_file,0,False,True) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
269 nodes_file = sort_by_column(nodes_file,0,False,True) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
270 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
271 #write output files |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
272 with open(args.network_output,"w") as output : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
273 writer = csv.writer(output,delimiter="\t") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
274 writer.writerows(network_file) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
275 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
276 with open(args.nodes_output,"w") as output : |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
277 writer = csv.writer(output,delimiter="\t") |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
278 for row in nodes_file: |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
279 writer.writerow([unicode(s).encode("utf-8") for s in row]) |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
280 |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
281 if __name__ == "__main__": |
b0ac71686b99
planemo upload commit 968cd5b4f78f0a1da86fc3bc29f8159f86e199aa-dirty
proteore
parents:
diff
changeset
|
282 main() |