annotate run_flock/runFlockMFI.py @ 0:c1e924e37080 draft

Uploaded
author immport-devteam
date Mon, 27 Feb 2017 13:06:23 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
1 #!/usr/bin/env python
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
2 ######################################################################
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
3 # Copyright (c) 2016 Northrop Grumman.
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
4 # All rights reserved.
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
5 ######################################################################
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
6 # version 2
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
7 from __future__ import print_function
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
8
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
9 import sys
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
10 import os
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
11 from argparse import ArgumentParser
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
12 import pandas as pd
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
13 from scipy.stats import gmean
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
14
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
15
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
16 def run_FLOCK(input_file, method, bins, density, output_file, mfi_file,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
17 mfi_calc, profile, tool_directory):
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
18 run_command = tool_directory + "/bin/" + method + " " + input_file
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
19 if bins:
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
20 run_command += " " + bins
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
21 if density:
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
22 run_command += " " + density
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
23
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
24 os.system(run_command)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
25
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
26 move_command = "mv flock_results.txt " + output_file
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
27 os.system(move_command)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
28
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
29 # Here add some way to calculate the count and tack it on to profile file.
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
30 flockdf = pd.read_table(output_file)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
31 if mfi_calc == "mfi":
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
32 MFIs = flockdf.groupby('Population').mean().round(decimals=2)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
33 elif mfi_calc == "gmfi":
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
34 MFIs = flockdf.groupby('Population').agg(lambda x: gmean(list(x))).round(decimals=2)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
35 else:
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
36 MFIs = flockdf.groupby('Population').median().round(decimals=2)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
37
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
38 with open(mfi_file, "w") as outf:
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
39 MFIs.to_csv(outf, sep="\t", float_format='%.0f')
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
40
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
41 (events, columns) = flockdf.shape
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
42 fstats = {}
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
43 fstats['population'] = flockdf.iloc[:, -1:].iloc[:, 0]
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
44 fstats['population_freq'] = fstats['population'].value_counts()
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
45 fstats['population_freq_sort'] = fstats['population_freq'].sort_index()
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
46 fstats['population_per'] = (fstats['population'].value_counts(normalize=True) * 100).round(decimals=2)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
47 fstats['population_per_sort'] = fstats['population_per'].sort_index()
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
48 fstats['population_all'] = pd.concat([fstats['population_freq_sort'], fstats['population_per_sort']], axis=1)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
49 fstats['population_all'].columns = ['Count', 'Percentage']
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
50 fstats['population_all']['Population_ID'] = fstats['population_all'].index
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
51
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
52 flock_profile = pd.read_table('profile.txt')
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
53 profile_pop = flock_profile.merge(fstats['population_all'], on='Population_ID')
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
54 profile_pop.to_csv(profile, sep="\t", float_format='%.2f', index=False)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
55
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
56 # get_profile = "mv profile.txt " + profile
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
57 # os.system(get_profile)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
58 return
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
59
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
60
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
61 if __name__ == "__main__":
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
62 parser = ArgumentParser(
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
63 prog="runFlockMFI",
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
64 description="Run Flock on text file and generate centroid file")
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
65
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
66 parser.add_argument(
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
67 '-i',
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
68 dest="input_file",
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
69 required=True,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
70 help="File location for the FCS file.")
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
71
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
72 parser.add_argument(
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
73 '-m',
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
74 dest="method",
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
75 required=True,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
76 help="Run flock1 or flock2.")
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
77
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
78 parser.add_argument(
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
79 '-M',
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
80 dest="mfi_calc",
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
81 required=True,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
82 help="what to calculate for centroids.")
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
83
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
84 parser.add_argument(
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
85 '-b',
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
86 dest="bins",
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
87 required=False,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
88 help="Number of Bins.")
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
89
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
90 parser.add_argument(
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
91 '-d',
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
92 dest="density",
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
93 required=False,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
94 help="Density.")
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
95
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
96 parser.add_argument(
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
97 '-o',
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
98 dest="output_file",
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
99 required=True,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
100 help="File location for the output file.")
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
101
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
102 parser.add_argument(
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
103 '-t',
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
104 dest="tool_directory",
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
105 required=True,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
106 help="File location for the output file.")
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
107
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
108 parser.add_argument(
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
109 '-c',
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
110 dest="centroids",
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
111 required=True,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
112 help="File location for the output centroid file.")
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
113
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
114 parser.add_argument(
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
115 '-p',
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
116 dest="profile",
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
117 required=True,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
118 help="File location for the output profile file.")
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
119
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
120 args = parser.parse_args()
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
121 run_FLOCK(args.input_file, args.method, args.bins,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
122 args.density, args.output_file, args.centroids, args.mfi_calc,
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
123 args.profile, args.tool_directory)
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
124
c1e924e37080 Uploaded
immport-devteam
parents:
diff changeset
125 sys.exit(0)