annotate pandas_pivot_table.py @ 4:eaf2444a2a50 draft default tip

"planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
author jjohnson
date Fri, 18 Dec 2020 19:35:57 +0000
parents 4b65133e0722
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
1 #!/usr/bin/env python
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
2
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
3 import argparse
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
4 import json
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
5 import pandas as pd
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
6 import sys
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
7 from json.decoder import JSONDecodeError
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
8
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
9
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
10 def __main__():
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
11 p = argparse.ArgumentParser()
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
12 p.add_argument(
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
13 '-i', '--input',
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
14 type=argparse.FileType('r'),
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
15 required=True,
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
16 help='Tabular input file to pivot'
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
17 )
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
18 p.add_argument(
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
19 '-o', '--output',
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
20 type=argparse.FileType('w'),
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
21 required=True,
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
22 help='Output file'
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
23 )
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
24 p.add_argument(
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
25 '-S', '--skiprows',
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
26 type=int,
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
27 default=0,
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
28 help='Input column names'
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
29 )
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
30 p.add_argument(
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
31 '-H', '--header',
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
32 default=None,
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
33 help='Input column names'
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
34 )
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
35 p.add_argument(
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
36 '-P', '--prefix',
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
37 default=None,
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
38 help='Prefix for input column names'
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
39 )
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
40 p.add_argument(
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
41 '-I', '--index',
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
42 help='index columns'
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
43 )
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
44 p.add_argument(
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
45 '-C', '--columns',
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
46 help='columns values which are returned as columns'
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
47 )
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
48 p.add_argument(
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
49 '-V', '--values',
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
50 help='values'
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
51 )
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
52 p.add_argument(
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
53 '-F', '--aggfunc',
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
54 help='aggregate functions on the values'
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
55 )
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
56 p.add_argument(
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
57 '-N', '--fill_value',
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
58 default=None,
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
59 help='fill value for missing values'
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
60 )
2
6f05390deffa "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 1ca7433aaa606c636f796c75b6cfd8a080e2d5bc-dirty"
jjohnson
parents: 1
diff changeset
61 p.add_argument(
6f05390deffa "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 1ca7433aaa606c636f796c75b6cfd8a080e2d5bc-dirty"
jjohnson
parents: 1
diff changeset
62 '-f', '--float_format',
6f05390deffa "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 1ca7433aaa606c636f796c75b6cfd8a080e2d5bc-dirty"
jjohnson
parents: 1
diff changeset
63 default='%0.6f',
6f05390deffa "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 1ca7433aaa606c636f796c75b6cfd8a080e2d5bc-dirty"
jjohnson
parents: 1
diff changeset
64 help=''
6f05390deffa "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 1ca7433aaa606c636f796c75b6cfd8a080e2d5bc-dirty"
jjohnson
parents: 1
diff changeset
65 )
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
66 args = p.parse_args()
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
67
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
68 def getValueType(val):
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
69 if val or 0. == val:
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
70 try:
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
71 return int(val)
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
72 except ValueError:
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
73 try:
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
74 return float(val)
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
75 except ValueError:
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
76 return val
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
77 return None
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
78
4
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
79 def getColumn(name, dfcols, value_cols=None):
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
80 dfname = None
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
81 if name in dfcols:
4
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
82 dfname = name
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
83 else:
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
84 try:
4
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
85 i = int(name) - 1
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
86 dfname = dfcols[i]
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
87 except IndexError:
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
88 sys.exit('%s not an index into %s' % (name, dfcols))
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
89 except ValueError:
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
90 sys.exit('%s not a column in %s' % (name, dfcols))
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
91 if value_cols and dfname not in value_cols:
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
92 sys.exit('%s not a value column in %s' % (name, value_cols))
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
93 return dfname
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
94
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
95 def getColumns(val, dfcols):
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
96 fields = [v.strip() for v in val.split(',')]
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
97 cols = []
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
98 for name in fields:
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
99 cols.append(getColumn(name, dfcols))
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
100 return cols
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
101
4
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
102 def getAggFunc(funcStr, dfcols, value_cols):
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
103 af = funcStr
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
104 try:
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
105 af = json.loads(funcStr)
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
106 except JSONDecodeError as de:
4
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
107 sys.exit('"%s" is not a json string: %s' % (funcStr, de.msg))
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
108 if isinstance(af, dict):
4
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
109 aggfunc = {getColumn(k, dfcols, value_cols): v
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
110 for k, v in af.items()}
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
111 elif isinstance(af, list):
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
112 aggfunc = af
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
113 else:
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
114 aggfunc = af
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
115 return aggfunc
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
116
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
117 if args.prefix:
1
c02f59711eb6 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit af9d36fa3efb1cf136a69e7ed1a5f06261f9b0d6-dirty"
jjohnson
parents: 0
diff changeset
118 df = pd.read_table(args.input,
c02f59711eb6 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit af9d36fa3efb1cf136a69e7ed1a5f06261f9b0d6-dirty"
jjohnson
parents: 0
diff changeset
119 skiprows=args.skiprows,
c02f59711eb6 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit af9d36fa3efb1cf136a69e7ed1a5f06261f9b0d6-dirty"
jjohnson
parents: 0
diff changeset
120 header=None,
c02f59711eb6 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit af9d36fa3efb1cf136a69e7ed1a5f06261f9b0d6-dirty"
jjohnson
parents: 0
diff changeset
121 prefix=args.prefix)
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
122 elif args.header:
1
c02f59711eb6 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit af9d36fa3efb1cf136a69e7ed1a5f06261f9b0d6-dirty"
jjohnson
parents: 0
diff changeset
123 df = pd.read_table(args.input,
c02f59711eb6 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit af9d36fa3efb1cf136a69e7ed1a5f06261f9b0d6-dirty"
jjohnson
parents: 0
diff changeset
124 skiprows=args.skiprows,
c02f59711eb6 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit af9d36fa3efb1cf136a69e7ed1a5f06261f9b0d6-dirty"
jjohnson
parents: 0
diff changeset
125 header=args.header)
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
126 else:
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
127 df = pd.read_table(args.input, skiprows=args.skiprows)
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
128 df_columns = df.columns.tolist()
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
129 index = getColumns(args.index, df_columns)
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
130 columns = getColumns(args.columns, df_columns)
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
131 values = getColumns(args.values, df_columns)
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
132 fill_value = getValueType(args.fill_value)
4
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
133 aggfunc = getAggFunc(args.aggfunc.replace('\'', '"'), df_columns, values)
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
134 pdf = df.pivot_table(index=index, columns=columns,
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
135 values=values, aggfunc=aggfunc,
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
136 fill_value=fill_value)
4
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
137 pdf_cols = ['_'.join([str(x) for x in reversed(p)])
eaf2444a2a50 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit de16c12e9e27d41d7c7624d7574c51b5bb8edff1-dirty"
jjohnson
parents: 3
diff changeset
138 if isinstance(p, tuple) else str(p)
1
c02f59711eb6 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit af9d36fa3efb1cf136a69e7ed1a5f06261f9b0d6-dirty"
jjohnson
parents: 0
diff changeset
139 for p in pdf.columns.tolist()]
2
6f05390deffa "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 1ca7433aaa606c636f796c75b6cfd8a080e2d5bc-dirty"
jjohnson
parents: 1
diff changeset
140 pdf.to_csv(args.output,
6f05390deffa "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 1ca7433aaa606c636f796c75b6cfd8a080e2d5bc-dirty"
jjohnson
parents: 1
diff changeset
141 sep='\t',
6f05390deffa "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 1ca7433aaa606c636f796c75b6cfd8a080e2d5bc-dirty"
jjohnson
parents: 1
diff changeset
142 float_format=args.float_format,
6f05390deffa "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 1ca7433aaa606c636f796c75b6cfd8a080e2d5bc-dirty"
jjohnson
parents: 1
diff changeset
143 header=pdf_cols)
0
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
144
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
145
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
146 if __name__ == "__main__":
621144f8dbe9 "planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/pandas_pivot_table/ commit 80684939b0bf75abb5cc70a9878054c1f734b651-dirty"
jjohnson
parents:
diff changeset
147 __main__()