63
|
1 #!/usr/bin/env python
|
|
2 # -*- coding: utf-8 -*-
|
|
3
|
|
4 """
|
68
|
5 Histograms
|
63
|
6
|
|
7 Unicode is awesome; see http://www.alanwood.net/unicode/block_elements.html
|
|
8 """
|
|
9
|
|
10 blocks = """
|
|
11 █
|
|
12 ▉
|
|
13 ▊
|
|
14 ▋
|
|
15 ▌
|
|
16 ▍
|
|
17 ▎
|
|
18 ▏
|
|
19 """
|
|
20
|
|
21 # imports
|
|
22 import argparse
|
|
23 import os
|
|
24 import sys
|
|
25 import time
|
75
|
26 from .data import transpose
|
63
|
27 from .read import CSVParser
|
64
|
28 from collections import OrderedDict
|
63
|
29
|
|
30 # module globals
|
64
|
31 __all__ = ['Histogram', 'HistogramParser', 'main']
|
|
32
|
|
33 class Histogram(object):
|
|
34 """historgram"""
|
63
|
35
|
64
|
36 def __init__(self, bins):
|
73
|
37 self.bins = sorted(bins)
|
64
|
38 assert len(bins) > 1
|
73
|
39 self.data = OrderedDict([(bin, [])
|
|
40 for bin in zip(bins[:-1],
|
|
41 bins[1:])])
|
64
|
42
|
70
|
43 def add(self, *values):
|
|
44 """add values to the histogram"""
|
71
|
45 for value in values:
|
72
|
46 for vmin, vmax in self.data.keys():
|
73
|
47 if vmin <= value < vmax:
|
72
|
48 self.data[(vmin, vmax)].append(value)
|
70
|
49
|
65
|
50 def __iadd__(self, value):
|
71
|
51 self.add(value)
|
65
|
52 return self
|
|
53
|
71
|
54 def __call__(self, *values):
|
|
55 """
|
|
56 add values to the histogram and return
|
|
57 OrderedDict of counts
|
|
58 """
|
|
59 self.add(*values)
|
73
|
60 return OrderedDict([(bin, len(value))
|
|
61 for bin, value in self.data.items()])
|
|
62
|
|
63 def keys(self):
|
|
64 return self.data.keys()
|
71
|
65
|
74
|
66 def max(self):
|
|
67 """return max length"""
|
|
68 return max([len(value) for value in self.data.values()])
|
|
69
|
|
70
|
64
|
71 class HistogramParser(CSVParser):
|
63
|
72 """histogram CLI option parser"""
|
|
73
|
|
74 def __init__(self, **kwargs):
|
|
75 kwargs.setdefault('formatter_class', argparse.RawTextHelpFormatter)
|
|
76 kwargs.setdefault('description', __doc__)
|
69
|
77 CSVParser.__init__(self, **kwargs)
|
63
|
78 self.add_argument('-n', '--bins', dest='n_bins', type=int,
|
|
79 help="number of bins")
|
|
80 self.options = None
|
|
81
|
|
82
|
|
83 def main(args=sys.argv[1:]):
|
|
84 """CLI"""
|
|
85
|
|
86 # parse command line options
|
|
87 parser = HistogramParser()
|
|
88 options = parser.parse_args(args)
|
|
89
|
75
|
90 # read data
|
|
91 data = parser.read()
|
|
92 if not data:
|
|
93 parser.error("No data given")
|
|
94
|
|
95 # transpose to columns
|
|
96 columns = transpose(data)
|
63
|
97
|
|
98 if __name__ == '__main__':
|
|
99 main()
|
|
100
|
|
101
|