63
|
1 #!/usr/bin/env python
|
|
2 # -*- coding: utf-8 -*-
|
|
3
|
|
4 """
|
68
|
5 Histograms
|
63
|
6
|
|
7 Unicode is awesome; see http://www.alanwood.net/unicode/block_elements.html
|
|
8 """
|
|
9
|
|
10 blocks = """
|
|
11 █
|
|
12 ▉
|
|
13 ▊
|
|
14 ▋
|
|
15 ▌
|
|
16 ▍
|
|
17 ▎
|
|
18 ▏
|
|
19 """
|
|
20
|
|
21 # imports
|
|
22 import argparse
|
|
23 import os
|
|
24 import sys
|
|
25 import time
|
|
26 from .read import CSVParser
|
64
|
27 from collections import OrderedDict
|
63
|
28
|
|
29 # module globals
|
64
|
30 __all__ = ['Histogram', 'HistogramParser', 'main']
|
|
31
|
|
32 class Histogram(object):
|
|
33 """historgram"""
|
63
|
34
|
64
|
35 def __init__(self, bins):
|
73
|
36 self.bins = sorted(bins)
|
64
|
37 assert len(bins) > 1
|
73
|
38 self.data = OrderedDict([(bin, [])
|
|
39 for bin in zip(bins[:-1],
|
|
40 bins[1:])])
|
64
|
41
|
70
|
42 def add(self, *values):
|
|
43 """add values to the histogram"""
|
71
|
44 for value in values:
|
72
|
45 for vmin, vmax in self.data.keys():
|
73
|
46 if vmin <= value < vmax:
|
72
|
47 self.data[(vmin, vmax)].append(value)
|
70
|
48
|
65
|
49 def __iadd__(self, value):
|
71
|
50 self.add(value)
|
65
|
51 return self
|
|
52
|
71
|
53 def __call__(self, *values):
|
|
54 """
|
|
55 add values to the histogram and return
|
|
56 OrderedDict of counts
|
|
57 """
|
|
58 self.add(*values)
|
73
|
59 return OrderedDict([(bin, len(value))
|
|
60 for bin, value in self.data.items()])
|
|
61
|
|
62 def keys(self):
|
|
63 return self.data.keys()
|
71
|
64
|
74
|
65 def max(self):
|
|
66 """return max length"""
|
|
67 return max([len(value) for value in self.data.values()])
|
|
68
|
|
69
|
64
|
70 class HistogramParser(CSVParser):
|
63
|
71 """histogram CLI option parser"""
|
|
72
|
|
73 def __init__(self, **kwargs):
|
|
74 kwargs.setdefault('formatter_class', argparse.RawTextHelpFormatter)
|
|
75 kwargs.setdefault('description', __doc__)
|
69
|
76 CSVParser.__init__(self, **kwargs)
|
63
|
77 self.add_argument('-n', '--bins', dest='n_bins', type=int,
|
|
78 help="number of bins")
|
|
79 self.options = None
|
|
80
|
|
81
|
|
82 def main(args=sys.argv[1:]):
|
|
83 """CLI"""
|
|
84
|
|
85 # parse command line options
|
|
86 parser = HistogramParser()
|
|
87 options = parser.parse_args(args)
|
|
88
|
|
89
|
|
90 if __name__ == '__main__':
|
|
91 main()
|
|
92
|
|
93
|