annotate wordstream/main.py @ 21:c05704d14958 default tip

py3
author Jeff Hammel <k0scist@gmail.com>
date Wed, 02 Feb 2022 16:15:36 +0000
parents 0c2b1fe8f53f
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
1 #!/usr/bin/env python
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
2
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
3 import sys
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
4
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
5 import urllib2
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
6
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
7 from optparse import OptionParser
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
8 from pprint import pprint
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
9 from wordstream.api import Corpus
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
10
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
11 def main(args=sys.argv[1:]):
5
0c2b1fe8f53f update documentation a little
k0s <k0scist@gmail.com>
parents: 0
diff changeset
12 parser = OptionParser('%prog [options] <path_or_url> <path_or_url> <...>')
0
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
13 parser.add_option('--print-corpus', dest='print_corpus', default=False,
5
0c2b1fe8f53f update documentation a little
k0s <k0scist@gmail.com>
parents: 0
diff changeset
14 action='store_true',
0c2b1fe8f53f update documentation a little
k0s <k0scist@gmail.com>
parents: 0
diff changeset
15 help="print the given corpus of associations")
0
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
16 parser.add_option('-n', type='int', dest='n', default=1,
5
0c2b1fe8f53f update documentation a little
k0s <k0scist@gmail.com>
parents: 0
diff changeset
17 help='number of words to eat per munch')
0
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
18 options, args = parser.parse_args()
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
19
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
20 corpus = Corpus()
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
21
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
22 corpus.feed_stuff(*args)
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
23 if options.print_corpus:
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
24 pprint(corpus)
5
0c2b1fe8f53f update documentation a little
k0s <k0scist@gmail.com>
parents: 0
diff changeset
25 sys.exit(0)
0
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
26
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
27 n = 1
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
28
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
29 while 1:
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
30 stream = raw_input()
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
31 splitstream = stream.split()
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
32 if splitstream:
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
33 for i in range(n):
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
34 word = corpus.eat(splitstream[-1])
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
35 if not word:
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
36 break
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
37 print word
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
38
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
39 if __name__ == '__main__':
8af3412e907a initial import of wordstream
k0s <k0scist@gmail.com>
parents:
diff changeset
40 main()