view wordstream/main.py @ 0:8af3412e907a

initial import of wordstream
author k0s <k0scist@gmail.com>
date Fri, 01 Jan 2010 19:35:32 -0500
parents
children 0c2b1fe8f53f
line wrap: on
line source

#!/usr/bin/env python

import sys

import urllib2

from optparse import OptionParser
from pprint import pprint
from wordstream.api import Corpus

def main(args=sys.argv[1:]):
    """Command-line entry point: feed a corpus, then answer lines from stdin.

    Positional arguments are handed to ``Corpus.feed_stuff``.  Afterwards,
    lines are read from standard input until end-of-file; for every
    non-blank line the last whitespace-separated token is passed to
    ``Corpus.eat`` up to ``-n`` times and each truthy result is printed.

    :param args: command-line arguments to parse (defaults to the
                 arguments the process was started with).
    """
    parser = OptionParser()
    parser.add_option('--print-corpus', dest='print_corpus', default=False,
                      action='store_true')
    parser.add_option('-n', type='int', dest='n', default=1,
                      help='number of words to eat')
    # Parse the arguments that were actually passed in, so that calling
    # main([...]) programmatically does not silently fall back to sys.argv.
    options, args = parser.parse_args(args)

    corpus = Corpus()

    corpus.feed_stuff(*args)
    if options.print_corpus:
        pprint(corpus)

    # Honour the -n option instead of a hard-coded value.
    n = options.n

    while 1:
        try:
            stream = raw_input()
        except EOFError:
            # End of input (Ctrl-D or exhausted pipe): exit without a traceback.
            break
        splitstream = stream.split()
        if splitstream:
            for i in range(n):
                word = corpus.eat(splitstream[-1])
                if not word:
                    # Nothing came back for this token; wait for the next line.
                    break
                print(word)

# Run the command-line interface only when this file is executed as a
# script, not when it is imported as a module.
if __name__ == '__main__':
    main()