view python/stripirssi.py @ 516:c78da6f7ca79

python/quotemail.py
author Jeff Hammel <jhammel@mozilla.com>
date Thu, 19 Sep 2013 11:21:07 -0700
parents 3982b7ad596b
children
line wrap: on
line source

#!/usr/bin/env python

import optparse
import os
import sys

"""
strip irssi comments and format
"""

# TODO : -> textshaper

### generic functionality

string = (basestring,)

class splitlines(object):
    def __init__(self, function):
        self.function = function
    def __call__(self, lines, *args, **kwargs):
        if isinstance(lines, string):
            lines = lines.strip().splitlines()
        self.function(lines, *args, **kwargs)

@splitlines
def strip(lines):
    return [line.strip() for line in lines]

@splitlines
def strip_first_column(lines, separator=None):
    """
    removes leading column (defined by separator) from lines of text
    """
    # TODO: -> genericize
    # - and handle whitespace more generically

    length = None # length of first column
    stripped = []
    for line in lines:
        if not line:
            continue # XXX desirable?
        try:
                prefix, rest = line.split(separator, 1)
        except ValueError:
                import pdb; pdb.set_trace()
                prefix, rest = None, None
        if length is None:
            length = len(prefix)
        else:
            if len(prefix) != length:
                if not line[:len(prefix)].isspace():
                    raise AssertionError("Non whitespace found below pre (%s) in line %s" % (length, line))
        stripped.append(line[length:])
    return stripped

@splitlines
def remove_lines(lines, startswith):
    return [line for line in lines
            if line.startswith(startswith)]
    # really, one could take most functions for str and map -> lines

@splitlines
def remove_prefix_stamp(lines, stamp):
    """removes leading stamp: HH:MM"""
    return [line[len(stamp):] for line in lines]

@splitlines
def join(lines):
    """DOCUMENT ME!"""
    last = None
    joined = []
    for line in lines:
        if line:
            if line[0].isspace():
                line = line.strip()
                if not line:
                    if last:
                        joined.append(last)
                    continue
                if last:
                    last = '%s %s' % (last, line.strip())
                else:
                    joined.append(line.strip())
            else:
                if last:
                    joined.append(last)
                    last = line.rstrip()
        else:
            if last:
                joined.append(last)
    return joined

### CLI



def main(args=sys.argv[1:]):

    # parse command line
    usage = '%prog [options]'
    parser = optparse.OptionParser(usage=usage, description=__doc__)
    parser.add_option('-i', '--in-place', dest='in_place',
                      help="rewrite files in place")
    #    parser.add_option - strip timestamps only
    #    parser.add_option - strip nicks
    options, args = parser.parse_args(args)

    log = sys.stdin.read().strip()

    # strip timestamps
    lines = strip_first_column(log)

    import pdb; pdb.set_trace()
    

    print '\n'.join(lines)

if __name__ == '__main__':
    main()