#!/usr/bin/env python import sys sys.path.append('/home/pat/.pylib') import re r_paragraph = re.compile(r'(?ims)]*>.*?

|]*>.*?') abbrs = ['etc', 'ca', 'cf', 'Co', 'Ltd', 'Inc', 'Mt', 'Mr', 'Mrs', 'Dr', 'Ms', 'Rev', 'Fr', 'St', 'Sgt', 'pron', 'approx', 'lit', 'syn'] \ + list('ABCDEFGHIJKLMNOPQRSTUVWXYZ') \ + list('abcdefghijklmnopqrstuvwxyz') t_sentence = r'^.{5,}?(? " + str(i) + "\n" + p