#!/usr/bin/env python
import sys
sys.path.append('/home/pat/.pylib')
import re
# Matches one block of body text in an HTML page: either a complete
# <p ...>...</p> element or a complete <li ...>...</li> element.
#   (?i) tag names are matched case-insensitively
#   (?m) multiline mode (kept from the original flag set)
#   (?s) '.' also matches newlines, so an element may span several lines
# The '.*?' is non-greedy so each match stops at the first closing tag.
# The (?!n) lookahead keeps '<link ...>' from being mistaken for '<li ...>'.
# NOTE(review): the literal was split over three lines with its '<...' pieces
# missing (a syntax error); the pattern below is reconstructed from the
# surviving fragments ']*>.*?' and '|]*>.*?' -- confirm against the upstream
# original, in particular the (?!n) guard.
r_paragraph = re.compile(
    r'(?ims)<p[^>]*>.*?</p>|<li(?!n)[^>]*>.*?</li>'
)
# Tokens after which a full stop does not end a sentence: common
# abbreviations and titles, followed by every single ASCII letter
# (upper case first, then lower case) so that initials are covered too.
abbrs = [
    'etc', 'ca', 'cf', 'Co', 'Ltd', 'Inc', 'Mt', 'Mr', 'Mrs',
    'Dr', 'Ms', 'Rev', 'Fr', 'St', 'Sgt', 'pron', 'approx', 'lit',
    'syn',
]
abbrs.extend('ABCDEFGHIJKLMNOPQRSTUVWXYZ')
abbrs.extend('abcdefghijklmnopqrstuvwxyz')
# NOTE(review): this line is damaged. The raw-string literal opened after
# `t_sentence =` is never closed, and the trailing `" + str(i) + "\n" + p`
# looks like the tail of a different statement, so whatever sat between the
# two fragments is missing. Restore the full pattern and the lost statements
# from the original source before running; as written this is a syntax error.
t_sentence = r'^.{5,}?(? " + str(i) + "\n" + p