#!/usr/bin/env python
import sys
sys.path.append('/home/pat/.pylib')
import re

# Matches one text element including its tags: a complete <p>...</p> or
# <li>...</li>.  Inline flags: case-insensitive, multiline and
# dot-matches-newline, so an element may span several lines.  The \b after
# each tag name stops longer tag names that merely start with the same
# letters (<pre>, <param>, <link>) from being mistaken for <p> / <li>.
r_paragraph = re.compile(r'(?ims)<p\b[^>]*>.*?</p>|<li\b[^>]*>.*?</li>')

# Tokens after which a full stop must NOT be treated as the end of a
# sentence: common abbreviations plus every single ASCII letter
# (presumably to cover initials and enumerations such as "J. Smith").
abbrs = (
    ['etc', 'ca', 'cf', 'Co', 'Ltd', 'Inc', 'Mt', 'Mr', 'Mrs',
     'Dr', 'Ms', 'Rev', 'Fr', 'St', 'Sgt', 'pron', 'approx', 'lit',
     'syn']
    + list('ABCDEFGHIJKLMNOPQRSTUVWXYZ')
    + list('abcdefghijklmnopqrstuvwxyz')
)

# Template for the first-sentence regex.  It lazily consumes at least five
# characters from the start of the string and stops either at a full stop
# that is followed by " " + capital/digit or by the end of the string, or at
# the end of the string itself.  The %s slot sits inside a negative
# look-behind, so the match may not end directly after an abbreviation.
t_sentence = r'^.{5,}?(?<!\b%s)(?:\.(?= [A-Z0-9]|\Z)|\Z)'

# Joining with ')(?<!\b' closes one look-behind and opens the next, giving
# every abbreviation its own fixed-width look-behind (required by `re`).
r_sentence = re.compile(t_sentence % r')(?<!\b'.join(abbrs))


def split_paragraphs(text):
    """Return all non-overlapping ``r_paragraph`` matches found in *text*.

    The matches are returned as a list, in the order they occur in *text*;
    the list is empty when nothing matches.
    """
    return r_paragraph.findall(text)

def split_sentences(text):
    """Placeholder for sentence splitting; not implemented yet.

    *text* is ignored and ``None`` is returned.
    """
    return None

if __name__ == "__main__":
    # Read the whole document from stdin.  A byte string (what Python 2
    # returns here) is decoded as UTF-8; a text string is used as-is.
    content = sys.stdin.read()
    if isinstance(content, bytes):
        content = content.decode('utf-8')

    paras = split_paragraphs(content)

    # First pass: dump every matched paragraph / list item verbatim.
    for para in paras:
        print(para)

    # Second pass: the same elements, each preceded by its index.
    # enumerate() yields (index, item) pairs, so both must be unpacked;
    # binding the pair to a single name left the index undefined.
    for i, p in enumerate(paras):
        print("----> " + str(i) + "\n" + p)
  
