fork download
  1. import re
  2. documents = ["sent1. sent2. sent3. sent4. sent5.", "sent 1. sent 2... sent 3.... sent 4. sent 5..", "sent1.sent2.sent3.sent4.sent5."]
  3. dot_space_regex = re.compile(r'(?<=\.)\s+')
  4. for doc in documents:
  5. print(dot_space_regex.split(doc))
  6.  
Success #stdin #stdout 0.04s 9392KB
stdin
Standard input is empty
stdout
['sent1.', 'sent2.', 'sent3.', 'sent4.', 'sent5.']
['sent 1.', 'sent 2...', 'sent 3....', 'sent 4.', 'sent 5..']
['sent1.sent2.sent3.sent4.sent5.']