# -*- coding: utf-8 -*-
# http://stackoverflow.com/q/32872917/5290909
# Written for Python 2.7.9 (relies on the Python 2-only ur'' literal and print statement)
import re
text = "Solo voy si se sucedierón o se suceden mañana los siguienñes eventos:"
# Decode to unicode
unicode_text = text.decode('utf8')
matches = re.findall(ur'\b\w+\b', unicode_text, re.UNICODE)
# Encode back again to UTF-8
utf8_matches = [ match.encode('utf-8') for match in matches ]
# Print every word
for utf8_word in utf8_matches:
print utf8_word
IyAtKi0gY29kaW5nOiB1dGYtOCAtKi0KIyBodHRwOi8vc3RhY2tvdmVyZmxvdy5jb20vcS8zMjg3MjkxNy81MjkwOTA5CiNweXRob24gMi43LjkKCmltcG9ydCByZQogICAgIAp0ZXh0ID0gIlNvbG8gdm95IHNpIHNlIHN1Y2VkaWVyw7NuIG8gc2Ugc3VjZWRlbiBtYcOxYW5hIGxvcyBzaWd1aWVuw7FlcyBldmVudG9zOiIKIyBEZWNvZGUgdG8gdW5pY29kZQp1bmljb2RlX3RleHQgPSB0ZXh0LmRlY29kZSgndXRmOCcpCgptYXRjaGVzID0gcmUuZmluZGFsbCh1cidcYlx3K1xiJywgdW5pY29kZV90ZXh0LCByZS5VTklDT0RFKQoKIyBFbmNvZGUgYmFjayBhZ2FpbiB0byBVVEYtOAp1dGY4X21hdGNoZXMgPSBbIG1hdGNoLmVuY29kZSgndXRmLTgnKSBmb3IgbWF0Y2ggaW4gbWF0Y2hlcyBdCgojIFByaW50IGV2ZXJ5IHdvcmQKZm9yIHV0Zjhfd29yZCBpbiB1dGY4X21hdGNoZXM6CiAgICBwcmludCB1dGY4X3dvcmQ=