import string
import unicodedata as ud

# Deletion table for ASCII punctuation (string.punctuation), built once
# instead of once per word.
_PUNCT_TABLE = str.maketrans('', '', string.punctuation)


def _has_cyrillic(word):
    """Return True if any character of *word* has 'CYRILLIC' in its Unicode name."""
    # ud.name(c) raises ValueError for code points that have no name (e.g.
    # control characters); passing '' as the default makes such characters
    # simply count as non-Cyrillic.
    return any('CYRILLIC' in ud.name(c, '') for c in word)


def cyrillic_words(text, *, strip_punctuation=False):
    """Return the whitespace-separated words of *text* that contain Cyrillic.

    Args:
        text: The string to scan; it is split with ``str.split()``.
        strip_punctuation: When true, every character listed in
            ``string.punctuation`` (ASCII punctuation only) is removed from
            each returned word.

    Returns:
        A list of the matching words, in their original order.
    """
    words = [word for word in text.split() if _has_cyrillic(word)]
    if strip_punctuation:
        words = [word.translate(_PUNCT_TABLE) for word in words]
    return words


text = "des поместья, de la famille Buonaparte. Non, je vous préviens que si vous"
print(' '.join(cyrillic_words(text)))
# => поместья,

# If you also need to strip any punctuation:
print(' '.join(cyrillic_words(text, strip_punctuation=True)))
# => поместья
# Base64-encoded copy of this snippet (data, not executable code):
# aW1wb3J0IHVuaWNvZGVkYXRhIGFzIHVkCnRleHQgPSAiZGVzINC/0L7QvNC10YHRgtGM0Y8sIGRlIGxhIGZhbWlsbGUgQnVvbmFwYXJ0ZS4gTm9uLCBqZSB2b3VzIHByJiMyMzM7dmllbnMgcXVlIHNpIHZvdXMiCnByaW50KCcgJy5qb2luKFt3b3JkIGZvciB3b3JkIGluIHRleHQuc3BsaXQoKSBpZiBhbnkoJ0NZUklMTElDJyBpbiB1ZC5uYW1lKGMpIGZvciBjIGluIHdvcmQpXSkpCiMgPT4g0L/QvtC80LXRgdGC0YzRjywKCiMgSWYgeW91IGFsc28gbmVlZCB0byBzdHJpcCBhbnkgcHVuY3R1YXRpb246CmltcG9ydCBzdHJpbmcKcHJpbnQoCgknICcuam9pbihbCgkJCXdvcmQudHJhbnNsYXRlKHN0ci5tYWtldHJhbnMoJycsICcnLCBzdHJpbmcucHVuY3R1YXRpb24pKQoJCQlmb3Igd29yZCBpbiB0ZXh0LnNwbGl0KCkKCQkJaWYgYW55KCdDWVJJTExJQycgaW4gdWQubmFtZShjKSBmb3IgYyBpbiB3b3JkKQoJCV0pCikKIyA9PiDQv9C+0LzQtdGB0YLRjNGP