fork(1) download
  1. import re, sys, unicodedata
  2. s = "test1 this is a sample subscript o₁"
  3. No = [chr(i) for i in range(sys.maxunicode) if unicodedata.category(chr(i)) == 'No']
  4. print([x for x in re.findall(r'\b[^\W\d_]{2,}\b', s) if not any(y in x for y in No)])
Success #stdin #stdout 0.28s 27712KB
stdin
Standard input is empty
stdout
['this', 'is', 'sample', 'subscript']