fork download
  1. import re
  2. text = "ITEM 1. and& ITEM 2. Traceback xd Item 1. ff942> in <mITEM 3. ITEM 4."
  3. i = "tem|TEM"
  4. regex = fr"I{{0,1}}({i})\s*\w+(?=\s*[-–—:<]|\.(?!\S))"
  5. lst = [x.group(1) for x in re.finditer(regex, text)]
  6. new_i = max(set(lst), key=lst.count)
  7. print( new_i )
  8. regex = fr"I{{0,1}}({new_i})\s*\w+(?=\s*[-–—:<]|\.(?!\S))"
  9. print( [x.group() for x in re.finditer(regex, text)] )
  10.  
  11.  
Success #stdin #stdout 0.03s 9572KB
stdin
Standard input is empty
stdout
TEM
['ITEM 1', 'ITEM 2', 'ITEM 3', 'ITEM 4']