Ideone.com

fork download

copy

import re
 
# Surname particles that attach to the word following them.  Every entry ends
# with a single space so the list can be used for whole-word prefix checks
# (the original 'DAS' entry lacked it and would also have matched "DASILVA").
# The list is not used by the matching code below; `preps` encodes the same
# eleven particles as a regular expression.
preposition_lst = ['DE LO ', 'DE LA ', 'DE LAS ', 'DEL ', 'DELS ', 'DE LES ', 'DO ', 'DA ', 'DOS ', 'DAS ', 'DE ']
cases = ["DE BLAS ZAPATA", "MATIAS DE LA MANO", "LOPEZ FERNANDEZ DE VILLAVERDE", "DE MIGUEL DEL CORRAL", "VIDAL DE LA PEÑA", "MONTAVA DEL ARCO", "DOS CASAS VALLE"]

# Optional particle followed by one space:
#   DA, DAS, DE, DE LA, DE LAS, DE LES, DE LO, DEL, DELS, DO, DOS
preps = r'(?:D(?:AS?|E(?:[ ]L(?:AS?|ES|O)|LS?)?|OS?) )?'

# Up to three capture groups, anchored to the whole string:
#   1. [particle] word
#   2. optional: space, [particle] word
#   3. optional: " de ", [particle] word
# `[^\W\d_]+` is a run of letters (word characters minus digits and "_"),
# so accented letters such as "Ñ" are accepted.
pattern = fr'^({preps}[^\W\d_]+)( {preps}[^\W\d_]+)?( de {preps}[^\W\d_]+)?$'

# Compiled once so the loop does not re-resolve the pattern on every name.
# re.I makes it case insensitive (the literal " de " also matches " DE ").
_NAME_RE = re.compile(pattern, re.I)


def split_surnames(full_name):
    """Split *full_name* into its surname components.

    A particle listed in ``preps`` stays attached to the word that follows it.

    Args:
        full_name: The name string to split.

    Returns:
        A list of the matched components with surrounding whitespace
        stripped, or ``None`` when *full_name* does not match ``pattern``.
    """
    m = _NAME_RE.search(full_name)
    if m is None:
        return None
    # Unmatched optional groups are None; matched ones may carry the leading
    # separator space, hence the strip().
    return [part.strip() for part in m.groups() if part]


for case in cases:
    parts = split_surnames(case)
    if parts is not None:
        print(parts)
    else:
        print(f"No match for {case}")

Success #stdin #stdout 0.03s 9528KB

stdin

copy

Standard input is empty

stdout

copy

['DE BLAS', 'ZAPATA']
['MATIAS', 'DE LA MANO']
['LOPEZ', 'FERNANDEZ', 'DE VILLAVERDE']
['DE MIGUEL', 'DEL CORRAL']
['VIDAL', 'DE LA PEÑA']
['MONTAVA', 'DEL ARCO']
['DOS CASAS', 'VALLE']

https://ideone.com/Ts2MSz

language:

Python 3 (python 3.12)

created:

visibility:

public

Share or Embed source code

Discover > Sphere Engine API

The brand new service which powers Ideone!

Discover > IDE Widget

Widget for compiling and running the source code in a web browser!

Discover > Sphere Engine API

Discover > IDE Widget

Choose your language