Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# -*- coding: utf-8 -*-
import re

# Matches one compound surname built around a particle ("del", "de", "san",
# "la"): an optional preceding word, the particle, an optional article
# ("las", "la", "los") and an optional following word.  The ``\b`` anchors
# keep the particles from matching inside ordinary words ("paredes",
# "lacalle", "blanco"), and IGNORECASE lets the pattern run on the caller's
# original text so match offsets line up with it.
regex = re.compile(
    r"(\b(?:\w+ )?(?:del|de|san|la)\b(?: (?:las|la|los)\b)?(?: \w+)?)",
    re.IGNORECASE,
)


def split_last_name(last_name):
    """Split a surname string around its first particle-based compound.

    The first compound surname found by ``regex`` is kept together as one
    element; any text before and after it becomes separate elements.

    Args:
        last_name: Surname text, e.g. ``'del corral lopez'``.

    Returns:
        A list of strings in their original order.  The compound is
        returned lowercased; the surrounding parts are stripped and
        title-cased, and empty parts are omitted.  If no compound is
        found, the list holds ``last_name`` unchanged.

    Examples:
        >>> split_last_name('del corral lopez')
        ['del corral', 'Lopez']
        >>> split_last_name('paredes bastidas de uribe')
        ['Paredes', 'bastidas de uribe']
        >>> split_last_name('guillermo del toro')
        ['guillermo del toro']
        >>> split_last_name('garcia lopez')
        ['garcia lopez']
    """
    match = regex.search(last_name)
    if match is None:
        return [last_name]

    # Slice by match offsets instead of str.split(): splitting on the
    # lowercased match text fails whenever the input contains capitals.
    start, end = match.span(1)
    before = last_name[:start].strip()
    after = last_name[end:].strip()

    names = []
    if before:
        names.append(before.title())
    names.append(match.group(1).lower())
    if after:
        names.append(after.title())
    return names
# Sample surnames used to exercise split_last_name.  The short name ``l`` is
# kept so anything that already refers to this module-level list still works.
l = [  # noqa: E741
    'guillermo del toro',
    'de la fuente',
    'del corral lopez',
    'de los santos vera',
    'carrasco de la cruz',
    'garcia de sobrecasa',
    'alvarez de arenales',
    'martinez de hoz',
    'lopez de lacalle',
    'velez de guevara',
    'la algo Jardines',
    'la cruz marin',
    'Agape ponte de silva',
    'paredes bastidas de uribe',
    'bastidas de uribe chavez',
    'ruiz gutierrez de perez',
    'yataco la fauci',
    'del pielago zevallos',
]

# Print the split result for every sample.  The single-argument call form of
# print behaves the same on Python 2 and Python 3.
for name in l:
    print(split_last_name(name))
Add Comment
Please, Sign In to add comment