Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
def parseText(text):
    """Print blank-line-separated records as pipe-delimited rows.

    ``text`` is split into groups on blank lines (``'\\n\\n'``).  A group
    may start with a date header, recognised by a spaced-out month
    abbreviation such as ``'J A N'``; that header becomes the DATE of the
    group and of every following group until another header appears.
    The remaining lines are ``ADD:``, ``BORROWER:`` and ``MTG:`` fields.
    A line without one of those prefixes is a continuation and is
    appended, space-separated, to the most recent field of the group.

    The table (header row ``ADD|BORROWER|MTG|DATE`` followed by one row
    per group that contains at least one field) is written to stdout
    with ``print``.  Missing fields, and the date when no header has
    been seen yet, are rendered as empty strings.

    Args:
        text: The raw text to parse.

    Returns:
        None.  The result is only printed.
    """
    months = ('J A N', 'F E B', 'M A R', 'A P R', 'M A Y', 'J U N',
              'J U L', 'A U G', 'S E P', 'O C T', 'N O V', 'D E C')
    field_names = ('ADD', 'BORROWER', 'MTG')

    rows = ['ADD|BORROWER|MTG|DATE']
    prev_date = ''
    for line_group in text.split('\n\n'):
        lines = line_group.split('\n')

        # str.split always yields at least one item, so lines[0] is safe.
        # Test the header once, before slicing, so that a field line is
        # never mistaken for a date and a date-only group cannot raise.
        if any(month in lines[0] for month in months):
            prev_date = lines[0]
            lines = lines[1:]

        out_line = {}
        prev_key = None
        for line in lines:
            if not line.strip():
                # Blank lines (e.g. from trailing newlines) carry no data.
                continue
            key = next(
                (name for name in field_names if line.startswith(name + ':')),
                None,
            )
            if key is not None:
                # Keep everything after the prefix, so values that contain
                # ': ' themselves are not truncated.
                out_line[key] = line[len(key) + 1:].strip()
                prev_key = key
            elif prev_key is not None:
                # Continuation line; prev_key is kept so that a field may
                # wrap over any number of lines.
                out_line[prev_key] = '%s %s' % (out_line[prev_key], line.strip())
            # A stray line before any field has nothing to attach to and
            # is ignored instead of raising KeyError.

        # Date-only or empty groups produce no row of their own.
        if out_line:
            values = [out_line.get(name, '') for name in field_names]
            values.append(prev_date)
            rows.append('|'.join(values))

    output = '\n'.join(rows) + '\n'
    print(output)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement