Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- #!/usr/bin/python
- # -*- coding:utf-8 -*-
- import sys
# Characters folded away before the text is split into words: each key is the
# replacement text for every character listed in its value.
_REPLACEMENTS = {
    " ": ["’", "-"],
    "": [",", "?", "!", ".", ":", ";", "\"", "»", "«"],
    "e": ["é", "è", "ê", "ë"],
    "i": ["ï", "î"],
    "c": ["Ç", "ç"],
    "o": ["ô"],
    "a": ["à"],
    "u": ["ù"],
    "oe": ["œ"],
}

# Single-pass translation table. No replacement output is itself a replaced
# character, so one pass gives the same result as chained str.replace calls.
_TRANSLATION = str.maketrans(
    {char: target for target, chars in _REPLACEMENTS.items() for char in chars}
)


def _normalize(text):
    """Return *text* stripped, lower-cased and with the listed characters folded."""
    return text.strip().lower().translate(_TRANSLATION)


def _word_positions(words):
    """Map each word to the list of zero-based indexes at which it occurs."""
    positions = {}
    for index, word in enumerate(words):
        positions.setdefault(word, []).append(index)
    return positions


def do(filename):
    """Print, for every word of a text file, the positions where it occurs.

    The file is read as UTF-8, stripped, lower-cased, and has punctuation and
    accented characters folded (see ``_REPLACEMENTS``) before being split on
    whitespace. One line ``- <word>: <pos> <pos> ...`` is printed per distinct
    word, where positions are zero-based word indexes.

    Lines are ordered by ascending number of occurrences; words with the same
    number of occurrences are ordered by their first position.

    Requires Python 3 (``print`` function, ``open(..., encoding=...)``).

    Args:
        filename: Path of the text file to analyse.

    Returns:
        None. The result is written to standard output.

    Raises:
        OSError: If the file cannot be opened or read.
        UnicodeDecodeError: If the file is not valid UTF-8.
    """
    with open(filename, "r", encoding="utf-8") as f:
        words = _normalize(f.read()).split()

    # Sorting once by (occurrence count, first position) visits every
    # frequency group; counting upward from 1 and stopping at the first
    # missing count would skip any group that follows a gap.
    ranked = sorted(
        _word_positions(words).items(),
        key=lambda item: (len(item[1]), item[1][0]),
    )
    for word, indexes in ranked:
        print("- {}: {}".format(word, " ".join(map(str, indexes))))
if __name__ == "__main__":
    # Script entry point: the first command-line argument is the path of the
    # text file to analyse. Exit with a usage message (on stderr, non-zero
    # status) rather than an IndexError traceback when it is missing.
    if len(sys.argv) < 2:
        sys.exit("usage: {} FILE".format(sys.argv[0]))
    do(sys.argv[1])
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement