Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import io
- import unicodedata
def isKanji(char: str) -> bool:
    """Return True if *char* is a kanji in one of the two accepted ranges.

    The accepted code-point ranges are U+4E00..U+9FAF and U+3400..U+4DB5
    (both bounds inclusive).

    Args:
        char: A single character; ``ord`` raises ``TypeError`` for strings
            of any other length.

    Returns:
        True when the character's code point lies in either range.
    """
    # NOTE(review): the Unicode blocks these ranges sit in extend to U+9FFF
    # and U+4DBF respectively -- confirm whether the upper bounds should be
    # widened before changing them.
    code_point = ord(char)
    return 0x4E00 <= code_point <= 0x9FAF or 0x3400 <= code_point <= 0x4DB5
# Ask for the input file and for how many kanji go on each output line.
filename = input("File name? (Must be in same directory as this file): ")
spacing = int(input("Kanji per line?: " ))

with io.open(filename, 'r', encoding='utf8') as file:
    data = file.read()

# Collect each distinct kanji once, in order of first appearance.  Iterating
# a plain set of strings yields an arbitrary order that can differ from run
# to run, which made output.txt non-reproducible.
seen = set()
kanji = []
for char in data:
    if isKanji(char) and char not in seen:
        seen.add(char)
        kanji.append(char)

# Write the kanji separated by spaces, breaking the line after every
# `spacing` entries.
with io.open("output.txt", 'w', encoding='utf8') as file:
    for i, k in enumerate(kanji, start=1):
        file.write(k + " ")
        # A non-positive spacing never triggers a line break, so everything
        # is written on a single line in that case.
        if spacing > 0 and i % spacing == 0:
            file.write("\n")
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement