Advertisement
Guest User

Untitled

a guest
Mar 5th, 2017
172
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.63 KB | None | 0 0
  1. import io
  2. import unicodedata
  3.  
  4. def isKanji(char):
  5. return (int("0x4e00", 16) <= int(hex(ord(char)),16) <= int("0x9faf", 16) or
  6. int("0x3400", 16) <= int(hex(ord(char)),16) <= int("0x4db5", 16))
  7.  
  8. filename = input("File name? (Must be in same directory as this file): ")
  9. spacing = int(input("Kanji per line?: " ))
  10.  
  11. with io.open(filename, 'r', encoding='utf8') as file:
  12. data = file.read()
  13.  
  14. kanji = set()
  15. for char in data:
  16. if isKanji(char):
  17. kanji.add(char)
  18.  
  19. i = 1
  20. with io.open("output.txt", 'w', encoding='utf8') as file:
  21. for k in kanji:
  22. file.write(k + " ")
  23. if i == spacing:
  24. file.write("\n")
  25. i = 0
  26. i += 1
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement