Guest User

Untitled

a guest
Mar 18th, 2018
91
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 2.01 KB | None | 0 0
  1. # -*- coding: utf-8 -*-
  2. import os, sys, re
  3.  
  4. def main():
  5.  
  6. pattern = re.compile(r"<<(.+?)>>")
  7.  
  8. from collections import defaultdict
  9. frequency = defaultdict(int)/Users/it/home_dl/chainer_rnn/result/op_line_filter_hira_correct_spm_4k_unit=2000/log
  10.  
  11. with open(sys.argv[1]) as f:
  12. for line in f:
  13. line = line.strip()
  14.  
  15. match = re.search(pattern, line)
  16. if match is None:
  17. pass
  18. else:
  19. before = match.group(1)
  20.  
  21. frequency[before] += 1
  22.  
  23. for k, v in sorted(frequency.items(), key=lambda x:x[1],reverse=True):
  24. print (k, v)
  25.  
  26. main()
  27.  
  28. # Python 正規表現でマッチした箇所を利用して置換する
  29. # ラムダ式を使う。
  30.  
  31. import re
  32.  
  33. text = 'あいうえお'
  34. regex_pattern = re.compile('(。|?|\?|\n)')
  35. sentence = re.sub(regex_pattern, lambda m:str(m.group() + '###') , text)
  36. # 'あ###いうえ###お'
  37.  
  38.  
  39. # 半角スペース区切りのテキストを入力し要素ごとの頻度を出力する。
  40.  
  41. import sys
  42.  
  43. from collections import defaultdict
  44. frequency = defaultdict(int)
  45.  
  46. with open(sys.argv[1]) as f:
  47. lines = f.readlines()
  48.  
  49. for line in lines:
  50. line = line.strip()
  51. morphs = line.split(" ")
  52.  
  53. for morph in morphs:
  54. frequency[morph] += 1
  55.  
  56. for k, v in sorted(frequency.items(), key=lambda x:x[1], reverse=True):
  57. print(k, v)
  58.  
  59.  
  60. # pythonの正規表現でのマッチ部分捕捉
  61.  
  62. import sys, re
  63.  
  64. # pn_ja.dic
  65. # 優れる:すぐれる:動詞:1
  66. pattern = re.compile(r"^(\S+?)\:(\S+?)\:(\S+?)\:(\S+)$")
  67.  
  68.  
  69.  
  70. with open(sys.argv[1]) as f:
  71. for line in f:
  72. line = line.strip()
  73.  
  74. if line is None:
  75. pass
  76. else:
  77. match = re.search(pattern, line)
  78. if match is None:
  79. print('Not match')
  80. else:
  81. term = match.group(1)
  82. yomi = match.group(2)
  83. klass = match.group(3)
  84. pn_score = match.group(4)
  85.  
  86. print(term, yomi, klass, pn_score)
Add Comment
Please, Sign In to add comment