Guest User

Untitled

a guest
Feb 22nd, 2018
277
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 3.94 KB | None | 0 0
  1. import pandas as pd
  2. import pymysql
  3. import numpy as np
  4.  
  5.  
  def count_nicknames(names):
      """Return a ``{nickname: number_of_comments}`` dict for *names*.

      Args:
          names: pandas Series holding one nickname per comment.

      Returns:
          A plain dict ordered from the most to the least frequent nickname,
          with built-in ``int`` counts.
      """
      # Series.value_counts() sorts by frequency (descending) and to_dict()
      # keeps that order. This replaces the deprecated top-level
      # pd.value_counts() and the integer lookup count[i] on a Series that is
      # labelled by strings.
      return names.value_counts().to_dict()


  if __name__ == "__main__":
      db = pymysql.connect(host='localhost', user='root', passwd='',
                           database='mom_db', charset='utf8')
      try:
          df = pd.read_sql("SELECT * FROM comments ", db)
      finally:
          # Release the connection even when the query fails.
          db.close()

      name = df['nickname']

      a = count_nicknames(name)
      print(a)
      # To print a Series with only the nicknames that commented more than
      # once: counts = name.value_counts(); print(counts[counts > 1])
  18.  
  19. {'repeinik': 26, 'podberezowik': 24, 'Павел_Шуков_talks48': 20, 'stupich':
  20. 14, 'kipovets': 14, 'Лайош_Портиш': 13, 'vijigau_mraz': 13, 'наивная баба':
  21. 12, 'genek77': 12, 'Sergey_Petrov': 12, 'Андрей_Иванов_talks19': 11,
  22. 'Пачотны тунеядзец': 10, 'eugenenus_': 10, 'Настя_Романова': 9, 'Kac_Lol':
  23. 9, 'Ириша_Лалапусечка': 9, 'valstar78': 8, 'Сергей Александрович': 8,
  24. 'Tadeush_Тадеуш': 8, 'freedom for us': 7, 'Светлана_Малышкина': 7,
  25. 'Костя_Миронов': 7, 'SIgarA': 6, 'Жанна_Д-урк': 6, 'Fair play': 6,
  26. 'Лукашенко_Федор': 6, 'Lisa_Grodno': 5, 'id350886439': 5,......
  27.  
  28. repeinik 26
  29. podberezowik 24
  30. Павел_Шуков_talks48 20
  31. stupich 14
  32. kipovets 14
  33. Лайош_Портиш 13
  34. .......
  35.  
  # Sample mapping of nickname -> number of comments.
  d = {
      'repeinik': 26,
      'podberezowik': 24,
      'Павел_Шуков_talks48': 20,
      'stupich': 14,
      'kipovets': 14,
      'Лайош_Портиш': 13,
      'vijigau_mraz': 13,
      'наивная баба': 12,
      'genek77': 12,
  }

  # Both columns are left-aligned: 20 characters for the name, 15 for the value.
  print("{:<20} {:<15}".format('Name', 'Value'))
  # Unpack each (name, value) pair directly in the loop header; the loop body
  # must be indented under the ``for`` or Python raises IndentationError.
  for name, val in d.items():
      print("{:<20} {:<15}".format(name, val))
  42.  
  43. Name Value
  44. repeinik 26
  45. podberezowik 24
  46. Павел_Шуков_talks48 20
  47. ... ...
  48.  
  49. # pip install tabulate
  50. from tabulate import tabulate
  51.  
  # Sample mapping of nickname -> number of comments, one entry per line.
  d = {
      'repeinik': 26,
      'podberezowik': 24,
      'Павел_Шуков_talks48': 20,
      'stupich': 14,
      'kipovets': 14,
      'Лайош_Портиш': 13,
      'vijigau_mraz': 13,
      'наивная баба': 12,
      'genek77': 12,
  }
  # Render the (name, value) pairs as a grid table with a header row, then
  # print the finished table in one call.
  table = tabulate(d.items(), headers=['NAME', 'VALUE'], tablefmt="grid")
  print(table)
  56.  
  57. +---------------------+---------+
  58. | NAME | VALUE |
  59. +=====================+=========+
  60. | repeinik | 26 |
  61. +---------------------+---------+
  62. | podberezowik | 24 |
  63. +---------------------+---------+
  64. | Павел_Шуков_talks48 | 20 |
  65. +---------------------+---------+
  66. | stupich | 14 |
  67. +---------------------+---------+
  68. | kipovets | 14 |
  69. +---------------------+---------+
  70. | Лайош_Портиш | 13 |
  71. +---------------------+---------+
  72. | vijigau_mraz | 13 |
  73. +---------------------+---------+
  74. | наивная баба | 12 |
  75. +---------------------+---------+
  76. | genek77 | 12 |
  77. +---------------------+---------+
  78.  
  # Print the nickname -> comment-count pairs held in ``a`` as two left-aligned
  # columns (20 and 15 characters wide) under a header row.
  print('{:<20} {:<15}'.format('NickName', 'Numb_comm'))
  for name, n_comm in a.items():
      # The body must be indented under the ``for``; without it the snippet
      # fails with IndentationError.
      print('{:<20} {:<15}'.format(name, n_comm))
  82.  
  83. NickName Numb_comm
  84. repeinik 26
  85. podberezowik 24
  86. Павел_Шуков_talks48 20
  87. stupich 14
  88. kipovets 14
  89. Лайош_Портиш 13
  90. vijigau_mraz 13
  91. наивная баба 12
  92. genek77 12
  93.  
  94. In [41]: df = pd.DataFrame({
  95. 'name':np.random.choice(['aaa','bbb','ccc'], 500, p=[0.55, .3, .15])
  96. })
  97.  
  98. In [42]: df
  99. Out[42]:
  100. name
  101. 0 ccc
  102. 1 aaa
  103. 2 ccc
  104. 3 aaa
  105. 4 aaa
  106. 5 bbb
  107. 6 bbb
  108. .. ...
  109. 493 aaa
  110. 494 bbb
  111. 495 aaa
  112. 496 aaa
  113. 497 aaa
  114. 498 bbb
  115. 499 aaa
  116.  
  117. [500 rows x 1 columns]
  118.  
  119. In [43]: df.groupby('name').size()
  120. Out[43]:
  121. name
  122. aaa 269
  123. bbb 153
  124. ccc 78
  125. dtype: int64
  126.  
  127. In [44]: df.groupby('name').size().reset_index(name='count')
  128. Out[44]:
  129. name count
  130. 0 aaa 269
  131. 1 bbb 153
  132. 2 ccc 78
Add Comment
Please, Sign In to add comment