Advertisement
Guest User

Untitled

a guest
Nov 20th, 2018
99
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 2.75 KB | None | 0 0
  1. import pandas as pd
  2.  
  3. print("1=================")
  4. dict = {
  5. 'name': ['Jan', 'Adam'],
  6. 'surname': ['Kowalski', 'Nowak'],
  7. 'age': [25, 43]
  8. }
  9. print(dict)
  10. data_frame = pd.DataFrame(dict)
  11. print(data_frame)
  12.  
  13. print("2=================")
  14.  
  15. import numpy as np
  16.  
  17. array = np.array([1,2,3,4,5])
  18. print(array)
  19. data_frame = pd.DataFrame(array)
  20. print(data_frame)
  21.  
  22. print("3=================")
  23.  
  24. dict = {
  25. 'name': ['Jan', 'Adam'],
  26. 'surname': ['Kowalski', 'Nowak'],
  27. 'age': [25, 43]
  28. }
  29. data_frame = pd.DataFrame(dict)
  30. data_frame = data_frame.rename(index=str, columns={'name': 'first name', 'surname': 'last name'})
  31. print(data_frame)
  32.  
  33. print("4=================")
  34.  
  35. numbers = {
  36. 'numbers': [1,3,5,7,9,3]
  37. }
  38. data_frame = pd.DataFrame(numbers)
  39. print(data_frame)
  40. print(f'mean: {data_frame["numbers"].mean()}')
  41. print(f'median: {data_frame["numbers"].median()}')
  42. print(f'mode: {data_frame["numbers"].mode()}')
  43.  
  44. print("5=================")
  45.  
  46. dict = {
  47. 'col1': ['C1', 'C1', 'C2', 'C2', 'C2', 'C3', 'C2'],
  48. 'col2': [1,2,3,3,4,6,5]
  49. }
  50. data_frame = pd.DataFrame(dict)
  51. print(data_frame)
  52. print(data_frame.groupby('col1')['col2'].apply(list))
  53.  
  54. print("6=================")
  55.  
  56. dict = {
  57. 'name': ['Jan', 'Adam'],
  58. 'surname': ['Kowalski', 'Nowak'],
  59. 'age': [25, 43]
  60. }
  61. data_frame = pd.DataFrame(dict)
  62. data_frame = data_frame.drop('surname', axis=1)
  63. print(data_frame)
  64.  
  65. print("7=================")
  66.  
  67. dict = {
  68. 'col1': ['C1', 'C1', 'C2', 'C2', 'C2', 'C3', 'C2'],
  69. 'col2': [1,2,np.inf,3,-np.inf,np.inf,5]
  70. }
  71. data_frame = pd.DataFrame(dict)
  72. print(data_frame)
  73. data_frame = data_frame[(data_frame.col2 != np.inf) & (data_frame.col2 != -np.inf)]
  74. print(data_frame)
  75.  
  76. print("8=================")
  77.  
  78. data_frame = pd.DataFrame(np.random.randn(5, 3), columns=['col1', 'col2', 'col3'])
  79. print(data_frame)
  80. print(f'column 1: {data_frame.col1.idxmax()}')
  81. print(f'column 2: {data_frame.col2.idxmax()}')
  82. print(f'column 2: {data_frame.col3.idxmax()}')
  83.  
  84. print("9=================")
  85.  
  86. data_frame = pd.DataFrame({'x': [1, 2, 3, 4], 'y': [4, 5, 6, 7]})
  87. print(data_frame)
  88. print(data_frame[data_frame.columns[0]])
  89.  
  90. print("10=================")
  91.  
  92. data_frame = pd.read_csv('./Orange.csv')
  93. print(data_frame)
  94. print(data_frame.describe())
  95.  
  96. print("11=================")
  97.  
  98. import matplotlib.pyplot as plt
  99. from sqlalchemy import create_engine
  100.  
  101. data = pd.read_csv('./muscle.csv')
  102. engine = create_engine('sqlite:///:memory:')
  103. data.to_sql('data_table', engine)
  104. print(pd.read_sql_query('SELECT * FROM data_table', engine))
  105.  
  106. data["Length"].plot.hist(grid=True, bins=20, rwidth=0.9,
  107. color="lightblue")
  108. plt.title('Values of data[Length]')
  109. plt.xlabel('Frequency')
  110. plt.ylabel('Count')
  111. plt.grid(axis='y', alpha=0.75)
  112.  
  113. plt.show()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement