Advertisement
ShrekOP

Assg25

Dec 14th, 2022
45
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.06 KB | None | 0 0
  1. import pandas as pd
  2. df=pd.read_csv("covid_19_india.csv")
  3.  
  4. print(df)
  5.  
  6. #detecting NA values
  7. df.isnull()
  8.  
  9. import numpy as np
  10. missing_values=["N/a","na",np.nan,0]
  11. df=pd.read_csv("covid_19_india.csv",na_values=missing_values)
  12. df
  13.  
  14. df.isnull()
  15.  
  16. df.isnull().sum()
  17.  
  18. import seaborn as sns
  19. sns.heatmap(df.isnull(),yticklabels=False)
  20.  
  21. #removing NA values
  22. df.dropna()
  23.  
  24. df.dropna(how='all')
  25.  
  26. #filling data
  27. df.fillna(0)
  28.  
  29. df_next=df.fillna(method='bfill')
  30. df_next
  31.  
  32. df.interpolate()
  33.  
  34. #transforming data
  35. df.drop(['Date','Time'],axis=1)
  36.  
  37. from pandas import DataFrame
  38. series_obj=Series(np.arange(6))
  39. series_obj.name="added_variable"
  40. series_obj
  41.  
  42. added=DataFrame.join(df,series_obj)
  43. added
  44.  
  45. #sorting
  46. print(df_next.sort_values(['Cured','Confirmed'], ascending=True))
  47.  
  48. import matplotlib.pyplot as plt
  49. x=df_next['Confirmed']
  50. plt.hist(x,bins=25,color='green',edgecolor='blue',alpha=0.5)
  51. plt.title("Histogram")
  52. plt.xlabel('Cured')
  53. plt.ylabel('Deaths')
  54.  
  55. x=df['Cured']
  56. y=df['Deaths']
  57. plt.scatter(x,y,c=df['Cured'], s=df['Deaths'],marker='D',alpha=0.4)
  58.  
  59.  
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement