Advertisement
PyNoob1

Step 1: Downloading historical data

Jun 11th, 2021
151
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 10.16 KB | None | 0 0
  1. import pandas as pd
  2. from datetime import datetime
  3.  
  4. start = datetime.now()
  5. print("Downloading data for Season 2019")
  6. Season_2019 = pd.read_excel(r"https://football-data.co.uk/mmz4281/1920/all-euro-data-2019-2020.xlsx", sheet_name=None)
  7. print("Downloading data for Season 2019 completed successfully")
  8. print("Concatenating data for Season 2019")
  9. Season_2019_c = pd.concat(Season_2019, axis=0, ignore_index=True)
  10. print("Concatenating data for Season 2019 completed successfully")
  11. print("Downloading data for Season 2018")
  12. Season_2018 = pd.read_excel(r"https://football-data.co.uk/mmz4281/1819/all-euro-data-2018-2019.xlsx", sheet_name=None)
  13. print("Downloading data for Season 2018 completed successfully")
  14. print("Concatenating data for Season 2018")
  15. Season_2018_c = pd.concat(Season_2018, axis=0, ignore_index=True)
  16. print("Concatenating data for Season 2018 completed successfully")
  17. print("Downloading data for Season 2017")
  18. Season_2017 = pd.read_excel(r"https://football-data.co.uk/mmz4281/1718/all-euro-data-2017-2018.xlsx", sheet_name=None)
  19. print("Concatenating data for Season 2017")
  20. Season_2017_c = pd.concat(Season_2017, axis=0, ignore_index=True)
  21. print("Concatenating data for Season 2017 completed successfully")
  22. print("Downloading data for Season 2016")
  23. Season_2016 = pd.read_excel(r"https://football-data.co.uk/mmz4281/1617/all-euro-data-2016-2017.xls", sheet_name=None)
  24. print("Concatenating data for Season 2016")
  25. Season_2016_c = pd.concat(Season_2016, axis=0, ignore_index=True)
  26. print("Concatenating data for Season 2016 completed successfully")
  27. print("Downloading data for Season 2015")
  28. Season_2015 = pd.read_excel(r"https://football-data.co.uk/mmz4281/1516/all-euro-data-2015-2016.xls", sheet_name=None)
  29. print("Concatenating data for Season 2015")
  30. Season_2015_c = pd.concat(Season_2015, axis=0, ignore_index=True)
  31. print("Concatenating data for Season 2015 completed successfully")
  32. print("Downloading data for Season 2014")
  33. Season_2014 = pd.read_excel(r"https://football-data.co.uk/mmz4281/1415/all-euro-data-2014-2015.xls", sheet_name=None)
  34. print("Concatenating data for Season 2014")
  35. Season_2014_c = pd.concat(Season_2014, axis=0, ignore_index=True)
  36. print("Concatenating data for Season 2014 completed successfully")
  37. print("Downloading data for Season 2013")
  38. Season_2013 = pd.read_excel(r"https://football-data.co.uk/mmz4281/1314/all-euro-data-2013-2014.xls", sheet_name=None)
  39. print("Concatenating data for Season 2013")
  40. Season_2013_c = pd.concat(Season_2013, axis=0, ignore_index=True)
  41. print("Concatenating data for Season 2013 completed successfully")
  42. print("Downloading data for Season 2012")
  43. Season_2012 = pd.read_excel(r"https://football-data.co.uk/mmz4281/1213/all-euro-data-2012-2013.xls", sheet_name=None)
  44. print("Concatenating data for Season 2012")
  45. Season_2012_c = pd.concat(Season_2012, axis=0, ignore_index=True)
  46. print("Concatenating data for Season 2012 completed successfully")
  47. print("Downloading data for Season 2011")
  48. Season_2011 = pd.read_excel(r"https://football-data.co.uk/mmz4281/1112/all-euro-data-2011-2012.xls", sheet_name=None)
  49. print("Concatenating data for Season 2011")
  50. Season_2011_c = pd.concat(Season_2011, axis=0, ignore_index=True)
  51. print("Concatenating data for Season 2011 completed successfully")
  52. print("Downloading data for Season 2010")
  53. Season_2010 = pd.read_excel(r"https://football-data.co.uk/mmz4281/1011/all-euro-data-2010-2011.xls", sheet_name=None)
  54. print("Concatenating data for Season 2010")
  55. Season_2010_c = pd.concat(Season_2010, axis=0, ignore_index=True)
  56. print("Concatenating data for Season 2010 completed successfully")
  57. print("Downloading data for Season 2009")
  58. Season_2009 = pd.read_excel(r"https://football-data.co.uk/mmz4281/0910/all-euro-data-2009-2010.xls", sheet_name=None)
  59. print("Concatenating data for Season 2009")
  60. Season_2009_c = pd.concat(Season_2009, axis=0, ignore_index=True)
  61. print("Concatenating data for Season 2009 completed successfully")
  62. print("Downloading data for Season 2008")
  63. Season_2008 = pd.read_excel(r"https://football-data.co.uk/mmz4281/0809/all-euro-data-2008-2009.xls", sheet_name=None)
  64. print("Concatenating data for Season 2008")
  65. Season_2008_c = pd.concat(Season_2008, axis=0, ignore_index=True)
  66. print("Concatenating data for Season 2008 completed successfully")
  67. print("Downloading data for Season 2007")
  68. Season_2007 = pd.read_excel(r"https://football-data.co.uk/mmz4281/0708/all-euro-data-2007-2008.xls", sheet_name=None)
  69. print("Concatenating data for Season 2007")
  70. Season_2007_c = pd.concat(Season_2007, axis=0, ignore_index=True)
  71. print("Concatenating data for Season 2007 completed successfully")
  72. print("Downloading data for Season 2006")
  73. Season_2006 = pd.read_excel(r"https://football-data.co.uk/mmz4281/0607/all-euro-data-2006-2007.xls", sheet_name=None)
  74. print("Concatenating data for Season 2006")
  75. Season_2006_c = pd.concat(Season_2006, axis=0, ignore_index=True)
  76. print("Concatenating data for Season 2006 completed successfully")
  77. print("Downloading data for Season 2005")
  78. Season_2005 = pd.read_excel(r"https://football-data.co.uk/mmz4281/0506/all-euro-data-2005-2006.xls", sheet_name=None)
  79. print("Concatenating data for Season 2005")
  80. Season_2005_c = pd.concat(Season_2005, axis=0, ignore_index=True)
  81. print("Concatenating data for Season 2005 completed successfully")
  82. print("Downloading data for Season 2004")
  83. Season_2004 = pd.read_excel(r"https://football-data.co.uk/mmz4281/0405/all-euro-data-2004-2005.xls", sheet_name=None)
  84. print("Concatenating data for Season 2004")
  85. Season_2004_c = pd.concat(Season_2004, axis=0, ignore_index=True)
  86. print("Concatenating data for Season 2004 completed successfully")
  87. print("Downloading data for Season 2003")
  88. Season_2003 = pd.read_excel(r"https://football-data.co.uk/mmz4281/0304/all-euro-data-2003-2004.xls", sheet_name=None)
  89. print("Concatenating data for Season 2003")
  90. Season_2003_c = pd.concat(Season_2003, axis=0, ignore_index=True)
  91. print("Concatenating data for Season 2003 completed successfully")
  92. print("Downloading data for Season 2002")
  93. Season_2002 = pd.read_excel(r"https://football-data.co.uk/mmz4281/0203/all-euro-data-2002-2003.xls", sheet_name=None)
  94. print("Concatenating data for Season 2002")
  95. Season_2002_c = pd.concat(Season_2002, axis=0, ignore_index=True)
  96. print("Concatenating data for Season 2002 completed successfully")
  97. print("Downloading data for Season 2001")
  98. Season_2001 = pd.read_excel(r"https://football-data.co.uk/mmz4281/0102/all-euro-data-2001-2002.xls", sheet_name=None)
  99. print("Concatenating data for Season 2001")
  100. Season_2001_c = pd.concat(Season_2001, axis=0, ignore_index=True)
  101. print("Concatenating data for Season 2001 completed successfully")
  102. print("Downloading data for Season 2000")
  103. Season_2000 = pd.read_excel(r"https://football-data.co.uk/mmz4281/0001/all-euro-data-2000-2001.xls", sheet_name=None)
  104. print("Concatenating data for Season 2000")
  105. Season_2000_c = pd.concat(Season_2000, axis=0, ignore_index=True)
  106. print("Concatenating data for Season 2000 completed successfully")
  107. print("Downloading data for Season 1999")
  108. Season_1999 = pd.read_excel(r"https://football-data.co.uk/mmz4281/9900/all-euro-data-1999-2000.xls", sheet_name=None)
  109. print("Concatenating data for Season 1999")
  110. Season_1999_c = pd.concat(Season_1999, axis=0, ignore_index=True)
  111. print("Concatenating data for Season 1999 completed successfully")
  112. print("Downloading data for Season 1998")
  113. Season_1998 = pd.read_excel(r"https://football-data.co.uk/mmz4281/9899/all-euro-data-1998-1999.xls", sheet_name=None)
  114. print("Concatenating data for Season 1998")
  115. Season_1998_c = pd.concat(Season_1998, axis=0, ignore_index=True)
  116. print("Concatenating data for Season 1998 completed successfully")
  117. print("Downloading data for Season 1997")
  118. Season_1997 = pd.read_excel(r"https://football-data.co.uk/mmz4281/9798/all-euro-data-1997-1998.xls", sheet_name=None)
  119. print("Concatenating data for Season 1997")
  120. Season_1997_c = pd.concat(Season_1997, axis=0, ignore_index=True)
  121. print("Concatenating data for Season 1997 completed successfully")
  122. print("Downloading data for Season 1996")
  123. Season_1996 = pd.read_excel(r"https://football-data.co.uk/mmz4281/9697/all-euro-data-1996-1997.xls", sheet_name=None)
  124. print("Concatenating data for Season 1996")
  125. Season_1996_c = pd.concat(Season_1996, axis=0, ignore_index=True)
  126. print("Concatenating data for Season 1996 completed successfully")
  127. print("Downloading data for Season 1995")
  128. Season_1995 = pd.read_excel(r"https://football-data.co.uk/mmz4281/9596/all-euro-data-1995-1996.xls", sheet_name=None)
  129. print("Concatenating data for Season 1995")
  130. Season_1995_c = pd.concat(Season_1995, axis=0, ignore_index=True)
  131. print("Concatenating data for Season 1995 completed successfully")
  132. print("Downloading data for Season 1994")
  133. Season_1994 = pd.read_excel(r"https://football-data.co.uk/mmz4281/9495/all-euro-data-1994-1995.xls", sheet_name=None)
  134. print("Concatenating data for Season 1994")
  135. Season_1994_c = pd.concat(Season_1994, axis=0, ignore_index=True)
  136. print("Concatenating data for Season 1994 completed successfully")
  137. print("Downloading data for Season 1993")
  138. Season_1993 = pd.read_excel(r"https://football-data.co.uk/mmz4281/9394/all-euro-data-1993-1994.xls", sheet_name=None)
  139. print("Concatenating data for Season 1993")
  140. Season_1993_c = pd.concat(Season_1993, axis=0, ignore_index=True)
  141. print("Concatenating data for Season 1993 completed successfully")
  142. print("Defining list of all seasons")
  143. Season_list = [
  144.     # Season_2020_c,
  145.     Season_2019_c,
  146.     Season_2018_c,
  147.     Season_2017_c,
  148.     Season_2016_c,
  149.     Season_2015_c,
  150.     Season_2014_c,
  151.     Season_2013_c,
  152.     Season_2012_c,
  153.     Season_2011_c,
  154.     Season_2010_c,
  155.     Season_2009_c,
  156.     Season_2008_c,
  157.     Season_2007_c,
  158.     Season_2006_c,
  159.     Season_2005_c,
  160.     Season_2004_c,
  161.     Season_2003_c,
  162.     Season_2002_c,
  163.     Season_2001_c,
  164.     Season_2000_c,
  165.     Season_1999_c,
  166.     Season_1998_c,
  167.     Season_1997_c,
  168.     Season_1996_c,
  169.     Season_1995_c,
  170.     Season_1994_c,
  171.     Season_1993_c,
  172. ]
  173. print("Concatenating all data into one dataframe")
  174. db_concat = pd.concat(Season_list)
  175. print("Saving csv")
  176. db_concat.to_csv(r"C:\Users\harsh\Documents\My Dream\sportsintel.shop\Files\dataset.csv")
  177. print("File Saved")
  178. print("Success")
  179. end = datetime.now()
  180. time_taken = end - start
  181. print('Time taken to complete: ', time_taken)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement