Advertisement
Guest User

Untitled

a guest
Apr 21st, 2019
155
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 32.96 KB | None | 0 0
  1. #id, name, type, description, rating, relaxed, sleepy, happy, euphoric, uplifted, focused, tingly, energetic, giggly, hungry, creative, aroused, talkative, stress, headaches, insomnia, pain, lack_of_appetite, cramps, depression, eye_pressure, fatigue, inflammation, muscle_spasms, spasticicity, seizures, dry_mouth, dry_eyes, paranoid, dizzy, nausea, anxious, headache, flavour_1, flavour_2, flavour_3
  2. from bs4 import BeautifulSoup
  3. import glob
  4.  
  5. #TOFIX - NAUSEA IS A GOOD HEALTH THING, NEEDS TO BE SWAPPED AND RE-PARSED
  6. # - No spasticity strains showing up?
  7.  
  8.  
  9. strains = []
  10.  
  11. delimiter = "|"
  12.  
  13. #print("id" + delimiter + "name" + delimiter + "type" + delimiter + "description" + delimiter + "rating" + delimiter + "relaxed" + delimiter + "sleepy" + delimiter + "happy" + delimiter + "euphoric" + delimiter + "uplifted" + delimiter + "focused" + delimiter + "tingly" + delimiter + "energetic" + delimiter + "giggly" + delimiter + "hungry" + delimiter + "creative" + delimiter + "aroused" + delimiter + "talkative" + delimiter + "stress" + delimiter + "headaches" + delimiter + "insomnia" + delimiter + "pain" + delimiter + "lack_of_appetite" + delimiter + "cramps" + delimiter + "depression" + delimiter + "eye_pressure" + delimiter + "fatigue" + delimiter + "inflammation" + delimiter + "muscle_spasms" + delimiter + "spasticicity" + delimiter + "seizures" + delimiter + "dry_mouth" + delimiter + "dry_eyes" + delimiter + "paranoid" + delimiter + "dizzy" + delimiter + "nausea" + delimiter + "anxious" + delimiter + "headache" + delimiter + "flavour_1" + delimiter + "flavour_2" + delimiter + "flavour_3")
  14.  
  15. strain_id = 0
  16.  
  17. for filename in glob.glob('*.html'):
  18. with open(filename, "r", encoding="utf8") as fp:
  19. relaxed = "0"
  20. sleepy = "0"
  21. happy = "0"
  22. euphoric = "0"
  23. uplifted = "0"
  24. focused = "0"
  25. tingly = "0"
  26. energetic = "0"
  27. giggly = "0"
  28. hungry = "0"
  29. creative = "0"
  30. aroused = "0"
  31. talkative = "0"
  32. stress = "0"
  33. headaches = "0"
  34. insomnia = "0"
  35. pain = "0"
  36. lack_of_appetite = "0"
  37. cramps = "0"
  38. depression = "0"
  39. eye_pressure = "0"
  40. fatigue = "0"
  41. inflammation = "0"
  42. muscle_spasms = "0"
  43. spasticicity = "0"
  44. seizures = "0"
  45. dry_mouth = "0"
  46. dry_eyes = "0"
  47. paranoid = "0"
  48. dizzy = "0"
  49. nausea = "0"
  50. anxious = "0"
  51. headache = "0"
  52.  
  53. strain_id += 1
  54. csv = ""
  55. soup = BeautifulSoup(fp, "lxml")
  56. desc_divs = soup.findAll("p")
  57. attr_div_labels = soup.findAll("div", {"class": "histogram-label"})
  58. attr_divs = soup.findAll("div", {"class": "histogram-item"})
  59. flav_divs = soup.findAll("div", {"class": "flavor-name"})
  60. csv += str(strain_id) + delimiter # id
  61. print(soup.find_all('span')[8].text)
  62. csv += soup.find_all('span')[8].text + delimiter # Name
  63. csv += soup.find_all('span')[7].text + delimiter # Type
  64. try:
  65. csv += (desc_divs[5].text).strip() + delimiter # Description
  66. except IndexError:
  67. print("No description!")
  68. csv += "This strain doesn't have a description - think you can help us?" + delimiter
  69. csv += soup.find_all('span')[9].text[0:3] + delimiter # Rating / 5
  70.  
  71.  
  72. # Check and set properties
  73.  
  74. try:
  75. if (attr_div_labels[0].text == "Relaxed"):
  76. relaxed = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  77. if (attr_div_labels[0].text == "Sleepy"):
  78. sleepy = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  79. if (attr_div_labels[0].text == "Happy"):
  80. happy = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  81. if (attr_div_labels[0].text == "Euphoric"):
  82. euphoric = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  83. if (attr_div_labels[0].text == "Uplifted"):
  84. uplifted = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  85. if (attr_div_labels[0].text == "Energetic"):
  86. energetic = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  87. if (attr_div_labels[0].text == "Focused"):
  88. focused = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  89. if (attr_div_labels[0].text == "Tingly"):
  90. tingly = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  91. if (attr_div_labels[0].text == "Giggly"):
  92. giggly = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  93. if (attr_div_labels[0].text == "Hungry"):
  94. hungry = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  95. if (attr_div_labels[0].text == "Creative"):
  96. creative = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  97. if (attr_div_labels[0].text == "Talkative"):
  98. talkative = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  99. if (attr_div_labels[0].text == "Aroused"):
  100. aroused = attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]
  101. except IndexError:
  102. print("(IndexError) Couldn't find effect")
  103.  
  104. try:
  105. if (attr_div_labels[1].text == "Relaxed"):
  106. relaxed = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  107. if (attr_div_labels[1].text == "Sleepy"):
  108. sleepy = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  109. if (attr_div_labels[1].text == "Happy"):
  110. happy = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  111. if (attr_div_labels[1].text == "Euphoric"):
  112. euphoric = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  113. if (attr_div_labels[1].text == "Uplifted"):
  114. uplifted = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  115. if (attr_div_labels[1].text == "Energetic"):
  116. energetic = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  117. if (attr_div_labels[1].text == "Focused"):
  118. focused = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  119. if (attr_div_labels[1].text == "Tingly"):
  120. tingly = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  121. if (attr_div_labels[1].text == "Giggly"):
  122. giggly = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  123. if (attr_div_labels[1].text == "Hungry"):
  124. hungry = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  125. if (attr_div_labels[1].text == "Creative"):
  126. creative = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  127. if (attr_div_labels[1].text == "Talkative"):
  128. talkative = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  129. if (attr_div_labels[1].text == "Aroused"):
  130. aroused = attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]
  131. except IndexError:
  132. print("(IndexError) Couldn't find effect")
  133.  
  134. try:
  135. if (attr_div_labels[2].text == "Relaxed"):
  136. relaxed = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  137. if (attr_div_labels[2].text == "Sleepy"):
  138. sleepy = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  139. if (attr_div_labels[2].text == "Happy"):
  140. happy = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  141. if (attr_div_labels[2].text == "Euphoric"):
  142. euphoric = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  143. if (attr_div_labels[2].text == "Uplifted"):
  144. uplifted = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  145. if (attr_div_labels[2].text == "Energetic"):
  146. energetic = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  147. if (attr_div_labels[2].text == "Focused"):
  148. focused = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  149. if (attr_div_labels[2].text == "Tingly"):
  150. tingly = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  151. if (attr_div_labels[2].text == "Giggly"):
  152. giggly = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  153. if (attr_div_labels[2].text == "Hungry"):
  154. hungry = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  155. if (attr_div_labels[2].text == "Creative"):
  156. creative = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  157. if (attr_div_labels[2].text == "Talkative"):
  158. talkative = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  159. if (attr_div_labels[2].text == "Aroused"):
  160. aroused = attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]
  161. except IndexError:
  162. print("(IndexError) Couldn't find effect")
  163.  
  164. try:
  165. if (attr_div_labels[3].text == "Relaxed"):
  166. relaxed = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  167. if (attr_div_labels[3].text == "Sleepy"):
  168. sleepy = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  169. if (attr_div_labels[3].text == "Happy"):
  170. happy = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  171. if (attr_div_labels[3].text == "Euphoric"):
  172. euphoric = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  173. if (attr_div_labels[3].text == "Uplifted"):
  174. uplifted = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  175. if (attr_div_labels[3].text == "Energetic"):
  176. energetic = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  177. if (attr_div_labels[3].text == "Focused"):
  178. focused = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  179. if (attr_div_labels[3].text == "Tingly"):
  180. tingly = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  181. if (attr_div_labels[3].text == "Giggly"):
  182. giggly = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  183. if (attr_div_labels[3].text == "Hungry"):
  184. hungry = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  185. if (attr_div_labels[3].text == "Creative"):
  186. creative = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  187. if (attr_div_labels[3].text == "Talkative"):
  188. talkative = attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]
  189. except IndexError:
  190. print("(IndexError) Couldn't find effect")
  191.  
  192. try:
  193. if (attr_div_labels[4].text == "Relaxed"):
  194. relaxed = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  195. if (attr_div_labels[4].text == "Sleepy"):
  196. sleepy = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  197. if (attr_div_labels[4].text == "Happy"):
  198. happy = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  199. if (attr_div_labels[4].text == "Euphoric"):
  200. euphoric = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  201. if (attr_div_labels[4].text == "Uplifted"):
  202. uplifted = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  203. if (attr_div_labels[4].text == "Energetic"):
  204. energetic = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  205. if (attr_div_labels[4].text == "Focused"):
  206. focused = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  207. if (attr_div_labels[4].text == "Tingly"):
  208. tingly = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  209. if (attr_div_labels[4].text == "Giggly"):
  210. giggly = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  211. if (attr_div_labels[4].text == "Hungry"):
  212. hungry = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  213. if (attr_div_labels[4].text == "Creative"):
  214. creative = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  215. if (attr_div_labels[4].text == "Talkative"):
  216. talkative = attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]
  217. except IndexError:
  218. print("(IndexError) Couldn't find effect")
  219.  
  220. try:
  221. if (attr_div_labels[5].text == "Stress"):
  222. stress = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  223. if (attr_div_labels[5].text == "Insomnia"):
  224. insomnia = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  225. if (attr_div_labels[5].text == "Pain"):
  226. pain = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  227. if (attr_div_labels[5].text == "Lack of Appetite"):
  228. lack_of_appetite = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  229. if (attr_div_labels[5].text == "Cramps"):
  230. cramps = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  231. if (attr_div_labels[5].text == "Headaches"):
  232. headaches = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  233. if (attr_div_labels[5].text == "Depression"):
  234. depression = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  235. if (attr_div_labels[5].text == "Eye Pressure"):
  236. eye_pressure = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  237. if (attr_div_labels[5].text == "Spasticity"):
  238. spasticity = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  239. if (attr_div_labels[5].text == "Seizures"):
  240. seizures = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  241. if (attr_div_labels[5].text == "Fatigue"):
  242. fatigue = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  243. if (attr_div_labels[5].text == "Inflammation"):
  244. inflammation = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  245. if (attr_div_labels[5].text == "Muscle Spasms"):
  246. muscle_spasms = attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]
  247. except IndexError:
  248. print("Unable to find medical effect")
  249.  
  250. try:
  251. if (attr_div_labels[6].text == "Stress"):
  252. stress = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  253. if (attr_div_labels[6].text == "Insomnia"):
  254. insomnia = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  255. if (attr_div_labels[6].text == "Pain"):
  256. pain = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  257. if (attr_div_labels[6].text == "Lack of Appetite"):
  258. lack_of_appetite = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  259. if (attr_div_labels[6].text == "Cramps"):
  260. cramps = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  261. if (attr_div_labels[6].text == "Headaches"):
  262. headaches = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  263. if (attr_div_labels[6].text == "Depression"):
  264. depression = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  265. if (attr_div_labels[6].text == "Eye Pressure"):
  266. eye_pressure = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  267. if (attr_div_labels[6].text == "Spasticity"):
  268. spasticity = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  269. if (attr_div_labels[6].text == "Seizures"):
  270. seizures = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  271. if (attr_div_labels[6].text == "Fatigue"):
  272. fatigue = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  273. if (attr_div_labels[6].text == "Inflammation"):
  274. inflammation = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  275. if (attr_div_labels[6].text == "Muscle Spasms"):
  276. muscle_spasms = attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]
  277. except IndexError:
  278. print("Unable to find medical effect")
  279.  
  280. try:
  281. if (attr_div_labels[7].text == "Stress"):
  282. stress = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  283. if (attr_div_labels[7].text == "Insomnia"):
  284. insomnia = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  285. if (attr_div_labels[7].text == "Pain"):
  286. pain = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  287. if (attr_div_labels[7].text == "Lack of Appetite"):
  288. lack_of_appetite = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  289. if (attr_div_labels[7].text == "Cramps"):
  290. cramps = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  291. if (attr_div_labels[7].text == "Headaches"):
  292. headaches = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  293. if (attr_div_labels[7].text == "Depression"):
  294. depression = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  295. if (attr_div_labels[7].text == "Eye Pressure"):
  296. eye_pressure = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  297. if (attr_div_labels[7].text == "Spasticity"):
  298. spasticity = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  299. if (attr_div_labels[7].text == "Seizures"):
  300. seizures = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  301. if (attr_div_labels[7].text == "Fatigue"):
  302. fatigue = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  303. if (attr_div_labels[7].text == "Inflammation"):
  304. inflammation = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  305. if (attr_div_labels[7].text == "Muscle Spasms"):
  306. muscle_spasms = attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]
  307. except IndexError:
  308. print("Unable to find medical effect")
  309.  
  310. try:
  311. if (attr_div_labels[8].text == "Stress"):
  312. stress = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  313. if (attr_div_labels[8].text == "Insomnia"):
  314. insomnia = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  315. if (attr_div_labels[8].text == "Pain"):
  316. pain = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  317. if (attr_div_labels[8].text == "Lack of Appetite"):
  318. lack_of_appetite = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  319. if (attr_div_labels[8].text == "Cramps"):
  320. cramps = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  321. if (attr_div_labels[8].text == "Headaches"):
  322. headaches = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  323. if (attr_div_labels[8].text == "Depression"):
  324. depression = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  325. if (attr_div_labels[8].text == "Eye Pressure"):
  326. eye_pressure = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  327. if (attr_div_labels[8].text == "Spasticity"):
  328. spasticity = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  329. if (attr_div_labels[8].text == "Seizures"):
  330. seizures = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  331. if (attr_div_labels[8].text == "Fatigue"):
  332. fatigue = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  333. if (attr_div_labels[8].text == "Inflammation"):
  334. inflammation = attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]
  335. if (attr_div_labels[8].text == "Muscle Spasms"):
  336. muscle_spasms = attr_divs[8]['style'][6:len(attr_divs[9]['style'])-1]
  337. except IndexError:
  338. print("Unable to find medical effect")
  339.  
  340. try:
  341. if (attr_div_labels[9].text == "Stress"):
  342. stress = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  343. if (attr_div_labels[9].text == "Insomnia"):
  344. insomnia = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  345. if (attr_div_labels[9].text == "Pain"):
  346. pain = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  347. if (attr_div_labels[9].text == "Lack of Appetite"):
  348. lack_of_appetite = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  349. if (attr_div_labels[9].text == "Cramps"):
  350. cramps = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  351. if (attr_div_labels[9].text == "Headaches"):
  352. headaches = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  353. if (attr_div_labels[9].text == "Depression"):
  354. depression = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  355. if (attr_div_labels[9].text == "Eye Pressure"):
  356. eye_pressure = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  357. if (attr_div_labels[9].text == "Spasticity"):
  358. spasticity = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  359. if (attr_div_labels[9].text == "Seizures"):
  360. seizures = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  361. if (attr_div_labels[9].text == "Fatigue"):
  362. fatigue = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  363. if (attr_div_labels[9].text == "Inflammation"):
  364. inflammation = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  365. if (attr_div_labels[9].text == "Muscle Spasms"):
  366. muscle_spasms = attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]
  367. except IndexError:
  368. print("Unable to find medical effect")
  369.  
  370. try:
  371. if (attr_div_labels[10].text == "Dry Mouth"):
  372. dry_mouth = attr_divs[10]['style'][6:len(attr_divs[10]['style'])-1]
  373. if (attr_div_labels[10].text == "Dry Eyes"):
  374. dry_eyes = attr_divs[10]['style'][6:len(attr_divs[10]['style'])-1]
  375. if (attr_div_labels[10].text == "Paranoid"):
  376. paranoid = attr_divs[10]['style'][6:len(attr_divs[10]['style'])-1]
  377. if (attr_div_labels[10].text == "Dizzy"):
  378. dizzy = attr_divs[10]['style'][6:len(attr_divs[10]['style'])-1]
  379. if (attr_div_labels[10].text == "Headache"):
  380. headache = attr_divs[10]['style'][6:len(attr_divs[10]['style'])-1]
  381. if (attr_div_labels[10].text == "Nausea"):
  382. nausea = attr_divs[10]['style'][6:len(attr_divs[10]['style'])-1]
  383. if (attr_div_labels[10].text == "Anxious"):
  384. anxious = attr_divs[10]['style'][6:len(attr_divs[10]['style'])-1]
  385. except IndexError:
  386. print("Unable to find bad effect")
  387.  
  388. try:
  389. if (attr_div_labels[11].text == "Dry Mouth"):
  390. dry_mouth = attr_divs[11]['style'][6:len(attr_divs[11]['style'])-1]
  391. if (attr_div_labels[11].text == "Dry Eyes"):
  392. dry_eyes = attr_divs[11]['style'][6:len(attr_divs[11]['style'])-1]
  393. if (attr_div_labels[11].text == "Paranoid"):
  394. paranoid = attr_divs[11]['style'][6:len(attr_divs[11]['style'])-1]
  395. if (attr_div_labels[11].text == "Dizzy"):
  396. dizzy = attr_divs[11]['style'][6:len(attr_divs[11]['style'])-1]
  397. if (attr_div_labels[11].text == "Headache"):
  398. headache = attr_divs[11]['style'][6:len(attr_divs[11]['style'])-1]
  399. if (attr_div_labels[11].text == "Nausea"):
  400. nausea = attr_divs[11]['style'][6:len(attr_divs[11]['style'])-1]
  401. if (attr_div_labels[11].text == "Anxious"):
  402. anxious = attr_divs[11]['style'][6:len(attr_divs[11]['style'])-1]
  403. except IndexError:
  404. print("Unable to find bad effect")
  405.  
  406. try:
  407. if (attr_div_labels[12].text == "Dry Mouth"):
  408. dry_mouth = attr_divs[12]['style'][6:len(attr_divs[12]['style'])-1]
  409. if (attr_div_labels[12].text == "Dry Eyes"):
  410. dry_eyes = attr_divs[12]['style'][6:len(attr_divs[12]['style'])-1]
  411. if (attr_div_labels[12].text == "Paranoid"):
  412. paranoid = attr_divs[12]['style'][6:len(attr_divs[12]['style'])-1]
  413. if (attr_div_labels[12].text == "Dizzy"):
  414. dizzy = attr_divs[12]['style'][6:len(attr_divs[12]['style'])-1]
  415. if (attr_div_labels[12].text == "Headache"):
  416. headache = attr_divs[12]['style'][6:len(attr_divs[12]['style'])-1]
  417. if (attr_div_labels[12].text == "Nausea"):
  418. nausea = attr_divs[12]['style'][6:len(attr_divs[12]['style'])-1]
  419. if (attr_div_labels[12].text == "Anxious"):
  420. anxious = attr_divs[12]['style'][6:len(attr_divs[12]['style'])-1]
  421. except IndexError:
  422. print("Unable to find bad effect")
  423.  
  424. try:
  425. if (attr_div_labels[13].text == "Dry Mouth"):
  426. dry_mouth = attr_divs[13]['style'][6:len(attr_divs[13]['style'])-1]
  427. if (attr_div_labels[13].text == "Dry Eyes"):
  428. dry_eyes = attr_divs[13]['style'][6:len(attr_divs[13]['style'])-1]
  429. if (attr_div_labels[13].text == "Paranoid"):
  430. paranoid = attr_divs[13]['style'][6:len(attr_divs[13]['style'])-1]
  431. if (attr_div_labels[13].text == "Dizzy"):
  432. dizzy = attr_divs[13]['style'][6:len(attr_divs[13]['style'])-1]
  433. if (attr_div_labels[13].text == "Headache"):
  434. headache = attr_divs[13]['style'][6:len(attr_divs[13]['style'])-1]
  435. if (attr_div_labels[13].text == "Nausea"):
  436. nausea = attr_divs[13]['style'][6:len(attr_divs[13]['style'])-1]
  437. if (attr_div_labels[13].text == "Anxious"):
  438. anxious = attr_divs[13]['style'][6:len(attr_divs[13]['style'])-1]
  439. except IndexError:
  440. print("Unable to find bad effect")
  441.  
  442. try:
  443. if (attr_div_labels[14].text == "Dry Mouth"):
  444. dry_mouth = attr_divs[14]['style'][6:len(attr_divs[14]['style'])-1]
  445. if (attr_div_labels[14].text == "Dry Eyes"):
  446. dry_eyes = attr_divs[14]['style'][6:len(attr_divs[14]['style'])-1]
  447. if (attr_div_labels[14].text == "Paranoid"):
  448. paranoid = attr_divs[14]['style'][6:len(attr_divs[14]['style'])-1]
  449. if (attr_div_labels[14].text == "Dizzy"):
  450. dizzy = attr_divs[14]['style'][6:len(attr_divs[14]['style'])-1]
  451. if (attr_div_labels[14].text == "Headache"):
  452. headache = attr_divs[14]['style'][6:len(attr_divs[14]['style'])-1]
  453. if (attr_div_labels[14].text == "Nausea"):
  454. nausea = attr_divs[14]['style'][6:len(attr_divs[14]['style'])-1]
  455. if (attr_div_labels[14].text == "Anxious"):
  456. anxious = attr_divs[14]['style'][6:len(attr_divs[14]['style'])-1]
  457. except IndexError:
  458. print("Unable to find bad effect")
  459.  
  460. # Add properties to csv
  461.  
  462. csv += relaxed + delimiter
  463. csv += sleepy + delimiter
  464. csv += happy + delimiter
  465. csv += euphoric + delimiter
  466. csv += uplifted + delimiter
  467. csv += focused + delimiter
  468. csv += tingly + delimiter
  469. csv += energetic + delimiter
  470. csv += giggly + delimiter
  471. csv += hungry + delimiter
  472. csv += creative + delimiter
  473. csv += aroused + delimiter
  474. csv += talkative + delimiter
  475. csv += stress + delimiter
  476. csv += headaches + delimiter
  477. csv += insomnia + delimiter
  478. csv += pain + delimiter
  479. csv += lack_of_appetite + delimiter
  480. csv += cramps + delimiter
  481. csv += depression + delimiter
  482. csv += eye_pressure + delimiter
  483. csv += fatigue + delimiter
  484. csv += inflammation + delimiter
  485. csv += muscle_spasms + delimiter
  486. csv += spasticicity + delimiter
  487. csv += seizures + delimiter
  488. csv += dry_mouth + delimiter
  489. csv += dry_eyes + delimiter
  490. csv += paranoid + delimiter
  491. csv += dizzy + delimiter
  492. csv += nausea + delimiter
  493. csv += anxious + delimiter
  494. csv += headache + delimiter
  495.  
  496.  
  497. try:
  498. csv += flav_divs[0].text[3:len(flav_divs[0].text)] + delimiter # Flavour 1
  499. except IndexError:
  500. csv += "N/A" + delimiter
  501.  
  502. try:
  503. csv += flav_divs[1].text[3:len(flav_divs[1].text)] + delimiter # Flavour 2
  504. except IndexError:
  505. csv += "N/A" + delimiter
  506.  
  507. try:
  508. csv += flav_divs[2].text[3:len(flav_divs[2].text)] # Flavour 3
  509. except IndexError:
  510. csv += "N/A"
  511.  
  512. strains.append(csv)
  513.  
  514. print("Finished parsing - will now start writing to file!")
  515.  
  516. out_file = open("finished.csv", 'w', encoding="utf8")
  517.  
  518. for csv in strains:
  519. out_file.write(csv + "\n")
  520.  
  521. print("Done!")
  522.  
  523. out_file.close()
  524.  
  525.  
  526. ##try:
  527. ## print(attr_div_labels[0].text) # Effect 1
  528. ## print(attr_divs[0]['style'][6:len(attr_divs[0]['style'])-1]) # Effect 1 score /100
  529. ##except IndexError:
  530. ## print("(IndexError) Couldn't find effect")
  531. ##
  532. ##try:
  533. ## print(attr_div_labels[1].text) # Effect 2
  534. ## print(attr_divs[1]['style'][6:len(attr_divs[1]['style'])-1]) # Effect 2 score /100
  535. ##except IndexError:
  536. ## print("(IndexError) Couldn't find effect")
  537. ##
  538. ##try:
  539. ## print(attr_div_labels[2].text) # Effect 3
  540. ## print(attr_divs[2]['style'][6:len(attr_divs[2]['style'])-1]) # Effect 3 score /100
  541. ##except IndexError:
  542. ## print("(IndexError) Couldn't find effect")
  543. ##
  544. ##try:
  545. ## print(attr_div_labels[3].text) # Effect 4
  546. ## print(attr_divs[3]['style'][6:len(attr_divs[3]['style'])-1]) # Effect 4 score /100
  547. ##except IndexError:
  548. ## print("(IndexError) Couldn't find effect")
  549. ##
  550. ##try:
  551. ## print(attr_div_labels[4].text) # Effect 5
  552. ## print(attr_divs[4]['style'][6:len(attr_divs[4]['style'])-1]) # Effect 5 score /100
  553. ##except IndexError:
  554. ## print("(IndexError) Couldn't find effect")
  555. ##
  556. ##try:
  557. ## print(attr_div_labels[5].text) # Medical Effect 1
  558. ## print(attr_divs[5]['style'][6:len(attr_divs[5]['style'])-1]) # Medical 1 score /100
  559. ##except IndexError:
  560. ## print("(IndexError) Couldn't find medical effect")
  561. ##
  562. ##try:
  563. ## print(attr_div_labels[6].text) # Medical Effect 2
  564. ## print(attr_divs[6]['style'][6:len(attr_divs[6]['style'])-1]) # Medical 2 score /100
  565. ##except IndexError:
  566. ## print("(IndexError) Couldn't find medical effect")
  567. ##
  568. ##try:
  569. ## print(attr_div_labels[7].text) # Medical Effect 3
  570. ## print(attr_divs[7]['style'][6:len(attr_divs[7]['style'])-1]) # Medical 3 score /100
  571. ##except IndexError:
  572. ## print("(IndexError) Couldn't find medical effect")
  573. ##
  574. ##try:
  575. ## print(attr_div_labels[8].text) # Medical Effect 4
  576. ## print(attr_divs[8]['style'][6:len(attr_divs[8]['style'])-1]) # Medical 4 score /100
  577. ##except IndexError:
  578. ## print("(IndexError) Couldn't find medical effect")
  579. ##
  580. ##try:
  581. ## print(attr_div_labels[9].text) # Medical Effect 5
  582. ## print(attr_divs[9]['style'][6:len(attr_divs[9]['style'])-1]) # Medical 5 score /100
  583. ##except IndexError:
  584. ## print("(IndexError) Couldn't find medical effect")
  585. ##
  586. ##try:
  587. ## print(attr_div_labels[10].text) # Negative Effect 1
  588. ## print(attr_divs[10]['style'][6:len(attr_divs[10]['style'])-1]) # Negative 1 score /100
  589. ##except IndexError:
  590. ## print("(IndexError) Couldn't find negative effect")
  591. ##
  592. ##try:
  593. ## print(attr_div_labels[11].text) # Negative Effect 2
  594. ## print(attr_divs[11]['style'][6:len(attr_divs[11]['style'])-1]) # Negative 2 score /100
  595. ##except IndexError:
  596. ## print("(IndexError) Couldn't find negative effect")
  597. ##
  598. ##try:
  599. ## print(attr_div_labels[12].text) # Negative Effect 3
  600. ## print(attr_divs[12]['style'][6:len(attr_divs[12]['style'])-1]) # Negative 3 score /100
  601. ##except IndexError:
  602. ## print("(IndexError) Couldn't find negative effect")
  603. ##
  604. ##try:
  605. ## print(attr_div_labels[13].text) # Negative Effect 4
  606. ## print(attr_divs[13]['style'][6:len(attr_divs[13]['style'])-1]) # Negative 4 score /100
  607. ##except IndexError:
  608. ## print("(IndexError) Couldn't find negative effect")
  609. ##
  610. ##try:
  611. ## print(attr_div_labels[14].text) # Negative Effect 5
  612. ## print(attr_divs[14]['style'][6:len(attr_divs[14]['style'])-1]) # Negative 5 score /100
  613. ##except IndexError:
  614. ## print("(IndexError) Couldn't find negative effect")
  615. ##
  616. ##try:
  617. ## print(flav_divs[0].text[3:len(flav_divs[0].text)]) # Flavour 1
  618. ##except IndexError:
  619. ## print("(IndexError) Couldn't find flavour")
  620. ##
  621. ##try:
  622. ## print(flav_divs[1].text[3:len(flav_divs[1].text)]) # Flavour 2
  623. ##except IndexError:
  624. ## print("(IndexError) Couldn't find flavour")
  625. ##
  626. ##try:
  627. ## print(flav_divs[2].text[3:len(flav_divs[2].text)]) # Flavour 3
  628. ##except IndexError:
  629. ## print("(IndexError) Couldn't find flavour")
  630. ##
  631. ##
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement