Advertisement
sowamaciej

Untitled

Jun 3rd, 2018
89
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.78 KB | None | 0 0
  1. import re
  2.  
  3. try:
  4. with open('page1.html', encoding='utf8') as infile:
  5. data = infile.read()
  6. except FileNotFoundError:
  7. exit()
  8. try:
  9. with open('page2.html', encoding='utf8') as infile:
  10. data = infile.read()
  11. except FileNotFoundError:
  12. print('Error')
  13. exit()
  14.  
  15. file = re.findall('(<tr.*?\/tr>)', data)
  16. nick = re.findall('/users\/(.*?)">(.*?)<\/a>', data)
  17. results = re.findall('(?<=submissions">).*?(?=<\/font>)|>-<', data)
  18. size = len(results)/len(nick)
  19. results = [result.replace('.', ',') for result in results]
  20. results = [result.replace('>-<', '0,0') for result in results]
  21. i=0
  22. j=0
  23. for key, value in nick:
  24. print('"'+key+'","'+value+'"', end='')
  25. j=j+1
  26. while i<size*j:
  27. print(',"'+results[i]+'"', end='')
  28. i=i+1
  29. print()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement