Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import requests
- from bs4 import BeautifulSoup
- import re
class WikiArtHandler:
    """Scrape popular genre and artist names from a WikiArt page.

    The page is downloaded and parsed once, at construction time; the
    ``get_*`` methods only inspect the already-parsed document stored in
    ``self.soup``.
    """

    # Characters on which the raw ``ng-init`` attribute text is tokenised.
    # NOTE(review): '.' is one of the split characters, so a name that
    # contains a period would be broken into pieces - confirm this is
    # acceptable for the data on the page.
    _TOKEN_SPLIT = re.compile('[}{,;".}:]')

    def __init__(self, url='https://www.wikiart.org/ru', timeout=30):
        """Download and parse the page to scrape.

        Args:
            url: Address of the page. Defaults to the page the class was
                originally hard-wired to.
            timeout: Seconds to wait for the server, forwarded to
                ``requests.get`` so a stalled connection cannot block
                forever. Pass ``None`` to wait indefinitely.
        """
        self.page = requests.get(url, timeout=timeout)
        self.soup = BeautifulSoup(self.page.text, 'html.parser')

    def _extract_names(self, container_class, useless_words):
        """Pull the display names out of one container's ``ng-init`` text.

        The attribute text is split on punctuation and every token that
        contains at least one upper-case character is kept, except for the
        tokens listed in ``useless_words``. The final token of the split is
        always ignored. Duplicates are dropped and the order of first
        appearance is kept, so the result is the same on every run.

        Args:
            container_class: Value passed as ``class_`` to ``soup.find``.
            useless_words: Tokens that must never be reported as names.

        Returns:
            A list of unique name strings in order of first appearance.

        Raises:
            AttributeError: If no element with ``container_class`` exists
                in the parsed page.
        """
        container = self.soup.find(class_=container_class)
        if container is None:
            # Same exception type the unguarded attribute access would
            # raise, but with a message that says what is actually missing.
            raise AttributeError(
                'no element with class {!r} found on the page'.format(
                    container_class
                )
            )
        raw = container.get_attribute_list('ng-init')[0]
        tokens = self._TOKEN_SPLIT.split(raw)

        names = []
        # Seeding with the stop words lets one membership test reject both
        # unwanted tokens and names that were already collected.
        seen = set(useless_words)
        for token in tokens[:-1]:
            if token in seen:
                continue
            if any(char.isupper() for char in token):
                seen.add(token)
                names.append(token)
        return names

    def get_genres(self):
        """Return the list of genres.

        The list is also stored on ``self.genre_names`` and printed.
        """
        useless_words = {'Title', 'Url', 'PopularDictionariesViewModel', 'popularDictionariesModel = ','Items', 'GroupTitle', 'TotalViews', 'Стиль'}
        self.genre_names = self._extract_names(
            'popular-dictionaries view-dictionaries-container',
            useless_words,
        )
        print(self.genre_names)
        return self.genre_names

    def get_artists(self):
        """Return the list of artists.

        The list is also stored on ``self.artist_names`` and printed.
        """
        useless_words = {'Title', 'Url', 'PopularArtistsViewModel', 'popularArtistsModel = '}
        self.artist_names = self._extract_names(
            'popular-artists view-dictionaries-container',
            useless_words,
        )
        print(self.artist_names)
        return self.artist_names
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement