# Untitled

import requests
from bs4 import BeautifulSoup
import re

# Address of the page whose links are scraped below.
SOURCE_URL = '<some url>'

# requests waits indefinitely by default; an explicit timeout keeps the
# script from hanging forever on an unresponsive server.
r = requests.get(SOURCE_URL, timeout=30)

# The body is decoded as Shift_JIS explicitly rather than relying on
# encoding detection.  errors='replace' substitutes U+FFFD for any byte
# sequence the codec cannot decode instead of aborting the whole run.
soup = BeautifulSoup(
    str(r.content, encoding='shift_jis', errors='replace'),
    'lxml',
)


# Regex applied to a link's text; matches "<digits>: <title> (<digits>)"
# anchored at the start of the text.
#   group 1 - the digits before the colon
#   group 2 - the title; greedy, so it runs up to the last
#             "<whitespace>(<digits>)" on the line
#   group 3 - the digits inside that trailing pair of parentheses
pattern = r'^(\d+):\s(.+)\s\((\d+)\)'


def thread_id(key):
    """Return *key* with every ``/l<digits>`` fragment removed.

    For example ``'1234567890/l50'`` becomes ``'1234567890'``.

    Args:
        key: The string to clean (the caller passes a link's ``href``),
            or ``None`` when no value is available.

    Returns:
        The cleaned string, or ``None`` if *key* is ``None``.
    """
    # A missing attribute is reported as None by the caller's lookup;
    # pass it through instead of letting re.sub raise TypeError.
    if key is None:
        return None
    return re.sub(r'/l\d+', '', key)


def parse_title(a):
    """Extract the numbered-title fields from a link element.

    Args:
        a: An object exposing ``.text`` and ``.get('href')``; in this
            script, an ``<a>`` tag yielded by ``soup.find_all('a')``.

    Returns:
        ``None`` when the link text does not match ``pattern``.
        Otherwise a dict with:
            ``num``     - the leading number as an int,
            ``title``   - the title text,
            ``res``     - the number in the trailing parentheses as an int,
            ``url_key`` - the ``href`` passed through ``thread_id``, or
                          ``None`` when the element has no ``href``.
    """
    match = re.search(pattern, a.text)
    if match is None:
        return None

    # .get() returns None for an element without an href; skip the
    # thread_id() call in that case so a link lacking the attribute does
    # not raise TypeError inside re.sub.
    href = a.get('href')
    url_key = thread_id(href) if href is not None else None

    return {
        'num': int(match.group(1)),
        'title': match.group(2),
        'res': int(match.group(3)),
        'url_key': url_key,
    }


# Parse every anchor on the page and print the ones that yielded data.
# map() and filter() are lazy, so each link is still parsed and printed
# in document order, one at a time.
for th_data in filter(None, map(parse_title, soup.find_all('a'))):
    print(th_data)