Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- #!/bin/env python2
- import requests
- from lxml import html
def main(url, element_id='WitnessSlipTabStrip', timeout=30):
    """Print the text of every tab found in the tab strip at *url*.

    Downloads the page, locates the ``<div>`` whose ``id`` equals
    *element_id*, and prints the text content of each ``<li>`` under a
    ``<ul>`` that is a direct child of that div, one per line.

    Args:
        url: Address of the page to download.
        element_id: ``id`` attribute of the ``<div>`` wrapping the tab list.
        timeout: Seconds to wait for the server before giving up.

    Raises:
        requests.RequestException: If the request fails, times out, or the
            server answers with an HTTP error status.
    """
    # Without a timeout, requests waits forever on an unresponsive server.
    response = requests.get(url, timeout=timeout)
    # Fail loudly on 4xx/5xx instead of silently parsing an error page.
    response.raise_for_status()
    tree = html.fromstring(response.content)
    # Bind the id as an XPath variable so that ids containing quotes cannot
    # break (or alter) the expression.
    ws_tabs = tree.xpath(
        './/div[@id=$element_id]/ul/li',
        element_id=element_id,
    )
    for tab in ws_tabs:
        # Parenthesised single-argument form runs on Python 2 and 3 alike.
        print(tab.text_content())
if __name__ == '__main__':
    # Witness slips for SB1966 HCA1.  The link as originally captured was:
    #   http://my.ilga.gov/Hearing/WitnessSlipInfo/119887?hearingid=17216&LegislationDocumentId=154212&HCommittees5%2F27%2F2019-page=1&committeeid=0&chamber=H&nodays=7&_=1558384770586
    # It used to be assigned to `url` and then immediately overwritten; it is
    # kept here only for reference.  Below is the minimal URL that works.
    url = 'http://my.ilga.gov/Hearing/WitnessSlipInfo/119887?hearingid=17216&LegislationDocumentId=154212'
    main(url)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement