Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- from bs4 import BeautifulSoup
- import requests
- import smtplib
- from email.mime.multipart import MIMEMultipart
- from email.mime.text import MIMEText
- import urllib2
- import time
- from lxml import etree
# Sitemap that lists the store's product URLs; scanned for the wanted product.
SITEMAP_URL = 'http://kithnyc.com/sitemap_products_1.xml?from=60594372&to=9545825095'

# Every one of these substrings must occur in a product URL for it to match.
KEYWORDS = ("marine", "boost", "red")

SMTP_HOST = 'smtp.gmail.com'
SMTP_PORT = 587

# Placeholder account details, kept exactly as in the original script.
# Fill these in before running.
SMTP_USER = "@gmail.com"
SMTP_PASSWORD = "pass"
FROM_ADDR = '@gmail.com'
TO_ADDR = '@gmail.com'

# Selects the inline <script> elements that mention both "Kith" and "variants".
VARIANTS_XPATH = (
    '//script[@type="text/javascript"]'
    '[contains(.,"Kith")][contains(.,"variants")]'
)


def fetch_sitemap_urls(sitemap_url=SITEMAP_URL):
    """Download the sitemap and return the text of every <loc> element."""
    reply = requests.get(sitemap_url)
    soup = BeautifulSoup(reply.text, 'lxml')
    return [loc.text for loc in soup.find_all('loc')]


def find_product_url(urls, keywords=KEYWORDS):
    """Return the first URL containing every keyword, or None.

    Args:
        urls: iterable of URL strings, searched in order.
        keywords: substrings that must all be present in a matching URL.

    Returns:
        The first matching URL, or None when no URL matches (including
        when ``urls`` is empty).
    """
    for url in urls:
        if all(keyword in url for keyword in keywords):
            return url
    return None


def build_link_message(url, from_addr=FROM_ADDR, to_addr=TO_ADDR):
    """Build the multipart/alternative email that announces ``url``.

    The plain-text part is attached first and the HTML part last, because
    mail clients display the last alternative they are able to render.
    """
    # Local import: only this function needs the XML escaping helpers.
    from xml.sax.saxutils import escape, quoteattr

    msg = MIMEMultipart('alternative')
    msg['Subject'] = "Emailing a link"
    msg['From'] = from_addr
    msg['To'] = to_addr

    # quoteattr() returns the value already wrapped in quotes and escaped.
    html = (
        "<html>\n<head></head>\n<body>\n<p>Link:</p>\n"
        "<a href=" + quoteattr(url) + ">" + escape(url) + "</a>\n"
        "</body>\n</html>\n"
    )
    msg.attach(MIMEText(url, 'plain'))
    msg.attach(MIMEText(html, 'html'))
    return msg


def build_variants_message(script_markup, from_addr=FROM_ADDR, to_addr=TO_ADDR):
    """Wrap one serialized <script> element in a plain-text email."""
    msg = MIMEText(script_markup, 'plain')
    msg['Subject'] = "Product variants"
    msg['From'] = from_addr
    msg['To'] = to_addr
    return msg


def send_messages(messages, from_addr=FROM_ADDR, to_addr=TO_ADDR):
    """Send every message over a single authenticated SMTP session.

    Does nothing (and opens no connection) when ``messages`` is empty.
    """
    messages = list(messages)
    if not messages:
        return
    server = smtplib.SMTP(SMTP_HOST, SMTP_PORT)
    try:
        server.starttls()
        server.login(SMTP_USER, SMTP_PASSWORD)
        for message in messages:
            server.sendmail(from_addr, to_addr, message.as_string())
    finally:
        # Always end the session, even if login or sending fails.
        server.quit()


def fetch_variant_scripts(url):
    """Fetch the page at ``url`` and return its matching <script> elements.

    Returns:
        A list with the serialized markup of every element selected by
        VARIANTS_XPATH; empty when the page has none.
    """
    response = urllib2.urlopen(url)
    try:
        tree = etree.parse(response, etree.HTMLParser())
    finally:
        response.close()
    # tostring() emits ASCII bytes by default (non-ASCII characters become
    # character references), so decoding as ASCII yields text safely.
    return [
        etree.tostring(node).decode("ascii")
        for node in tree.xpath(VARIANTS_XPATH)
    ]


def main():
    """Find the product in the sitemap, email its link, then email its variants."""
    print("starting")
    # NOTE: the original comment said the script should keep scraping until
    # the link is found; that polling is not implemented here. A single pass
    # is made, and a missing product stops the script instead of emailing
    # whatever URL happened to be last in the sitemap.
    product_url = find_product_url(fetch_sitemap_urls())
    if product_url is None:
        print("no product URL matched all keywords")
        return
    print(product_url)

    print("found")
    send_messages([build_link_message(product_url)])

    # Second stage: pull the variant data embedded in the product page.
    scripts = fetch_variant_scripts(product_url)
    for markup in scripts:
        print(markup)
    send_messages(build_variants_message(markup) for markup in scripts)


if __name__ == "__main__":
    main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement