Advertisement
Guest User

Untitled

a guest
Jul 20th, 2017
66
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.93 KB | None | 0 0
  1. "~/folder/file.htm"
  2.  
  3. "../../folder/file.htm"
  4.  
  5. var parser = new HtmlParser();
  6. // Demo: resolve every link href found in a sample HTML document against a base URL (siteBaseUrl).
  7. var siteBase = "https://mail.ru/mail/something/etc/";
  8. var siteBaseUrl = new Url(siteBase);
  9.  
  10. // The document would be downloaded from siteBase; this is a stub - just a sample of the received HTML
  11.  
  12. var document = parser.Parse(@"<body>
  13. <div class='product'>
  14. <a href='/url1.html'><img src='img1.jpg' alt=''></a>
  15. Hello, world
  16. <div class='comments-likes'>1</div>
  17. </div>
  18. <div class='footer'>
  19. <a href='../../folder/file.htm'>link</a>
  20. </div>
  21. </body>");
  22. // For each <a> element: dump the raw href value, then the href resolved against siteBaseUrl.
  23. var links = document.QuerySelectorAll("a");
  24. foreach (var link in links)
  25. {
  26. var url = link.GetAttribute("href"); // NOTE(review): presumably null when an anchor has no href - confirm Url handles that
  27. url.Dump();
  28. var urlFull = new Url(siteBaseUrl, url);
  29. //urlFull.Dump();
  30. urlFull.Href.Dump();
  31. }
  32.  
  33. /url1.html
  34. https://mail.ru/url1.html
  35. ../../folder/file.htm
  36. https://mail.ru/mail/folder/file.htm
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement