Advertisement
ZeekoSec

html crawler

Jan 26th, 2016
445
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 27.64 KB | None | 0 0
  1.  
  2. html = ('''
  3.  
  4.  
  5. <!DOCTYPE HTML>
  6. <!--[if lt IE 7 ]> <html class="no-js ie6" lang="da-DK"> <![endif]-->
  7. <!--[if IE 7 ]>    <html class="no-js ie7" lang="da-DK"> <![endif]-->
  8. <!--[if IE 8 ]>    <html class="no-js ie8" lang="da-DK"> <![endif]-->
  9. <!--[if IE 9 ]>    <html class="no-js ie9" lang="da-DK"> <![endif]-->
  10. <!--[if (gte IE 9)|!(IE)]><!--> <html class="no-js wf-loading" lang="da_DK"> <!--<![endif]-->
  11. <head>
  12.    <meta charset="ISO-8859-1">
  13.    <meta name="viewport" content="width=device-width, initial-scale=1, maximum-scale=1" />
  14.    <meta name="apple-mobile-web-app-capable" content="yes" />
  15.    <link href="//fonts.googleapis.com" rel="dns-prefetch">
  16.  
  17.    <script type="text/javascript">
  18.        WebFontConfig = {
  19.            google: { families: [ 'Open+Sans+Condensed:300,700,300italic:latin','Open+Sans:300,700,300italic:latin' ] }
  20.        };
  21.  
  22.        (function() {
  23.            var wf = document.createElement('script');
  24.            wf.src = ('https:' == document.location.protocol ? 'https' : 'http') +
  25.            '://ajax.googleapis.com/ajax/libs/webfont/1/webfont.js';
  26.            wf.type = 'text/javascript';
  27.            wf.async = 'true';
  28.            var s = document.getElementsByTagName('script')[0];
  29.            s.parentNode.insertBefore(wf, s);
  30.        })();
  31.    </script>
  32.  
  33.            <title>Cold Hand Winery - Prisvindende frugtvin</title>
  34.        <meta http-equiv="content-type" content="text/html; charset=iso-8859-1">
  35.        <!-- Metatags -->
  36.        <meta name="modified" content="11-03-2014 10:06:25">
  37.        <meta name="generator" content="Aviva Content Management (www.aviva.dk)">
  38.        <meta name="webbureauet" content="Webbureauet Infoserv ApS (www.infoserv.dk)">
  39.        <meta name="hardlink" content="default.asp&amp;page_id=2">
  40.        <meta http-equiv="Content-Language" content="DK">
  41.        <meta name="robots" content="index,follow">
  42.        <!-- Base -->
  43.        <base href="http://www.coldhandwinery.dk/">
  44.  
  45.  
  46.  
  47.    <link rel="stylesheet" type="text/css" href="templates/responsiv3/scripts/stylesheet.css?v=1">
  48.  
  49. <!-- LESS Javascript compiler -->
  50. <!--
  51.    <link rel="stylesheet/less" type="text/css" href="templates/responsiv3/scripts/bootstrap/less/bootstrap.less">
  52.    <link rel="stylesheet/less" type="text/css" href="templates/responsiv3/scripts/bootstrap/less/responsive.less">
  53.    <link rel="stylesheet/less" type="text/css" href="templates/responsiv3/less/stylesheet.less?05092013-1003">
  54.    <script type="text/javascript">less = { env: "development", dumpLineNumbers: "mediaquery" };</script>
  55.    <script src="templates/responsiv3/scripts/less.js"></script>
  56. -->
  57.    <link
  58.        rel="alternate"
  59.        href="http://www.coldhandwinery.dk/rss_news.asp?page_id=2"
  60.        title="News feed"
  61.        type="application/rss+xml">
  62.    <link
  63.        rel="alternate"
  64.        href="http://www.coldhandwinery.dk/rss_pages.asp?page_id=2"
  65.        title="Page update feed"
  66.        type="application/rss+xml">
  67.  
  68.    <!-- blasted ie -->
  69.    <!--[if (lt IE 9) & (!IEMobile)]>
  70.        <script src="//html5shiv.googlecode.com/svn/trunk/html5.js"></script>
  71.        <script src="templates/responsiv3/scripts/DOMAssistant-2.8.1.js"></script>
  72.        <script src="templates/responsiv3/scripts/selectivizr-min.js"></script>
  73.    <![endif]-->
  74.  
  75.    <script src="http://code.jquery.com/jquery.js"></script>
  76.    <script src="templates/responsiv3/scripts/modernizr.foundation.js"></script>
  77.  
  78.    
  79.  
  80. </head>
  81.  
  82. <body id="default" class="forside">
  83.    <div id="site-actions" class="hidden-phone">
  84.  
  85.  
  86. <a target="_blank" href="http://shop.coldhandwinery.dk/da/3-online-shop" class="shop"></a>
  87.  <a href="http://eepurl.com/XahwT" class="newsletter" target="_blank"></a>
  88.  
  89.  
  90. </div>
  91.  
  92.    <div class="container">
  93.    
  94.        <div id="top-site-actions" class="hidden-phone">
  95.            <a target="_blank" href="http://shop.coldhandwinery.dk/da/3-online-shop" class="shop"></a>
  96.        </div>
  97.    
  98.        
  99.        <header id="header" class="row clearfix">
  100.            <!-- hero unit -->
  101. <ul class="lang_menu" style="">
  102.      
  103.            <li style="color: #fff; padding: 0 15px;">
  104.                <p style="padding: 0 15px; margin-bottom: 0; border-right: 1px solid #74848f; border-left: 1px solid #74848f;">Danish</p>
  105.                <ul class="lang_submenu" style="margin-left: 0; list-style: none; background-color: #333333;">
  106.                    <a style="color:#fff;" href="/en"><li style="padding: 5px 0;" >English</li></a>
  107.                    <a style="color:#fff;" href="/de"><li style="padding: 5px 0;">Deutsch</li></a>
  108.                </ul>
  109.            </li>
  110.    
  111. </ul>
  112. <div id="fb" style="position:absolute; right:30px; top:1px;">
  113.  
  114.    <a href="https://www.facebook.com/pages/Cold-Hand-Winery/280396455326889" target="_blank" style="color:white; font-size:14px;">Følg os på <img src="http://www.coldhandwinery.dk/templates/responsiv3/images/fb.png" style="height:20px; margin-top:-2px;"></a>
  115.  
  116. </div>
  117.  
  118. <div id="hero" class="clearfix">
  119.  
  120.    <span class='logo'>
  121.    <img src="http://www.coldhandwinery.dk/templates/responsiv3/images/logo.png" alt="">
  122.    </span>
  123.  
  124. </div>
  125. <!--- navigation -->
  126. <div id="menu-container" class="span12 clearfix">
  127.    <!-- desktop -->
  128.    <nav id="main" class="menu visible-desktop clearfix">
  129.        <!-- aviva menu -->
  130.        
  131. <ul class="xm_0" id="xm_2">
  132.     <li id="xmi2" class="xm_0 selected current begin"><a id="xma2" class="xm_0 selected current begin" href="http://www.coldhandwinery.dk/">Velkommen<span class='teaser'>Start her</span><span class='indicator'></span></a></li>
  133.     <li id="xmi77" class="xm_0"><a id="xma77" class="xm_0" href="http://www.coldhandwinery.dk/vores-&230bler/">Om &#230;blerne<span class='teaser'>Om &#230;blesorterne</span><span class='indicator'></span></a></li>
  134.     <li id="xmi73" class="xm_0"><a id="xma73" class="xm_0" href="http://www.coldhandwinery.dk/firma-profil/aktuelt/">Firma profil<span class='teaser'>Hvem er vi</span><span class='indicator'></span></a>
  135.     <ul class="xm_1 submenu" id="xm_73">
  136.         <li id="xmi129" class="xm_1 begin"><a id="xma129" class="xm_1 begin" href="http://www.coldhandwinery.dk/firma-profil/aktuelt/">F&#248;lg med....</a></li>
  137.         <li id="xmi91" class="xm_1"><a id="xma91" class="xm_1" href="http://www.coldhandwinery.dk/firma-profil/hvem-er-vi/">Hvem er vi</a></li>
  138.         <li id="xmi221" class="xm_1"><a id="xma221" class="xm_1" href="http://www.coldhandwinery.dk/firma-profil/bliv-medejer/">Bliv medejer</a></li>
  139.         <li id="xmi122" class="xm_1 end"><a id="xma122" class="xm_1 end" href="http://www.coldhandwinery.dk/firma-profil/presse/hvad-skrev-pressen/">Presse<span class='marker'></span></a>
  140.         <ul class="xm_2 submenu" id="xm_122">
  141.             <li id="xmi124" class="xm_2 begin"><a id="xma124" class="xm_2 begin" href="http://www.coldhandwinery.dk/firma-profil/presse/hvad-skrev-pressen/">Hvad skrev pressen</a></li>
  142.             <li id="xmi123" class="xm_2"><a id="xma123" class="xm_2" href="http://www.coldhandwinery.dk/firma-profil/presse/tv-indslag-og-videoklip/">TV indslag og videoklip</a></li>
  143.             <li id="xmi128" class="xm_2 end"><a id="xma128" class="xm_2 end" href="http://www.coldhandwinery.dk/firma-profil/presse/blogget-om-os/">Blogget om os</a></li>
  144.         </ul>
  145.  
  146. <a href='#' style='display:none;'></a></li>
  147.     </ul>
  148.  
  149. <a href='#' style='display:none;'></a></li>
  150.     <li id="xmi76" class="xm_0"><a id="xma76" class="xm_0" href="http://www.coldhandwinery.dk/produkter/">Produkter<span class='teaser'>Se vores udvalg</span><span class='indicator'></span></a>
  151.     <ul class="xm_1 submenu" id="xm_76">
  152.         <li id="xmi127" class="xm_1 begin"><a id="xma127" class="xm_1 begin" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/crispa-2013/">Mousserende frugtvin<span class='marker'></span></a>
  153.         <ul class="xm_2 submenu" id="xm_127">
  154.             <li id="xmi139" class="xm_2 begin"><a id="xma139" class="xm_2 begin" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/crispa-2013/">Crispa - boblende stikkelsb&#230;r</a></li>
  155.             <li id="xmi140" class="xm_2"><a id="xma140" class="xm_2" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/rubus-2013/">Rubus - boblende hindb&#230;r</a></li>
  156.             <li id="xmi141" class="xm_2"><a id="xma141" class="xm_2" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/cerasus-2013---boblende-kirsebaer/">Cerasus 2013 - boblende kirsebær</a></li>
  157.             <li id="xmi131" class="xm_2"><a id="xma131" class="xm_2" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/pommus---boblende-&230bler/">Pommus - boblende &#230;bler</a></li>
  158.             <li id="xmi130" class="xm_2"><a id="xma130" class="xm_2" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/rheum---boblende-rabarber/">Rheum - boblende rabarber</a></li>
  159.             <li id="xmi142" class="xm_2 end"><a id="xma142" class="xm_2 end" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/vinter-2012/">Vinter - En outcider</a></li>
  160.         </ul>
  161.  
  162. <a href='#' style='display:none;'></a></li>
  163.         <li id="xmi125" class="xm_1"><a id="xma125" class="xm_1" href="http://www.coldhandwinery.dk/produkter/&198blevin/malus-danica---&230bleisvin/">&#198;blevin<span class='marker'></span></a>
  164.         <ul class="xm_2 submenu" id="xm_125">
  165.             <li id="xmi97" class="xm_2 begin"><a id="xma97" class="xm_2 begin" href="http://www.coldhandwinery.dk/produkter/&198blevin/malus-danica---&230bleisvin/">Malus Danica - &#230;bleisvin</a></li>
  166.             <li id="xmi222" class="xm_2"><a id="xma222" class="xm_2" href="http://www.coldhandwinery.dk/produkter/&198blevin/malus-danica-2012-oeko/">Malus Danica 2012 &#8211; &#216;KO</a></li>
  167.             <li id="xmi132" class="xm_2"><a id="xma132" class="xm_2" href="http://www.coldhandwinery.dk/produkter/&198blevin/malus-x---feminam/">Malus X - Feminam</a></li>
  168.             <li id="xmi133" class="xm_2 end"><a id="xma133" class="xm_2 end" href="http://www.coldhandwinery.dk/produkter/&198blevin/malus-x---masculine/">Malus X - Masculine</a></li>
  169.         </ul>
  170.  
  171. <a href='#' style='display:none;'></a></li>
  172.         <li id="xmi126" class="xm_1"><a id="xma126" class="xm_1" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/nigra-x-2014/">&#216;vrige frugtvine<span class='marker'></span></a>
  173.         <ul class="xm_2 submenu" id="xm_126">
  174.             <li id="xmi224" class="xm_2 begin"><a id="xma224" class="xm_2 begin" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/nigra-x-2014/">Nigra X 2014</a></li>
  175.             <li id="xmi134" class="xm_2"><a id="xma134" class="xm_2" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/prunus-nigra---kirsebaervin/">Prunus Nigra - kirsebærvin</a></li>
  176.             <li id="xmi225" class="xm_2"><a id="xma225" class="xm_2" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/pyrus-communis-paeredessertvin/">Pyrus Communis - p&#230;redessertvin</a></li>
  177.             <li id="xmi223" class="xm_2"><a id="xma223" class="xm_2" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/ribes-ruby/">Ribes Ruby - solb&#230;rvin</a></li>
  178.             <li id="xmi135" class="xm_2"><a id="xma135" class="xm_2" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/ribes-nigrum---solbaervin/">Ribes Nigrum - solb&#230;rvin</a></li>
  179.             <li id="xmi137" class="xm_2 end"><a id="xma137" class="xm_2 end" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/prunus-rosa---blommevin/">Prunus Rosa - blommevin</a></li>
  180.         </ul>
  181.  
  182. <a href='#' style='display:none;'></a></li>
  183.         <li id="xmi144" class="xm_1 end"><a id="xma144" class="xm_1 end" href="http://www.coldhandwinery.dk/produkter/praemievine/">Pr&#230;mievine</a></li>
  184.     </ul>
  185.  
  186. <a href='#' style='display:none;'></a></li>
  187.     <li id="xmi120" class="xm_0"><a id="xma120" class="xm_0" href="http://www.coldhandwinery.dk/smagninger/">Smagninger<span class='teaser'><p>Bes&oslash;g os</p></span><span class='indicator'></span></a></li>
  188.     <li id="xmi143" class="xm_0"><a id="xma143" class="xm_0" href="http://www.coldhandwinery.dk/forhandler/">Forhandler <span class='teaser'>Find forhandler</span><span class='indicator'></span></a></li>
  189.     <li id="xmi10" class="xm_0 end"><a id="xma10" class="xm_0 end" href="http://www.coldhandwinery.dk/kontakt-os/">Kontakt os<span class='teaser'>F&#229; mere information</span><span class='indicator'></span></a></li>
  190. </ul>
  191.  
  192.  
  193.  
  194.        <!-- search -->
  195.        
  196.        <a href="#search"
  197.           id="main-search-toggle"
  198.           class="search"
  199.           rel="tooltip"
  200.           data-placement="top"
  201.           data-original-title="S&oslash;g"
  202.           title='S&oslash;g'></a>
  203.        
  204.    </nav>
  205.  
  206.    <!-- tablets -->
  207.    <nav id="responsive" class="menu hidden-desktop">
  208.        <!-- buttons -->
  209.        <div class="buttons">
  210.        
  211.          <a href="http://shop.coldhandwinery.dk/da" id="responsive-webshop">WEBSHOP</a>
  212.        
  213.          <a href="http://www.coldhandwinery.dk/" id="responsive-menu-toggle">MENU</a>
  214.          <a href="http://www.coldhandwinery.dk/" id="responsive-home-btn"><i class="icon-home"></i> </a>
  215.          <a href="#search" id="responsive-search-toggle"><i class="icon-search"></i> </a>
  216.          <a href="https://www.facebook.com/pages/Cold-Hand-Winery/280396455326889" id="responsive-fb-btn"><i class="icon-facebook"></i></a>
  217.        </div>
  218.                            <!-- aviva menu -->
  219.        
  220.     <ul class="xm_1 sel" id="xm_2">
  221.         <li id="xmi77" class="xm_1 begin"><a id="xma77" class="xm_1 begin" href="http://www.coldhandwinery.dk/vores-&230bler/">Om &#230;blerne</a></li>
  222.         <li id="xmi73" class="xm_1 presub"><a id="xma73" class="xm_1 presub" href="http://www.coldhandwinery.dk/firma-profil/aktuelt/">Firma profil<span class='marker'></span></a></li><li class="xm_1 presub subcontainer">
  223.  
  224.         <ul class="xm_2 submenu" id="xm_73">
  225.             <li id="xmi129" class="xm_2 begin"><a id="xma129" class="xm_2 begin" href="http://www.coldhandwinery.dk/firma-profil/aktuelt/">F&#248;lg med....</a></li>
  226.             <li id="xmi91" class="xm_2"><a id="xma91" class="xm_2" href="http://www.coldhandwinery.dk/firma-profil/hvem-er-vi/">Hvem er vi</a></li>
  227.             <li id="xmi221" class="xm_2"><a id="xma221" class="xm_2" href="http://www.coldhandwinery.dk/firma-profil/bliv-medejer/">Bliv medejer</a></li>
  228.             <li id="xmi122" class="xm_2 end presub"><a id="xma122" class="xm_2 end presub" href="http://www.coldhandwinery.dk/firma-profil/presse/hvad-skrev-pressen/">Presse<span class='marker'></span></a></li><li class="xm_2 end presub subcontainer">
  229.  
  230.             <ul class="xm_3 submenu" id="xm_122">
  231.                 <li id="xmi124" class="xm_3 begin"><a id="xma124" class="xm_3 begin" href="http://www.coldhandwinery.dk/firma-profil/presse/hvad-skrev-pressen/">Hvad skrev pressen</a></li>
  232.                 <li id="xmi123" class="xm_3"><a id="xma123" class="xm_3" href="http://www.coldhandwinery.dk/firma-profil/presse/tv-indslag-og-videoklip/">TV indslag og videoklip</a></li>
  233.                 <li id="xmi128" class="xm_3 end"><a id="xma128" class="xm_3 end" href="http://www.coldhandwinery.dk/firma-profil/presse/blogget-om-os/">Blogget om os</a></li>
  234.             </ul>
  235.  
  236. </li>       </ul>
  237.  
  238. </li>       <li id="xmi76" class="xm_1 presub postsub"><a id="xma76" class="xm_1 presub postsub" href="http://www.coldhandwinery.dk/produkter/">Produkter<span class='marker'></span></a></li><li class="xm_1 presub postsub subcontainer">
  239.  
  240.         <ul class="xm_2 submenu" id="xm_76">
  241.             <li id="xmi127" class="xm_2 begin presub"><a id="xma127" class="xm_2 begin presub" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/crispa-2013/">Mousserende frugtvin<span class='marker'></span></a></li><li class="xm_2 begin presub subcontainer">
  242.  
  243.             <ul class="xm_3 submenu" id="xm_127">
  244.                 <li id="xmi139" class="xm_3 begin"><a id="xma139" class="xm_3 begin" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/crispa-2013/">Crispa - boblende stikkelsb&#230;r</a></li>
  245.                 <li id="xmi140" class="xm_3"><a id="xma140" class="xm_3" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/rubus-2013/">Rubus - boblende hindb&#230;r</a></li>
  246.                 <li id="xmi141" class="xm_3"><a id="xma141" class="xm_3" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/cerasus-2013---boblende-kirsebaer/">Cerasus 2013 - boblende kirsebær</a></li>
  247.                 <li id="xmi131" class="xm_3"><a id="xma131" class="xm_3" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/pommus---boblende-&230bler/">Pommus - boblende &#230;bler</a></li>
  248.                 <li id="xmi130" class="xm_3"><a id="xma130" class="xm_3" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/rheum---boblende-rabarber/">Rheum - boblende rabarber</a></li>
  249.                 <li id="xmi142" class="xm_3 end"><a id="xma142" class="xm_3 end" href="http://www.coldhandwinery.dk/produkter/mousserende-frugtvin/vinter-2012/">Vinter - En outcider</a></li>
  250.             </ul>
  251.  
  252. </li>           <li id="xmi125" class="xm_2 presub postsub"><a id="xma125" class="xm_2 presub postsub" href="http://www.coldhandwinery.dk/produkter/&198blevin/malus-danica---&230bleisvin/">&#198;blevin<span class='marker'></span></a></li><li class="xm_2 presub postsub subcontainer">
  253.  
  254.             <ul class="xm_3 submenu" id="xm_125">
  255.                 <li id="xmi97" class="xm_3 begin"><a id="xma97" class="xm_3 begin" href="http://www.coldhandwinery.dk/produkter/&198blevin/malus-danica---&230bleisvin/">Malus Danica - &#230;bleisvin</a></li>
  256.                 <li id="xmi222" class="xm_3"><a id="xma222" class="xm_3" href="http://www.coldhandwinery.dk/produkter/&198blevin/malus-danica-2012-oeko/">Malus Danica 2012 &#8211; &#216;KO</a></li>
  257.                 <li id="xmi132" class="xm_3"><a id="xma132" class="xm_3" href="http://www.coldhandwinery.dk/produkter/&198blevin/malus-x---feminam/">Malus X - Feminam</a></li>
  258.                 <li id="xmi133" class="xm_3 end"><a id="xma133" class="xm_3 end" href="http://www.coldhandwinery.dk/produkter/&198blevin/malus-x---masculine/">Malus X - Masculine</a></li>
  259.             </ul>
  260.  
  261. </li>           <li id="xmi126" class="xm_2 presub postsub"><a id="xma126" class="xm_2 presub postsub" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/nigra-x-2014/">&#216;vrige frugtvine<span class='marker'></span></a></li><li class="xm_2 presub postsub subcontainer">
  262.  
  263.             <ul class="xm_3 submenu" id="xm_126">
  264.                 <li id="xmi224" class="xm_3 begin"><a id="xma224" class="xm_3 begin" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/nigra-x-2014/">Nigra X 2014</a></li>
  265.                 <li id="xmi134" class="xm_3"><a id="xma134" class="xm_3" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/prunus-nigra---kirsebaervin/">Prunus Nigra - kirsebærvin</a></li>
  266.                 <li id="xmi225" class="xm_3"><a id="xma225" class="xm_3" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/pyrus-communis-paeredessertvin/">Pyrus Communis - p&#230;redessertvin</a></li>
  267.                 <li id="xmi223" class="xm_3"><a id="xma223" class="xm_3" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/ribes-ruby/">Ribes Ruby - solb&#230;rvin</a></li>
  268.                 <li id="xmi135" class="xm_3"><a id="xma135" class="xm_3" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/ribes-nigrum---solbaervin/">Ribes Nigrum - solb&#230;rvin</a></li>
  269.                 <li id="xmi137" class="xm_3 end"><a id="xma137" class="xm_3 end" href="http://www.coldhandwinery.dk/produkter/&216vrige-frugtvine/prunus-rosa---blommevin/">Prunus Rosa - blommevin</a></li>
  270.             </ul>
  271.  
  272. </li>           <li id="xmi144" class="xm_2 end postsub"><a id="xma144" class="xm_2 end postsub" href="http://www.coldhandwinery.dk/produkter/praemievine/">Pr&#230;mievine</a></li>
  273.         </ul>
  274.  
  275. </li>       <li id="xmi120" class="xm_1 postsub"><a id="xma120" class="xm_1 postsub" href="http://www.coldhandwinery.dk/smagninger/">Smagninger</a></li>
  276.         <li id="xmi143" class="xm_1"><a id="xma143" class="xm_1" href="http://www.coldhandwinery.dk/forhandler/">Forhandler </a></li>
  277.         <li id="xmi10" class="xm_1 end"><a id="xma10" class="xm_1 end" href="http://www.coldhandwinery.dk/kontakt-os/">Kontakt os</a></li>
  278.     </ul>
  279.  
  280.  
  281.    </nav>
  282.  
  283.    <!-- search form -->
  284.    
  285.    <div id="search-container" class="span6" style="display: none;">
  286.        <form action="default.asp?page_id=4" method="post" class="smallsearch"><input class="span3" type="text" name="keyword" value="" placeholder="Skriv søgeord"><button class="btn btn-success hidden-desktop" type="submit">S&oslash;g</button></form>
  287.    </div>
  288.    
  289. </div>
  290.  
  291.            <!-- fader -->
  292.            <div id='slider' class='carousel slide span12'><ol class='carousel-indicators'><li data-target='#slider' data-slide-to='0' class='active'></li><li data-target='#slider' data-slide-to='1'></li><li data-target='#slider' data-slide-to='2'></li><li data-target='#slider' data-slide-to='3'></li><li data-target='#slider' data-slide-to='4'></li><li data-target='#slider' data-slide-to='5'></li><li data-target='#slider' data-slide-to='6'></li></ol><div class='carousel-inner'><a href='/produkter/' class='item active clearfix'><div style='position:absolute;top:0;left:0;bottom:0;'><img src='aviva/media/slider/banner_nye_vine_2015_.jpg' alt=''></div><span class='readmore-big'>L&aelig;s mere</span></a><a href='/firma-profil/bliv-medejer/' class='item clearfix'><div style='position:absolute;top:0;left:0;bottom:0;'><img src='aviva/media/slider/forside_banner_investor.jpg' alt=''></div><div class='carousel--text'><h1>Bliv medejer….&#8232;</h1><p>Lige siden firmaets spæde start, har udfordringen været at følge med efterspørgslen. Derfor sælger vi nu aktier for at skaffe vækstkapital.</p></div><span class='readmore-big'>L&aelig;s mere</span></a><a href='produkter/&216vrige-frugtvine/nigra-x-2014/' class='item clearfix'><div style='position:absolute;top:0;left:0;bottom:0;'><img src='aviva/media/produkter/3kirsebaervin_coldhandwinery.jpg' alt=''></div><div class='carousel--text'><h1>Kirsebær</h1><p>det danske Stevnsbær er nordens drue</p></div><span class='readmore-big'>L&aelig;s mere</span></a><a href='produkter/mousserende-frugtvin/rheum---boblende-rabarber/' class='item clearfix'><div style='position:absolute;top:0;left:0;bottom:0;'><img src='aviva/media/slider/mousserende_bobler_coldhandwinery.png' alt=''></div><span class='readmore-big'>L&aelig;s mere</span></a><a href='produkter/&216vrige-frugtvine/pyrus-x---paeredesssertvin/' class='item clearfix'><div style='position:absolute;top:0;left:0;bottom:0;'><img src='aviva/media/slider/pyrus_coldhandwinery_slider.jpg' alt=''></div><div class='carousel--text'><h1>Pyrus Communis 2013</h1><p>Superkoncentrerede pærer</p></div><span class='readmore-big'>L&aelig;s mere</span></a><a href='produkter/&198blevin/malus-x---feminam/' class='item clearfix'><div style='position:absolute;top:0;left:0;bottom:0;'><img src='aviva/media/slider/prisvindende_masculine_feminam_coldhandwinery.jpg' alt=''></div><div class='carousel--text'><h1>Malus X</h1><p>prisvindende æble-dessertvine</p></div><span class='readmore-big'>L&aelig;s mere</span></a><a href='produkter/&198blevin/malus-danica---&230bleisvin/' class='item clearfix'><div style='position:absolute;top:0;left:0;bottom:0;'><img src='aviva/media/slider/forside_4.jpg' alt=''></div><div class='carousel--text'><h1>Malus Danica</h1><p>Danmarks første æble-isvin</p></div><span class='readmore-big'>L&aelig;s mere</span></a></div></div><nav id="breadcrumbs" class="clearfix">
  293.  
  294. </nav>
  295.        </header>
  296.  
  297.        <!-- body content & sidebar -->
  298. <section id="content-container">
  299.    <article class="row">
  300.        <h1 style="display:none;">Site name | Velkommen</h1>
  301.        <div class="clearfix span12" id="content"><ul class='row focus'><li class='span4 even'><img src='aviva/media/forside-bokse/billede_1_1.jpg' alt='Smagninger'><div class='text'><h4 style='text-transform:uppercase;'>Smagninger</h4><div class='partner-text-internal'><p>Vi tilbyder vinsmagninger med rundvisning og historiefortælling. Book en smagning til vennerne, kollegerne, vinklubben - helt efter jeres ønsker</p></div><div class='link'><a href='smagninger/'>L&aelig;s mere</a></div></div></li><li class='span4 odd'><img src='aviva/media/forside-bokse/billede_1.jpg' alt='Frugtvin eller cider ?'><div class='text'><h4 style='text-transform:uppercase;'>Frugtvin eller cider ?</h4><div class='partner-text-internal'><p>Verdens bedste æbler dyrkes i Danmark. Når disse æbler kombineres med moderne vinøse teknikker og udstyr, bliver produktet af hidtil uset kvalitet. Derfor kalder vi det for frugtvin i stedet for cider.  </p></div><div class='link'><a href='produkter/'>L&aelig;s mere</a></div></div></li><li class='span4 even'><img src='aviva/media/coldhandwineryfacebook.jpg' alt='Aktuelt'><div class='text'><h4 style='text-transform:uppercase;'>Aktuelt</h4><div class='partner-text-internal'><p>Følg med i hverdagen på Danmarks mest nørdede frugtvineri. Se aktuelle begivenheder og følg os på Facebook.<br></p></div><div class='link'><a href='firma-profil/aktuelt/'>L&aelig;s mere</a></div></div></li></ul></div>
  302.    </article>
  303. </section><!-- body footer -->
  304. <div class="row">
  305.    <div class="span8 offset2">
  306.        <div id="footer">
  307.            <p style="text-align: center;"><strong>COLD HAND WINERY<br></strong>Haversmosevej 21, DK-8920, Randers NV &#183; Telefon: +45 21 64 27 65&#160;&#183;&#160;<a href="mailto:jens@coldhandwinery.dk">jens@coldhandwinery.dk</a></p>
  308. <p><a href="http://www.findsmiley.dk/da-DK/Searching/DetailsView.htm?virk=40903526" target="_blank"><img style="display: block; margin-left: auto; margin-right: auto;" src="aviva/media/forside-bokse/coldhandwinery_elite_smiley.png" alt="" width="49" height="42"></a></p>
  309.  
  310.            <!-- icons -->
  311.            <div class="icons">
  312.                <div>
  313.                    <!-- sitemap en ven -->
  314.                    <a href='sitemap/'
  315.                       class="sitemap"
  316.                       rel="tooltip"
  317.                       data-placement="bottom"
  318.                       data-original-title="Tip en ven"
  319.                       title='Sitemap'><i class="icon-sitemap"></i> </a>
  320.                    &nbsp;
  321.  
  322.                    <!-- print icon -->
  323.                    
  324.                    <a href='javascript:window.print();'
  325.                       class="print"
  326.                       rel="tooltip"
  327.                       data-placement="bottom"
  328.                       data-original-title="Udskriv"
  329.                       title="Udskriv"><i class="icon-print"></i> </a>
  330.                    &nbsp;
  331.                    
  332.  
  333.                    <!-- tip en ven -->
  334.                    
  335.                </div>
  336.            </div>
  337.        </div>
  338.        
  339.            <p class="cms"><small>Webbureau: <a href="http://www.infoserv.dk">Infoserv</a><span class="dash">&nbsp;&nbsp;-&nbsp;&nbsp;</span>CMS: <a href="http://www.aviva.dk">Aviva CMS</a></small></p>
  340.        
  341.    </div>
  342. </div>
  343.  
  344.    </div>
  345.        <!-- to top -->
  346.    <div id="to-top-media-hook">
  347.         <div id="to-top-wrap">
  348.            <div class="container">
  349.                <a href="#" id="to-top-btn"></a>
  350.            </div>
  351.        </div>
  352.    </div>
  353.  
  354.    <!-- Included JS Files (Uncompressed) -->
  355.    <script src="templates/responsiv3/scripts/bootstrap/js/bootstrap-carousel.js"></script>
  356.    <script src="templates/responsiv3/scripts/bootstrap/js/bootstrap-tooltip.js"></script>
  357.    <script src="templates/responsiv3/scripts/app.js"></script>
  358.  
  359.    <!-- GOOGLE ANALYTICS -->
  360.    
  361. </body>
  362. </html>
  363.  
  364. ''')
  365.  
  366. # -/ Remove html string and replace with html from site /
  367.  
  368. def meta(html):
  369.     html = html.splitlines()
  370.  
  371. # -/ Finish the function /
  372.  
  373.  
  374.  
  375.  
  376. # -/ Clean code /
  377.  
  378. html = html.splitlines()
  379. found = []
  380. found2 = []
  381.  
  382. for x in html:
  383.     try:
  384.         #x.split('<script src="')[1].split('"></script>')[0]
  385.         x.split('content="')[1].split('"')[0]
  386.         found.append(x)
  387.     except:
  388.         continue
  389.  
  390. for x in html:
  391.     try:
  392.         #x.split('<script src="')[1].split('"></script>')[0]
  393.         x.split('<meta name="')[1].split('"')[0]
  394.         found2.append(x)
  395.     except:
  396.         continue
  397.  
  398.    
  399. for x in found2:
  400.     x.strip()
  401.     #result = x.split('<meta name="')[1].split('"')[0]
  402.     result = x.split('content="')[1].split('"')[0]
  403.     result.split('\n')
  404.     test = []
  405.     test.append(result)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement