Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- <?php
error_reporting(E_ALL);
require 'phpQuery.php';

// Crawl entry point: download the index page, follow every link found in
// its #menu element, and store each linked page's <title> and the text of
// its "#content p" elements through addContent().
$url = 'http://theory.phphtml.net/exercises/advanced/php/parsing/zadachi-na-poetapnyj-parsing-i-metod-pauka/1/index.php';
// Each menu href is appended to this prefix, so the links are presumably
// relative to this directory -- TODO confirm against the live markup.
$prefix = 'http://theory.phphtml.net/exercises/advanced/php/parsing/zadachi-na-poetapnyj-parsing-i-metod-pauka/1/';

$result = connect($url);
$links = [];
if ($result === false) {
    // connect() reports a failed transfer as false; without the index page
    // there is nothing to crawl, so report it and fall through with no links.
    trigger_error('Failed to download the index page: ' . $url, E_USER_WARNING);
} else {
    $pq = phpQuery::newDocument($result);
    $links = $pq->find('#menu a');
}

foreach ($links as $link) {
    $href = pq($link)->attr('href');
    if ((string) $href === '') {
        // An anchor without a target would only re-fetch the bare prefix URL.
        continue;
    }

    // Dedicated per-page variables: the index URL and the index document are
    // no longer overwritten while their menu links are still being iterated.
    $pageUrl = $prefix . $href;
    $pageHtml = connect($pageUrl);
    if ($pageHtml === false) {
        // Skip pages that could not be downloaded instead of storing an empty row.
        trigger_error('Failed to download page: ' . $pageUrl, E_USER_WARNING);
        continue;
    }

    $page = phpQuery::newDocument($pageHtml);
    $title = $page->find('title')->text();
    $content = $page->find('#content p')->text();
    addContent($pageUrl, $title, $content);
}
/**
 * Inserts one crawled page as a new row of the `page` table.
 *
 * The values are sent through a prepared statement, so quotes or other SQL
 * metacharacters in the scraped text cannot break or alter the query.
 * A fresh connection to the local `phpquery` database is opened for the call
 * and closed before returning.
 *
 * NOTE(review): the connection charset is left at the server default; confirm
 * it matches the encoding of the `page` table.
 *
 * @param string $url     Address the page was downloaded from.
 * @param string $title   Text of the page's <title>.
 * @param string $content Text extracted from the page body.
 *
 * @return bool True when the row was inserted, false when the statement could
 *              not be prepared or executed. The script is terminated if the
 *              database connection cannot be established.
 */
function addContent($url, $title, $content)
{
    $host = 'localhost';
    $user = 'root';
    $password = '';
    $db_name = 'phpquery';

    $connect = mysqli_connect($host, $user, $password, $db_name);
    if (!$connect) {
        // There is no connection handle to query at this point, so the
        // connection-level error accessor is the one that has the message.
        die(mysqli_connect_error());
    }

    // NULL for id is kept from the original query (presumably an
    // auto-increment column -- verify against the schema).
    $query = 'INSERT INTO page (id, title, content, url) VALUES (NULL, ?, ?, ?)';
    $statement = mysqli_prepare($connect, $query);
    if ($statement === false) {
        mysqli_close($connect);
        return false;
    }

    mysqli_stmt_bind_param($statement, 'sss', $title, $content, $url);
    $result = mysqli_stmt_execute($statement);

    mysqli_stmt_close($statement);
    mysqli_close($connect);

    return $result;
}
/**
 * Downloads a URL with cURL and returns the response body.
 *
 * Redirects are followed (up to a fixed limit) and the transfer is bounded by
 * connect and total timeouts so that a stalled server cannot hang the crawl.
 *
 * @param string $url Address to download.
 *
 * @return string|false Response body, or false when the cURL handle could not
 *                      be created or the transfer failed. Callers must check
 *                      for false before using the result.
 */
function connect($url)
{
    $curl = curl_init();
    if ($curl === false) {
        return false;
    }

    curl_setopt($curl, CURLOPT_URL, $url);
    curl_setopt($curl, CURLOPT_FOLLOWLOCATION, true);
    // Cap the redirect chain so a redirect loop terminates.
    curl_setopt($curl, CURLOPT_MAXREDIRS, 10);
    // Return the body from curl_exec() instead of printing it.
    curl_setopt($curl, CURLOPT_RETURNTRANSFER, true);
    // Seconds allowed for establishing the connection and for the whole
    // transfer; without these a dead host blocks the script indefinitely.
    curl_setopt($curl, CURLOPT_CONNECTTIMEOUT, 10);
    curl_setopt($curl, CURLOPT_TIMEOUT, 30);

    $result = curl_exec($curl);

    return $result;
}
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement