Advertisement
Not a member of Pastebin yet?
Sign up — it unlocks many cool features!
- var request = require('request');
- var cheerio = require('cheerio');
- var fs = require('fs');
// Open (creating it if necessary) the output file in append mode and publish
// its descriptor as `global.id`, which Scraper.getProxy() writes to.
//
// The file is opened synchronously so the descriptor is already set before any
// scraping callback can run, and so a failure to open the file throws here
// instead of silently leaving `global.id` undefined.
//
// The mode must be an octal literal: decimal 666 equals 0o1232, which is not
// the intended rw-rw-rw- permission set.
global.id = fs.openSync("proxy.txt", 'a', 0o666);

// Not referenced by any code visible in this file (Scraper keeps its own
// `a_links` / `links` on the instance). Kept, and kept as `var`, in case
// another part of the file still reads or redeclares them.
var a_links = [];
var links = [];
/**
 * Scrapes http://proxyserverlist-24.blogspot.com/ in two steps:
 * getLinks() collects post links from the front page, then getProxy()
 * downloads each selected post and appends the extracted text to the file
 * descriptor stored in `global.id`.
 */
class Scraper {
  constructor() {
    // Every matching post href found on the front page, in document order.
    this.a_links = [];
    // The subset of `a_links` that getProxy() downloads.
    this.links = [];
  }

  /**
   * Downloads the front page, records the hrefs of all anchors pointing at
   * 2017 posts in `this.a_links`, selects up to three of them into
   * `this.links`, and then calls getProxy().
   *
   * Failures are reported on stderr; nothing is thrown to the caller because
   * the work happens inside the request callback.
   */
  getLinks() {
    request(
      { url: 'http://proxyserverlist-24.blogspot.com/' },
      (error, response, body) => {
        if (error) {
          console.error(`Failed to load the post index: ${error.message}`);
          return;
        }

        const $ = cheerio.load(body);

        // Read the attribute through cheerio instead of regex-matching the
        // serialized HTML: this yields the decoded URL (no `&amp;`) and
        // replaces the previous list, so repeated calls never reuse stale
        // links from an earlier run.
        this.a_links = $('a[href*="http://proxyserverlist-24.blogspot.com/2017/"]')
          .map((index, anchor) => $(anchor).attr('href'))
          .get();

        // Only every other match is used (indices 0, 2 and 4) — presumably
        // each post is linked twice on the page; TODO confirm. Indices that
        // do not exist are dropped so `request` is never given an undefined
        // URL.
        this.links = [0, 2, 4]
          .map((index) => this.a_links[index])
          .filter((link) => link !== undefined);

        if (this.links.length === 0) {
          console.error('No post links found on the front page.');
          return;
        }

        console.log(`Got new ${this.links.length} links...`);
        this.getProxy();
      },
    );
  }

  /**
   * Downloads every URL in `this.links`, extracts one text section from each
   * page and appends it to the descriptor in `global.id`.
   *
   * The requests are started together, so the order in which the sections
   * reach the file depends on which response arrives first.
   */
  getProxy() {
    for (const url of this.links) {
      request({ url }, (error, response, body) => {
        if (error) {
          console.error(`Failed to load ${url}: ${error.message}`);
          return;
        }

        const $ = cheerio.load(body);
        const html = $('span[style*="font-weight: bold;"]').toString();

        // The wanted section is the text between the 4th `bold;">` marker
        // and the next closing span. A page with fewer markers has no such
        // section; skip it instead of crashing on `undefined.split`.
        const section = html.split('bold;">')[4];
        if (section === undefined) {
          console.error(`No proxy list found at ${url}`);
          return;
        }
        const proxies = section.split('</span>')[0];

        if (typeof global.id !== 'number') {
          console.error('Output file is not open (global.id is not set).');
          return;
        }

        // Several pages are appended to the same file; end each chunk with a
        // newline so the last line of one list cannot merge with the first
        // line of the next.
        const chunk = proxies.endsWith('\n') ? proxies : `${proxies}\n`;

        fs.write(global.id, chunk, null, 'utf8', (writeError) => {
          if (writeError) {
            console.error(`Failed to save proxies from ${url}: ${writeError.message}`);
            return;
          }
          console.log("Saved");
        });
      });
    }
  }
}
// Script entry point: build a scraper and start the run. getLinks() chains
// into getProxy() on its own once the front page has been fetched.
const test = new Scraper();

test.getLinks();
Advertisement
Add Comment
Please sign in to add a comment.
Advertisement