Guest User

Untitled

a guest
Dec 5th, 2018
140
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Ruby 1.47 KB | None | 0 0
  # Downloads passenger-car listing pages from allegro.pl and writes one CSV row
  # per listing slot to out.csv: [sequence number, mileage, year, price, title].
  require 'nokogiri'
  require 'open-uri'
  require 'csv'

  # Result pages to download; change the upper bound to fetch more or fewer pages.
  PAGES = (1..100).freeze

  # The script assumes every result page carries 60 listings.
  RECORDS_PER_PAGE = 60

  # Absolute XPath of the <section> that contains the listing <article> nodes.
  # NOTE(review): tied to the exact page layout; any markup change on the site
  # will make every lookup come back empty.
  LISTINGS_XPATH = '/html/body/div[2]/div[3]/div/div/div/div/div[2]/div[2]/div/div[3]/div/div/div/div/div/div/div/section[2]/section'.freeze

  # Returns the text found at +relative_path+ inside the +record+-th (1-based)
  # listing article of the parsed page +doc+.
  def listing_text(doc, record, relative_path)
    doc.xpath("#{LISTINGS_XPATH}/article[#{record}]/div/div/div[2]/#{relative_path}").text
  end

  # Block form: out.csv is flushed and closed even when a download raises.
  CSV.open("out.csv", "wb") do |csv|
    PAGES.each do |page|
      main_url = "https://allegro.pl/kategoria/samochody-osobowe-4029?order=m&p=#{page}"
      print "Pobieranie strony:#{page}  "
      # URI.open (Ruby 2.5+) instead of Kernel#open, which stopped accepting
      # URLs in Ruby 3.0; the block closes the response stream after parsing.
      data = URI.open(main_url) { |io| Nokogiri::HTML(io) }
      print " OK\n"

      (1..RECORDS_PER_PAGE).each do |record|
        # Running record number across all pages.
        lp = (page - 1) * RECORDS_PER_PAGE + record

        opis = listing_text(data, record, 'div[1]/h2/a')

        # Mileage with the trailing unit removed.
        przebieg = listing_text(data, record, 'div[1]/div/dl/dd[3]/span').gsub(' km', '')

        rocznik = listing_text(data, record, 'div[1]/div/dl/dd[2]/span')

        # Price: drop the ",NN zł" tail first, then the spaces inside the number.
        cena = listing_text(data, record, 'div[2]/div/div/span/span')
               .gsub(/(,\d\d zł)/, '')
               .gsub(' ', '')

        csv << [lp, przebieg, rocznik, cena, opis]
      end
    end
  end
Advertisement
Add Comment
Please, Sign In to add comment