Not a member of Pastebin yet? Sign up — it unlocks many cool features!
#!/usr/bin/env ruby
# Scrapes the forum index at clublandlv.com, prints the genre forums found in
# the "#cat10" category together with their links and numeric forum ids, and
# opens the SQLite database that is meant to store them.

require 'nokogiri'
require 'open-uri'
require 'sequel'
require 'sqlite3'
require 'pry'
require 'uri'
require 'cgi'

FORUM_INDEX_URL = 'http://www.clublandlv.com/forum.php'

# Returns the href of the first <a> element found inside +node+, or nil when
# the node contains no anchor.
def anchor_href(node)
  anchor = node.at_css('a')
  anchor && anchor['href']
end

# Extracts the numeric forum id carried by the "f" query parameter of +href+
# (e.g. "forumdisplay.php?f=12" => 12).
#
# Returns nil when the href cannot be parsed, has no query string, or its "f"
# parameter is missing or not a plain decimal number.
def forum_id_from_href(href)
  query = URI.parse(href).query
  return nil unless query

  raw_id = CGI.parse(query)['f'].first
  return nil unless raw_id && raw_id =~ /\A\d+\z/

  raw_id.to_i
rescue URI::InvalidURIError
  nil
end

# Kernel#open no longer fetches URLs on Ruby 3.0+; open-uri's URI.open does.
doc = Nokogiri::HTML(URI.open(FORUM_INDEX_URL))
puts doc.css('title').text
puts

# Connect once, outside the loop, so the constant is never re-assigned.
# Table has 3 columns. ID(auto), genre, forum_id
DB = Sequel.connect('sqlite://clublandlv.sqlite')

doc.css('#cat10').each do |category|
  titles = category.css('.forumtitle')
  genres = titles.map(&:text)
  # Collect plain href strings; the results go into fresh arrays rather than
  # back into the Nokogiri NodeSet, which only accepts nodes.
  genre_links = titles.map { |title| anchor_href(title) }.compact
  forum_ids = genre_links.map { |href| forum_id_from_href(href) }.compact

  puts "This is an array of the genres:"
  puts genres
  puts
  puts "These are the genre links:"
  puts genre_links
  puts
  puts "These are the forum ids:"
  puts forum_ids
  puts

  # Subforum names and links can be collected the same way via ".subforum a":
  #   subgenres      = category.css('.subforum a').map(&:text)
  #   subgenre_links = category.css('.subforum a').map { |a| a['href'] }

  # TODO: persist each genre with its forum id once duplicate detection is in
  # place, writing both columns in a single row, e.g.
  #   DB[:genres].insert(:genre => genre, :forum_id => forum_id)
end
Advertisement
Add Comment
Please, Sign In to add comment