module Scrapers::GoComics
Constants
- GOCOMIC_URL
Public Class Methods
scrape(comic)
click to toggle source
# File lib/scrapers/gocomics.rb, line 11
#
# Fetches the GoComics page for +comic+ and collects its metadata.
#
# comic:: String placed after the leading "/" in the path of GOCOMIC_URL.
#
# Returns a Hash with the keys :comic, :url, :title, :pubdate and :img_src.
# The last three values come from scrape_title, scrape_pubdate and
# scrape_image_source respectively.
#
# Errors from URI component validation and from fetching the page are not
# rescued here.
def self.scrape(comic)
  url = URI.parse(GOCOMIC_URL)
  url.path = "/#{comic}"

  # Kernel#open no longer accepts URL strings as of Ruby 3.0. URI#open is
  # the open-uri entry point that keeps working, and its block form closes
  # the response (a Tempfile for larger bodies) as soon as it is parsed.
  # NOTE(review): assumes GOCOMIC_URL is an http(s) URL and that open-uri
  # is already required by this file, as the original open(url) call needed.
  page = url.open { |response| Nokogiri::HTML(response) }

  {
    comic: comic,
    url: url.to_s,
    title: scrape_title(page),
    pubdate: scrape_pubdate(page),
    img_src: scrape_image_source(page)
  }
end
scrape_image_source(page)
click to toggle source
# File lib/scrapers/gocomics.rb, line 40
#
# Looks up the "src" attribute of the first "img" found inside the first
# "p.feature_item" element of +page+.
#
# page:: parsed document responding to +at_css+.
#
# Returns the attribute value, or nil when the container, the image or the
# attribute itself is absent.
def self.scrape_image_source(page)
  container = page.at_css("p.feature_item")
  return unless container

  image = container.at_css("img")
  return unless image

  image.attr("src")
end
scrape_pubdate(page)
click to toggle source
# File lib/scrapers/gocomics.rb, line 36
#
# Reads the publication date from the first "ul.feature-nav > li" element
# of +page+.
#
# page:: parsed document responding to +at_css+.
#
# Returns the date as a String in Date#to_s form (YYYY-MM-DD), or nil when
# the element is not present. Text that Date.parse cannot interpret still
# raises, so unexpected page content is not silently hidden.
def self.scrape_pubdate(page)
  nav_item = page.at_css("ul.feature-nav > li")
  return unless nav_item

  Date.parse(nav_item.content).to_s
end
scrape_title(page)
click to toggle source
# File lib/scrapers/gocomics.rb, line 32
#
# Extracts the text of the "title" element of +page+ with whitespace
# normalised.
#
# page:: parsed document responding to +at_css+.
#
# Returns the title with every run of whitespace reduced to a single space
# and no leading or trailing space, or nil when there is no "title" element.
def self.scrape_title(page)
  title = page.at_css("title")
  return unless title

  # Collapse first, strip second: String#strip only trims ASCII whitespace,
  # so Unicode spaces (e.g. a non-breaking space) at either end must be
  # turned into plain spaces before they can be trimmed.
  title.content.gsub(/[[:space:]]+/, ' ').strip
end