module Scrapers::GoComics

Constants

GOCOMIC_URL

Public Class Methods

scrape(comic)
# File lib/scrapers/gocomics.rb, line 11
# Scrapes the page for +comic+ and returns what was found as a Hash.
#
# The page URL is GOCOMIC_URL with its path replaced by "/<comic>".
#
# comic - path segment identifying the comic; interpolated into the URL
#         path as-is (no escaping is applied here).
#
# Returns a Hash with the keys :comic, :url, :title, :pubdate and :img_src,
# in that order.
def self.scrape(comic)
  url = URI.parse(GOCOMIC_URL)
  url.path = "/#{comic}"
  page_url = url.to_s

  # URI.open (provided by open-uri) is used instead of a bare `open`:
  # Kernel#open stopped handling URLs in Ruby 3.0, and it treats strings
  # starting with "|" as commands. The block form closes the underlying
  # IO as soon as the document has been parsed.
  page = URI.open(page_url) { |io| Nokogiri::HTML(io) }

  {
    comic: comic,
    url: page_url,
    title: scrape_title(page),
    pubdate: scrape_pubdate(page),
    img_src: scrape_image_source(page)
  }
end
scrape_image_source(page)
# File lib/scrapers/gocomics.rb, line 40
# Returns the "src" attribute of the first <img> found inside the first
# element matching "p.feature_item" on +page+.
#
# page - parsed document (anything responding to at_css).
#
# Raises NoMethodError if either element is missing, because the lookup
# is then attempted on nil.
def self.scrape_image_source(page)
  feature_item = page.at_css("p.feature_item")
  image = feature_item.at_css("img")
  image.attr("src")
end
scrape_pubdate(page)
# File lib/scrapers/gocomics.rb, line 36
# Reads the text of the first element matching "ul.feature-nav > li" on
# +page+, parses it as a date and returns that date as a String
# (Date#to_s format).
#
# page - parsed document (anything responding to at_css).
def self.scrape_pubdate(page)
  nav_item = page.at_css("ul.feature-nav > li")
  published_on = Date.parse(nav_item.content)
  published_on.to_s
end
scrape_title(page)
# File lib/scrapers/gocomics.rb, line 32
# Returns the text of the page's <title> element with whitespace
# normalised: the text is stripped, every whitespace character is turned
# into a plain space, and runs of spaces are collapsed to one.
#
# page - parsed document (anything responding to at_css).
def self.scrape_title(page)
  raw_title = page.at_css("title").content
  spaced = raw_title.strip.gsub(/[[:space:]]/, ' ')
  spaced.squeeze(" ")
end