class ChildrensBooks::Scraper
Public Class Methods
scrape()
click to toggle source
# File lib/childrens_books/scraper.rb, line 3 def self.scrape html = open("https://www.commonsensemedia.org/lists/50-books-all-kids-should-read-before-theyre-12") doc = Nokogiri::HTML(html) doc.css(".views-row-odd").each do |node| title = node.css("strong.field-content a").text author = node.css("div.views-field-field-term-book-authors").text.gsub("By", "").strip description = node.css("div.views-field-field-one-liner").text.strip age = node.css("div.views-field-field-review-recommended-age").text.strip.delete("age").delete("+").split.join("") year = node.css("div.views-field-field-canonical-date").text.strip.gsub(/[()]/, "") url = node.css("strong.field-content a").attr("href").value ChildrensBooks::Book.new(title, author, description, age, year, url) end doc.css(".views-row-even").each do |node| title = node.css("strong.field-content a").text author = node.css("div.views-field-field-term-book-authors").text.gsub("By", "").strip description = node.css("div.views-field-field-one-liner").text.strip age = node.css("div.views-field-field-review-recommended-age").text.strip.delete("age").delete("+").split.join("") year = node.css("div.views-field-field-canonical-date").text.strip.gsub(/[()]/, "") url = node.css("strong.field-content a").attr("href").value ChildrensBooks::Book.new(title, author, description, age, year, url) end end