module Bbc10::Scraper
Public Class Methods
get_links(page)
click to toggle source
# File lib/bbc10/scraper.rb, line 12
#
# Collects the URLs of the anchors found under the
# '.nw-c-most-read__items' selector of a parsed page.
#
# @param page [#css] parsed document; `css` must return an enumerable of
#   elements that expose their attributes through `[]`
# @return [Array<String>] one absolute URL per anchor that carries a
#   non-blank href
def self.get_links(page)
  base = 'https://www.bbc.co.uk'

  hrefs = page.css('.nw-c-most-read__items a').map { |link| link['href'].to_s.strip }

  # Anchors without an href used to raise TypeError; they are skipped now.
  hrefs.reject(&:empty?).map do |href|
    if href.start_with?('http://', 'https://')
      # Already absolute: prefixing the host again would corrupt the URL.
      href
    elsif href.start_with?('//')
      # Protocol-relative link: only the scheme is missing.
      "https:#{href}"
    elsif href.start_with?('/')
      "#{base}#{href}"
    else
      "#{base}/#{href}"
    end
  end
end
read_page(url)
click to toggle source
# File lib/bbc10/scraper.rb, line 8
#
# Downloads the document at +url+ and parses it as HTML.
#
# Uses URI.open rather than Kernel#open: open-uri stopped patching
# Kernel#open for URLs in Ruby 3.0, and Kernel#open spawns a subprocess
# when its argument starts with "|". The block form closes the stream
# once the body has been read.
#
# @param url [String] address of the page to fetch
# @return the document produced by Nokogiri::HTML for the response body
def self.read_page(url)
  markup = URI.open(url, &:read)
  Nokogiri::HTML(markup)
end
scrape_story(story)
click to toggle source
# File lib/bbc10/scraper.rb, line 16
#
# Prints the text of every paragraph matched by '.story-body__inner p',
# each followed by a blank line. When no paragraph with visible text is
# found, prints a notice telling the reader to use the link instead.
#
# @param story [#css] parsed document; `css` must return an enumerable of
#   elements responding to `content`
def self.scrape_story(story)
  paragraphs = story.css('.story-body__inner p').map(&:content)

  # Whitespace-only paragraphs carry no text: drop them so that a story made
  # of nothing but empty <p> tags is reported as a failed scrape rather than
  # printed as a run of blank lines.
  readable = paragraphs.reject { |text| text.to_s.strip.empty? }

  if readable.empty?
    puts "\nFailed to scrape - use link above\n\n"
  else
    readable.each { |para| puts "#{para}\n\n" }
  end
end