class Ish::Crawler

Public Class Methods

google_first_result(text)
# File lib/ish/crawler.rb, line 4
# Runs a Google search for +text+ and fetches the page behind the first
# <cite> element found in the results markup.
#
# @param text [String] the search terms; sent via HTTParty's :query option so
#   spaces and reserved characters (&, #, ...) are URL-encoded
# @return [Hash] one of:
#   - { :url => nil }               when the results page has no <cite> element
#   - { :url => url }               when fetching the site raises an SSL error
#   - { :url => url, :html => body } when the site was fetched
def self.google_first_result text
  # NOTE(review): :verify => false disables TLS certificate verification for
  # both requests; kept as in the original behaviour, but worth revisiting.
  search = HTTParty.get( 'https://www.google.com/search', :query => { :q => text }, :verify => false )

  cite = Nokogiri::HTML(search.body).css('cite').first
  # No <cite> means there is no result to follow.
  return { :url => nil } unless cite

  website = cite.text.strip
  # Cite text may omit the scheme; default to https.
  website = "https://#{website}" unless website.start_with?('http')

  begin
    page = HTTParty.get( website, :verify => false )
  rescue OpenSSL::SSL::SSLError
    # The site was found but could not be fetched; report the URL only.
    return { :url => website }
  end

  { :url => website, :html => page.body }
end
look_for_emails(text)
# File lib/ish/crawler.rb, line 19
# Extracts every email-like substring from +text+.
#
# @param text [String, nil] arbitrary text (e.g. an HTML body); nil is treated
#   as an empty string
# @return [String, nil] the matches joined with commas, in order of
#   appearance, or nil when none are found
def self.look_for_emails text
  # Unanchored so addresses are found anywhere inside the text, and the
  # sub-domain group is non-capturing so String#scan yields whole matches
  # rather than the group's captures.
  email_regex = /[\w+\-.]+@[a-z\d\-]+(?:\.[a-z\d\-]+)*\.[a-z]+/i
  found = text.to_s.scan( email_regex )
  found.empty? ? nil : found.join(',')
end