module Sites
Public Class Methods
get_html(p_url)
click to toggle source
# File lib/sites_module.rb, line 13 def self.get_html(p_url) if valid?(p_url) hash = {"User-Agent" => "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_4) AppleWebKit/534.57.5 (KHTML, like Gecko) Version/5.1.7 Safari/534.57.4", "allow_redirections"=>"safe"} source = open(p_url, hash){|f|f.read} page = Nokogiri::HTML(source) end end
get_site_name(url)
click to toggle source
# File lib/sites_module.rb, line 29 def self.get_site_name(url) full_url = URI.parse(url).host.downcase full_url.split(".")[1].downcase rescue URI::InvalidURIError "" end
valid?(url)
click to toggle source
# File lib/sites_module.rb, line 22 def self.valid?(url) uri = URI.parse(url) uri.kind_of?(URI::HTTP) rescue URI::InvalidURIError false end