class MovieScraper
Constants
- BASE_RT_URL
Attributes
movie[RW]
Public Instance Methods
get_main_page()
click to toggle source
# File lib/movie_scraper.rb, line 11 def get_main_page doc = Nokogiri::HTML(open('https://www.rottentomatoes.com/top/bestofrt/')) end
new_with_attributes()
click to toggle source
# File lib/movie_scraper.rb, line 15 def new_with_attributes self.get_main_page.css(".table tr").drop(1).each do |row| movie = DustinAndersonCLIApp::Movie.new movie.rank = row.css(".bold").text.delete!(".") movie.rating = row.css(".tMeterScore").text.gsub!(/\u00A0/, "") movie.title = row.css(".unstyled").text movie.title.strip! movie.reviews = row.css(".right").text link = row.css("a").attribute("href").value.sub("/", "") details_doc = BASE_RT_URL + link open_details_doc = Nokogiri::HTML(open(details_doc)) movie.summary = open_details_doc.css(".movie_synopsis").text.strip! movie.parental = open_details_doc.css(".meta-value").first.text movie.genre = open_details_doc.css(".meta-value a").first.text.strip! movie.theatre_date = open_details_doc.css(".meta-value time").first.text movie.studio = open_details_doc.css("div.meta-value").last.text.strip end DustinAndersonCLIApp::Movie.all end