Class: FindRecipe::Scraper
- Inherits:
-
Object
- Object
- FindRecipe::Scraper
- Defined in:
- lib/find_recipe/scraper.rb
Constant Summary collapse
- ROOT_URL =
"https://cookpad.com"
Class Method Summary collapse
- .get_individual_recipe_page(recipe_url) ⇒ Object
- .get_recipe_page_from_keyword(keyword) ⇒ Object
- .get_trending_recipes_page ⇒ Object
- .open_url(url) ⇒ Object
- .scrape_individual_recipe_data(recipe_url) ⇒ Object
- .scrape_search_page(keyword) ⇒ Object
- .scrape_trending_recipes_page ⇒ Object
Class Method Details
.get_individual_recipe_page(recipe_url) ⇒ Object
53 54 55 |
# File 'lib/find_recipe/scraper.rb', line 53 def self.get_individual_recipe_page(recipe_url) open_url(recipe_url) end |
.get_recipe_page_from_keyword(keyword) ⇒ Object
48 49 50 51 |
# File 'lib/find_recipe/scraper.rb', line 48 def self.get_recipe_page_from_keyword(keyword) url = ROOT_URL + "/uk/search/#{keyword}" open_url(url) end |
.get_trending_recipes_page ⇒ Object
43 44 45 46 |
# File 'lib/find_recipe/scraper.rb', line 43 def self.get_trending_recipes_page url = ROOT_URL + "/uk/trending" open_url(url) end |
.open_url(url) ⇒ Object
57 58 59 |
# File 'lib/find_recipe/scraper.rb', line 57 def self.open_url(url) Nokogiri::HTML(open(url)) end |
.scrape_individual_recipe_data(recipe_url) ⇒ Object
28 29 30 31 32 33 34 35 36 37 38 39 40 41 |
# File 'lib/find_recipe/scraper.rb', line 28 def self.scrape_individual_recipe_data(recipe_url) recipe_data = {} recipe_page = self.get_individual_recipe_page(recipe_url) recipe_data[:description] = recipe_page.at("meta[itemprop='description']")['content'] # Gets ingredients as an array of each ingredient recipe_data[:ingredients] = recipe_page.css(".ingredient__details").collect { |ingredient| ingredient.text.strip } # Gets steps as an array of each step recipe_data[:steps] = recipe_page.css(".step .prose").collect { |step| step.text.strip } recipe_data end |
.scrape_search_page(keyword) ⇒ Object
16 17 18 19 20 21 22 23 24 25 26 |
# File 'lib/find_recipe/scraper.rb', line 16 def self.scrape_search_page(keyword) recipe_page = self.get_recipe_page_from_keyword(keyword) recipe_cards = recipe_page.css("li.wide-card") recipe_cards.collect do |card| recipe = { name: card.css("h2.recipe-title span").text.strip, url: ROOT_URL + card.css("a.media").attribute("href").value } end end |
.scrape_trending_recipes_page ⇒ Object
4 5 6 7 8 9 10 11 12 13 14 |
# File 'lib/find_recipe/scraper.rb', line 4 def self.scrape_trending_recipes_page recipe_page = self.get_trending_recipes_page recipe_cards = recipe_page.css(".card.feed__card") recipe_cards.collect do |card| recipe = { name: card.css("h2.recipe-title").text.strip, url: ROOT_URL + card.css("a.link-unstyled").attribute("href").value } end.uniq end |