Class: Miteru::Crawler
- Inherits:
-
Object
- Object
- Miteru::Crawler
- Defined in:
- lib/miteru/crawler.rb
Instance Attribute Summary collapse
-
#downloader ⇒ Object
readonly
Returns the value of attribute downloader.
-
#feeds ⇒ Object
readonly
Returns the value of attribute feeds.
Class Method Summary collapse
- .execute ⇒ Object
Instance Method Summary collapse
- #auto_download? ⇒ Boolean
- #crawl(url) ⇒ Object
- #execute ⇒ Object
-
#initialize ⇒ Crawler
constructor
A new instance of Crawler.
- #notify(website) ⇒ Object
- #threads ⇒ Object
- #verbose? ⇒ Boolean
Constructor Details
#initialize ⇒ Crawler
Returns a new instance of Crawler.
11 12 13 14 15 |
# File 'lib/miteru/crawler.rb', line 11 def initialize @downloader = Downloader.new(Miteru.configuration.download_to) @feeds = Feeds.new @notifier = Notifier.new end |
Instance Attribute Details
#downloader ⇒ Object (readonly)
Returns the value of attribute downloader.
9 10 11 |
# File 'lib/miteru/crawler.rb', line 9 def downloader @downloader end |
#feeds ⇒ Object (readonly)
Returns the value of attribute feeds.
9 10 11 |
# File 'lib/miteru/crawler.rb', line 9 def feeds @feeds end |
Class Method Details
.execute ⇒ Object
51 52 53 |
# File 'lib/miteru/crawler.rb', line 51 def execute new.execute end |
Instance Method Details
#auto_download? ⇒ Boolean
42 43 44 |
# File 'lib/miteru/crawler.rb', line 42 def auto_download? Miteru.configuration.auto_download? end |
#crawl(url) ⇒ Object
17 18 19 20 21 22 23 |
# File 'lib/miteru/crawler.rb', line 17 def crawl(url) website = Website.new(url) downloader.download_kits(website.kits) if website.has_kits? && auto_download? notify(website) if website.has_kits? || verbose? rescue OpenSSL::SSL::SSLError, HTTP::Error, Addressable::URI::InvalidURIError => _e nil end |
#execute ⇒ Object
25 26 27 28 29 30 31 32 |
# File 'lib/miteru/crawler.rb', line 25 def execute suspicious_urls = feeds.suspicious_urls puts "Loaded #{suspicious_urls.length} URLs to crawl. (crawling in #{threads} threads)" if verbose? Parallel.each(suspicious_urls, in_threads: threads) do |url| crawl url end end |
#notify(website) ⇒ Object
38 39 40 |
# File 'lib/miteru/crawler.rb', line 38 def notify(website) @notifier.notify(url: website.url, kits: website.kits, message: website.message) end |
#threads ⇒ Object
34 35 36 |
# File 'lib/miteru/crawler.rb', line 34 def threads @threads ||= Miteru.configuration.threads end |
#verbose? ⇒ Boolean
46 47 48 |
# File 'lib/miteru/crawler.rb', line 46 def verbose? Miteru.configuration.verbose? end |