Class: Miteru::Crawler

Inherits:
Object
  • Object
show all
Defined in:
lib/miteru/crawler.rb

Instance Attribute Summary collapse

Class Method Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize ⇒ Crawler

Returns a new instance of Crawler.



11
12
13
14
15
# File 'lib/miteru/crawler.rb', line 11

# Sets up the collaborators the crawler relies on: a Downloader built from
# the `download_to` setting of the global Miteru configuration, a Feeds
# instance and a Notifier.
def initialize
  download_to = Miteru.configuration.download_to

  @downloader = Downloader.new(download_to)
  @feeds = Feeds.new
  @notifier = Notifier.new
end

Instance Attribute Details

#downloader ⇒ Object (readonly)

Returns the value of attribute downloader.



9
10
11
# File 'lib/miteru/crawler.rb', line 9

# Read-only accessor for the downloader assigned in the constructor.
#
# @return [Downloader] the object stored in @downloader
def downloader
  @downloader
end

#feeds ⇒ Object (readonly)

Returns the value of attribute feeds.



9
10
11
# File 'lib/miteru/crawler.rb', line 9

# Read-only accessor for the feeds object assigned in the constructor.
#
# @return [Feeds] the object stored in @feeds
def feeds
  @feeds
end

Class Method Details

.execute ⇒ Object



51
52
53
# File 'lib/miteru/crawler.rb', line 51

# Class-level entry point: instantiates a crawler and runs it.
#
# @return [Object] whatever the instance-level #execute returns
def execute
  crawler = new
  crawler.execute
end

Instance Method Details

#auto_download? ⇒ Boolean

Returns:

  • (Boolean)


42
43
44
# File 'lib/miteru/crawler.rb', line 42

# Reports the `auto_download?` setting of the global Miteru configuration.
#
# @return [Boolean] the value returned by Miteru.configuration.auto_download?
def auto_download?
  settings = Miteru.configuration
  settings.auto_download?
end

#crawl(url) ⇒ Object



17
18
19
20
21
22
23
# File 'lib/miteru/crawler.rb', line 17

# Inspects a single URL. A Website is built for it; its kits are downloaded
# when the site has kits and auto-download is enabled, and a notification is
# sent when the site has kits or verbose mode is on.
#
# SSL, HTTP and invalid-URI errors raised along the way are swallowed and
# turned into a nil result instead of propagating to the caller.
#
# @param url the URL handed to Website.new (presumably a String)
# @return [Object, nil] the result of #notify when a notification was sent,
#   otherwise nil
def crawl(url)
  website = Website.new(url)

  if website.has_kits? && auto_download?
    downloader.download_kits(website.kits)
  end

  if website.has_kits? || verbose?
    notify(website)
  end
rescue OpenSSL::SSL::SSLError, HTTP::Error, Addressable::URI::InvalidURIError
  nil
end

#execute ⇒ Object



25
26
27
28
29
30
31
32
# File 'lib/miteru/crawler.rb', line 25

# Fetches the suspicious URLs from the feeds and crawls each of them through
# Parallel, using the configured number of threads. In verbose mode a summary
# line is printed before crawling starts.
#
# @return [Object] whatever Parallel.each returns
def execute
  targets = feeds.suspicious_urls

  if verbose?
    puts "Loaded #{targets.length} URLs to crawl. (crawling in #{threads} threads)"
  end

  Parallel.each(targets, in_threads: threads) { |target| crawl(target) }
end

#notify(website) ⇒ Object



38
39
40
# File 'lib/miteru/crawler.rb', line 38

# Hands a website's url, kits and message over to the notifier.
#
# @param website an object responding to #url, #kits and #message
# @return [Object] whatever the notifier's #notify returns
def notify(website)
  url = website.url
  kits = website.kits
  message = website.message

  @notifier.notify(url: url, kits: kits, message: message)
end

#threads ⇒ Object



34
35
36
# File 'lib/miteru/crawler.rb', line 34

# Thread count taken from the global Miteru configuration. The value is
# cached in @threads after the first truthy read.
#
# @return [Object] the value of Miteru.configuration.threads
def threads
  return @threads if @threads

  @threads = Miteru.configuration.threads
end

#verbose? ⇒ Boolean

Returns:

  • (Boolean)


46
47
48
# File 'lib/miteru/crawler.rb', line 46

# Reports the `verbose?` setting of the global Miteru configuration.
#
# @return [Boolean] the value returned by Miteru.configuration.verbose?
def verbose?
  settings = Miteru.configuration
  settings.verbose?
end