Class: Arachni::RPC::Server::Spider

# File 'lib/arachni/rpc/server/spider.rb', line 39

# Builds the spider for the given framework.
#
# The framework's `opts` are forwarded to the parent initializer and the
# framework itself is retained for later use.
#
# @param framework [Object]
#   Object responding to `opts`; kept in `@framework`.
def initialize( framework )
    super( framework.opts )

    @framework = framework

    # Peer bookkeeping -- starts out empty.
    @peers = {}

    # Any URL without a recorded signal reads as `true`.
    # NOTE(review): presumably so that peers which were never handed work
    # count as finished -- confirm against the code which reads this Hash.
    @done_signals = Hash.new( true )

    @distribution_filter = Support::LookUp::Moolb.new

    # Callbacks collected by #on_first_run and #after_each_run.
    @on_first_run_blocks   = []
    @after_each_run_blocks = []
end

Instance Method Details

#after_each_run(&block) ⇒ `Object`

Parameters:

block (Block) —

Block to be called after each URL batch has been consumed.



58
59
60

# File 'lib/arachni/rpc/server/spider.rb', line 58

# Registers a callback to be called after each URL batch has been consumed.
#
# @param block [Block]
#   Callback to append to the list of after-each-run callbacks.
#
# @return [Array]
#   The updated list of registered callbacks.
def after_each_run( &block )
    @after_each_run_blocks.push( block )
end

#clear_distribution_filter ⇒ `Object`



52
53
54

# File 'lib/arachni/rpc/server/spider.rb', line 52

# Empties the distribution filter by calling `clear` on it.
#
# @return [Object]
#   Whatever the filter's `clear` returns.
def clear_distribution_filter
    @distribution_filter.clear
end

#local_sitemap ⇒ `Hash<String, Integer>`

Returns URLs crawled by this Instance, along with their HTTP status codes.

Returns:

(Hash<String, Integer>) —

URLs crawled by this Instance, along with their HTTP status codes.



137
138
139

# File 'lib/arachni/rpc/server/spider.rb', line 137

# Exposes the sitemap held by this Instance (the `@sitemap` variable).
#
# @return [Hash<String, Integer>]
#   URLs crawled by this Instance, along with their HTTP status codes.
def local_sitemap
    @sitemap
end

#on_first_run(&block) ⇒ `Object`

Parameters:

block (Block) —

Block to be called just before the crawl starts.



64
65
66

# File 'lib/arachni/rpc/server/spider.rb', line 64

# Registers a callback to be called just before the crawl starts.
#
# @param block [Block]
#   Callback to append to the list of first-run callbacks.
#
# @return [Array]
#   The updated list of registered callbacks.
def on_first_run( &block )
    @on_first_run_blocks.push( block )
end

#peer_done(url) ⇒ `Object`

Sets a peer crawler’s state to finished. Exposed so that peers can signal the master once they’re done.

Parameters:

url (String) —

URL of the finished peer.

# File 'lib/arachni/rpc/server/spider.rb', line 152

# Marks the peer crawler identified by `url` as finished and then runs the
# master's done handler. Exposed so that peers can signal the master once
# they're done.
#
# @param url [String]
#   URL of the finished peer.
#
# @return [true]
def peer_done( url )
    @done_signals.store( url, true )
    master_done_handler
    true
end

#run(*args) ⇒ `Object`

#signal_if_done(master) ⇒ `Object`

Signals the `master` Instance that this crawler has finished.

Parameters:

master (Arachni::RPC::Client::Instance)

# File 'lib/arachni/rpc/server/spider.rb', line 163

# Signals the `master` Instance that this crawler has finished; does nothing
# unless `done?` is true.
#
# @param master [Arachni::RPC::Client::Instance]
#   Client whose `spider.peer_done` is called with this Instance's URL.
#
# @return [Object, nil]
#   `nil` when not done, otherwise whatever the `peer_done` call returns.
def signal_if_done( master )
    return unless done?

    master_spider = master.spider
    # An empty block is passed along with the call.
    # NOTE(review): presumably makes the RPC call asynchronous -- confirm.
    master_spider.peer_done( framework.multi_self_url ) {}
end

#sitemap ⇒ `Array<String>`

Returns Crawled URLs.

Returns:

(Array<String>) —

Crawled URLs.



142
143
144

# File 'lib/arachni/rpc/server/spider.rb', line 142

# Returns the crawled URLs, preferring `@distributed_sitemap` when it is set
# and deferring to the parent implementation otherwise.
#
# @return [Array<String>]
#   Crawled URLs.
def sitemap
    return @distributed_sitemap if @distributed_sitemap

    super
end

#update_peers(peers, &block) ⇒ `Object`

Updates the list of Instances to assist in the crawl.

Parameters:

peers (Array<Hash>) —

Array containing Instance info hashes – with `:url` and `:token` at least.
block (Block) —

Block to be called once the update operation has completed.

# File 'lib/arachni/rpc/server/spider.rb', line 103

# Updates the list of Instances to assist in the crawl.
#
# Connects to every given peer, adds this Instance itself under its own URL
# and stores the result sorted by URL. When `master?` is true the peer list
# (plus this Instance's own info) is also pushed to every peer via
# `map_peers`.
#
# @param peers [Array<Hash>]
#   Instance info hashes -- with `:url` and `:token` at least.
# @param block [Block]
#   Called once the update operation has completed.
#
# @return [true]
def update_peers( peers, &block )
    @peers_array = peers

    # Map each peer URL to a client connected to that peer.
    connections = @peers_array.each_with_object( {} ) do |info, by_url|
        by_url[info[:url]] = framework.connect_to_instance( info )
    end
    @peers = Hash[connections.sort]

    # This Instance is part of the peer list too, represented by the
    # framework itself rather than by a client.
    @peers[framework.multi_self_url] = framework

    # Re-sort so that the entry just added lands in URL order as well.
    @peers = Hash[@peers.sort]

    @peer_urls    = @peers.keys
    @peer_clients = @peers.values

    notify_caller = proc { block.call if block }

    # Only the master goes on to propagate the list to the peers.
    unless master?
        notify_caller.call
        return true
    end

    propagate = proc do |peer, iterator|
        peer.spider.update_peers( @peers_array | [self_instance_info] ) do
            iterator.return
        end
    end

    map_peers( propagate, notify_caller )

    true
end

Class: Arachni::RPC::Server::Spider

Overview

Constant Summary collapse

Constants inherited from Spider

Instance Attribute Summary

Attributes inherited from Spider

Instance Method Summary collapse

Methods inherited from Spider

Methods included from Utilities

Methods included from UI::Output

Constructor Details

#initialize(framework) ⇒ Spider

Instance Method Details

#after_each_run(&block) ⇒ Object

#clear_distribution_filter ⇒ Object

#local_sitemap ⇒ Hash<String, Integer>

#on_first_run(&block) ⇒ Object

#peer_done(url) ⇒ Object

#run(*args) ⇒ Object

#signal_if_done(master) ⇒ Object

#sitemap ⇒ Array<String>

#update_peers(peers, &block) ⇒ Object

#initialize(framework) ⇒ `Spider`

#after_each_run(&block) ⇒ `Object`

#clear_distribution_filter ⇒ `Object`

#local_sitemap ⇒ `Hash<String, Integer>`

#on_first_run(&block) ⇒ `Object`

#peer_done(url) ⇒ `Object`

#run(*args) ⇒ `Object`

#signal_if_done(master) ⇒ `Object`

#sitemap ⇒ `Array<String>`

#update_peers(peers, &block) ⇒ `Object`