Class: Arachni::Element::LinkTemplate

Inherits:
Base show all
Includes:
Capabilities::Analyzable, Capabilities::Auditable, Capabilities::Inputtable, Capabilities::WithDOM
Defined in:
lib/arachni/element/link_template.rb,
lib/arachni/element/link_template/dom.rb,
lib/arachni/element/link_template/capabilities/with_dom.rb,
lib/arachni/element/link_template/capabilities/auditable.rb,
lib/arachni/element/link_template/capabilities/inputtable.rb

Overview

Represents an auditable link element whose inputs have been extracted based on an externally provided template.

Defined Under Namespace

Modules: Capabilities Classes: DOM

Constant Summary collapse

INVALID_INPUT_DATA =
[
    # Protocol URLs require a // which we can't preserve.
    '://'
]

Constants included from Capabilities::Auditable

Capabilities::Auditable::OPTIONS

Constants included from Capabilities::Mutable

Capabilities::Mutable::EXTRA_NAME, Capabilities::Mutable::FUZZ_NAME, Capabilities::Mutable::FUZZ_NAME_VALUE, Capabilities::Mutable::MUTATION_OPTIONS

Constants included from Capabilities::Inputtable

Capabilities::Inputtable::INPUTTABLE_CACHE

Constants included from Capabilities::Analyzable::Differential

Capabilities::Analyzable::Differential::DIFFERENTIAL_OPTIONS

Constants included from Capabilities::Analyzable::Timeout

Capabilities::Analyzable::Timeout::TIMEOUT_OPTIONS

Constants included from Capabilities::Analyzable::Taint

Capabilities::Analyzable::Taint::TAINT_CACHE, Capabilities::Analyzable::Taint::TAINT_OPTIONS

Constants inherited from Base

Base::MAX_SIZE

Instance Attribute Summary collapse

Attributes included from Capabilities::Auditable

#audit_options

Attributes included from Capabilities::WithAuditor

#auditor

Attributes included from Capabilities::Mutable

#affected_input_name, #format, #seed

Attributes included from Capabilities::Inputtable

#default_inputs, #inputs

Attributes included from Capabilities::WithDOM

#dom, #skip_dom

Attributes included from Capabilities::Analyzable::Differential

#differential_analysis_options

Attributes included from Capabilities::Analyzable::Timeout

#timing_attack_remark_data

Attributes inherited from Base

#initialization_options, #page

Class Method Summary collapse

Instance Method Summary collapse

Methods included from Capabilities::Auditable

#audit, #audit_id, #audit_status_message, #audit_status_message_action, #audit_verbose_message, #coverage_hash, #coverage_id, #dup, #matches_skip_like_blocks?, #reset, reset, #skip?, skip_like

Methods included from Capabilities::WithAuditor

#dup, #marshal_dump, #orphan?, #prepare_for_report, #remove_auditor

Methods included from Capabilities::Mutable

#affected_input_value, #affected_input_value=, #dup, #each_mutation, #immutables, #inspect, #mutation?, #mutations, #reset, #switch_method, #to_h

Methods included from Capabilities::Submittable

#action, #action=, #dup, #http, #method, #method=, #platforms, #submit, #to_h

Methods included from Capabilities::Inputtable

#[], #[]=, #changes, #dup, #has_inputs?, #inputtable_id, #reset, #to_h, #try_input, #update, #valid_input_data?, #valid_input_name?, #valid_input_name_data?, #valid_input_value?, #valid_input_value_data?

Methods included from Utilities

#available_port, #bytes_to_kilobytes, #bytes_to_megabytes, #caller_name, #caller_path, #cookie_decode, #cookie_encode, #cookies_from_document, #cookies_from_file, #cookies_from_response, #exception_jail, #exclude_path?, #follow_protocol?, #form_decode, #form_encode, #forms_from_document, #forms_from_response, #full_and_absolute_url?, #generate_token, #get_path, #hms_to_seconds, #html_decode, #html_encode, #include_path?, #links_from_document, #links_from_response, #normalize_url, #page_from_response, #page_from_url, #parse_set_cookie, #path_in_domain?, #path_too_deep?, #port_available?, #rand_port, #random_seed, #redundant_path?, #regexp_array_match, #remove_constants, #request_parse_body, #seconds_to_hms, #skip_page?, #skip_path?, #skip_resource?, #skip_response?, #to_absolute, #uri_decode, #uri_encode, #uri_parse, #uri_parse_query, #uri_parser, #uri_rewrite

Methods included from Capabilities::WithDOM

#dup, #skip_dom?

Methods included from Capabilities::Analyzable

has_timeout_candidates?, reset, timeout_audit_run

Methods included from Capabilities::Analyzable::Differential

#differential_analysis, #dup, reset

Methods included from Capabilities::Analyzable::Timeout

add_phase_2_candidate, candidates_include?, deduplicate, deduplicate?, do_not_deduplicate, #dup, #ensure_responsiveness, has_candidates?, payload_delay_from_options, reset, run, #timeout_analysis, timeout_from_options, #timeout_id, #timing_attack_probe, #timing_attack_verify

Methods included from Capabilities::Analyzable::Taint

#taint_analysis

Methods inherited from Base

#==, #action, #dup, #hash, #marshal_dump, #marshal_load, #persistent_hash, #prepare_for_report, #reset, #to_h, #to_hash, too_big?, #type, #url, #url=

Methods included from Capabilities::WithScope

#scope

Constructor Details

#initialize(options) ⇒ LinkTemplate

Returns a new instance of LinkTemplate.

Parameters:

Options Hash (options):

  • :url (String)

    URL of the page which includes the link.

  • :action (String)

    Link URL – defaults to `:url`.

  • :inputs (Hash)

    Inputs as `name => value` pairs. If none have been provided, they will automatically be extracted from Capabilities::Submittable#action using the template.



50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
# File 'lib/arachni/element/link_template.rb', line 50

# Builds the element and resolves its template and inputs.
#
# Resolution order:
#
# 1. `options[:inputs]`, when given, is used as-is.
# 2. Otherwise, when `options[:template]` is given, inputs are extracted from
#    the action using only that template.
# 3. Otherwise, the default templates of {.extract_inputs} are tried and the
#    first matching one becomes this element's template.
#
# @param  [Hash]  options
#   Initialization options, forwarded to the parent initializer. This method
#   itself reads `:template` and `:inputs`.
def initialize( options )
    super( options )

    @template = options[:template]

    if options[:inputs]
        self.inputs = options[:inputs]
    elsif @template
        # The matched template is already known, only the inputs are needed.
        _matched, extracted = self.class.extract_inputs( self.action, [@template] )
        self.inputs = extracted if extracted
    else
        @template, extracted = self.class.extract_inputs( self.action )
        self.inputs = extracted if @template
    end

    # Fall back to no inputs and remember the initial state.
    self.inputs ||= {}
    @default_inputs = self.inputs.dup.freeze
end

Instance Attribute Details

#template ⇒ Regexp (readonly)

Returns the regular expression with named captures which serves as the template used to identify and manipulate inputs in Capabilities::Submittable#action.

Returns:



40
41
42
# File 'lib/arachni/element/link_template.rb', line 40

# Reader for the template associated with this element.
#
# @return [Regexp, nil]
#   Value of `@template`; `nil` when no template has been set.
def template
  @template
end

Class Method Details

.decode(*args) ⇒ Object



219
220
221
# File 'lib/arachni/element/link_template.rb', line 219

# Class-level decoder; delegates to `Link.decode`.
#
# @param  args
#   Arguments forwarded unchanged to `Link.decode`.
#
# @return [Object]
#   Whatever `Link.decode` returns.
def decode( *args )
    Link.decode( *args )
end

.encode(string) ⇒ Object



215
216
217
# File 'lib/arachni/element/link_template.rb', line 215

# Class-level encoder; delegates to `Link.encode`.
#
# @param  string
#   Value forwarded unchanged to `Link.encode`.
#
# @return [Object]
#   Whatever `Link.encode` returns.
def encode( string )
    Link.encode( string )
end

.extract_inputs(url, templates = Arachni::Options.audit.link_templates) ⇒ Array[Regexp, Hash]

Extracts inputs from a URL based on the given templates.

Parameters:

  • url (String)
  • templates (Array<Regexp>) (defaults to: Arachni::Options.audit.link_templates)

Returns:

  • (Array[Regexp, Hash])

    Matched template and inputs.



200
201
202
203
204
205
206
207
208
209
210
211
212
213
# File 'lib/arachni/element/link_template.rb', line 200

# Tries each template against the URL, in order, and returns the first one
# that yields any named groups, along with the decoded group values.
#
# @param  [String, nil]     url
# @param  [Array<Regexp>]   templates
#   Templates to try; evaluated in the given order.
#
# @return [Array]
#   `[template, inputs]` for the first matching template, where `inputs`
#   maps each group name to its decoded value; an empty array when `url` is
#   missing, `templates` is empty or nothing matched.
def extract_inputs( url, templates = Arachni::Options.audit.link_templates )
    return [] if !url || templates.empty?

    templates.each do |candidate|
        groups = url.scan_in_groups( candidate )
        next unless groups.any?

        decoded = groups.each_with_object( {} ) do |(name, value), inputs|
            inputs[name] = decode( value )
        end

        # First match wins.
        return [candidate, decoded]
    end

    []
end

.from_document(url, document, templates = Arachni::Options.audit.link_templates) ⇒ Array<LinkTemplate>

Extracts links with inputs from a document, based on the provided templates.

Parameters:

  • url (String)

    URL of the document – used for path normalization purposes.

  • document (String, Nokogiri::HTML::Document)
  • templates (Array<Regexp>) (defaults to: Arachni::Options.audit.link_templates)

Returns:



162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
# File 'lib/arachni/element/link_template.rb', line 162

# Builds one element per `<a>` node of the document that either matches one
# of the templates or carries DOM data.
#
# Anchors are skipped when their `href` is too big (per `too_big?`), cannot
# be converted to an absolute URL, match no template while also having no DOM
# data, or resolve to an out-of-scope URL.
#
# @param  [String]  url
#   URL of the document; used as the base for relative links unless the
#   document has a `<base href>`. It gets frozen when an element is created.
# @param  [String, Nokogiri::HTML::Document]  document
#   Anything that is not already a parsed document is parsed from its
#   `#to_s` value.
# @param  [Array<Regexp>]   templates
#
# @return [Array]
#   Created elements; empty when `templates` is empty.
def from_document( url, document, templates = Arachni::Options.audit.link_templates )
    return [] if templates.empty?

    unless document.is_a?( Nokogiri::HTML::Document )
        document = Nokogiri::HTML( document.to_s )
    end

    # Any failure to read a `<base href>` (including there not being one)
    # falls back to the document URL.
    base_url = begin
        document.search( '//base[@href]' )[0]['href']
    rescue
        url
    end

    document.search( '//a' ).each_with_object( [] ) do |anchor, elements|
        raw_href = anchor['href']
        next if too_big?( raw_href )

        href = to_absolute( raw_href, base_url )
        next unless href

        template, inputs = extract_inputs( href, templates )
        next unless template || self::DOM.data_from_node( anchor )

        parsed_url = Arachni::URI( href )
        next if parsed_url && parsed_url.scope.out?

        elements << new(
            url:      url.freeze,
            action:   href.freeze,
            inputs:   inputs || {},
            template: template,
            source:   anchor.to_html.freeze
        )
    end
end

.from_response(response, templates = Arachni::Options.audit.link_templates) ⇒ Array<LinkTemplate>

Extracts links from an HTTP response.

Parameters:

Returns:



134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
# File 'lib/arachni/element/link_template.rb', line 134

# Collects the elements found in the response body and, when the response
# URL itself matches a template, appends an element for that URL as well.
#
# @param  response
#   Object responding to `#url` and `#body`.
# @param  [Array<Regexp>]   templates
#
# @return [Array]
#   Result of {.from_document}, with the element for the response URL (if
#   any) appended last.
def from_response( response, templates = Arachni::Options.audit.link_templates )
    url      = response.url
    elements = from_document( url, response.body, templates )

    matched, inputs = extract_inputs( url, templates )
    return elements unless matched

    # The response URL is both the page and the action of this element.
    elements << new(
        url:      url.freeze,
        action:   url.freeze,
        inputs:   inputs,
        template: matched
    )

    elements
end

.from_rpc_data(data) ⇒ Object



115
116
117
118
119
120
121
122
123
124
125
126
# File 'lib/arachni/element/link_template.rb', line 115

# Converts the serialized template strings back into `Regexp` objects before
# handing the data to the parent implementation.
#
# Both `data['initialization_options']['template']` and `data['template']`
# are converted in place, when present. `Regexp.new` only receives the stored
# string, so the resulting expressions use default options.
#
# @param  [Hash]    data
#   RPC data; must contain an `'initialization_options'` Hash.
#
# @return [Object]
#   Whatever the parent implementation returns.
def from_rpc_data( data )
    [data['initialization_options'], data].each do |container|
        source = container['template']
        container['template'] = Regexp.new( source ) if source
    end

    super( data )
end

.type ⇒ Object



223
224
225
# File 'lib/arachni/element/link_template.rb', line 223

# Identifier for this kind of element.
#
# @return [Symbol]
#   Always `:link_template`.
def type
    :link_template
end

Instance Method Details

#decode(*args) ⇒ Object



95
96
97
# File 'lib/arachni/element/link_template.rb', line 95

# Instance-level convenience wrapper around the class-level `decode`.
#
# @param  args
#   Arguments forwarded unchanged to `self.class.decode`.
#
# @return [Object]
#   Whatever `self.class.decode` returns.
def decode( *args )
    self.class.decode( *args )
end

#encode(string) ⇒ Object



91
92
93
# File 'lib/arachni/element/link_template.rb', line 91

# Instance-level convenience wrapper around the class-level `encode`.
#
# @param  string
#   Value forwarded unchanged to `self.class.encode`.
#
# @return [Object]
#   Whatever `self.class.encode` returns.
def encode( string )
    self.class.encode( string )
end

#id ⇒ Object



99
100
101
# File 'lib/arachni/element/link_template.rb', line 99

# Identifier of the element, extended with the DOM inputs when DOM data is
# available.
#
# @return [String, Object]
#   The parent implementation's id when `dom_data` is falsy; otherwise that
#   id followed by `:` and the DOM inputs sorted by name.
def id
    data = dom_data
    return super unless data

    "#{super}:#{data[:inputs].sort_by { |name, _| name }}"
end

#simple ⇒ Hash

Returns a simple representation of self in the form of `{ Capabilities::Submittable#action => Capabilities::Inputtable#inputs }`.

Returns:



76
77
78
# File 'lib/arachni/element/link_template.rb', line 76

# Minimal representation of the element.
#
# @return [Hash]
#   Single-pair Hash mapping the action to the inputs.
def simple
    { action => inputs }
end

#to_rpc_data ⇒ Object



103
104
105
106
107
108
109
110
111
# File 'lib/arachni/element/link_template.rb', line 103

# Serializes the element for RPC transmission.
#
# When a template is set, its pattern is stored as a String (via
# `Regexp#source`, so without the expression's flags) under `'template'` and
# under `'initialization_options' => 'template'`, and the `'dom_data'` key is
# removed. Without a template the parent's data is returned untouched.
#
# @return [Hash]
def to_rpc_data
    data = super
    return data unless @template

    source = @template.source

    data['template'] = source
    data['initialization_options']['template'] = source
    data.delete( 'dom_data' )

    data
end

#to_s ⇒ String

Returns the URL updated with the configured Capabilities::Inputtable#inputs.

Returns:



82
83
84
85
86
87
88
89
# File 'lib/arachni/element/link_template.rb', line 82

# Renders the action with the current inputs substituted into the groups of
# the template.
#
# The action is returned unchanged when there are no inputs, or when no
# template is available: the initializer accepts `:inputs` without a
# `:template`, which leaves `@template` as `nil`, and a `nil` template cannot
# be used for substitution.
#
# @return [String]
#   Action with each input value encoded and placed in its template group.
def to_s
    return self.action if self.inputs.empty? || !@template

    encoded = inputs.each_with_object( {} ) do |(name, value), h|
        h[name] = encode( value )
    end

    self.action.sub_in_groups( @template, encoded )
end