Class: ETL::Parser::ApacheCombinedLogParser
- Includes:
- HttpTools
- Defined in:
- lib/etl/parser/apache_combined_log_parser.rb
Overview
Parser which can parser the Apache Combined Log Format as defined at httpd.apache.org/docs/2.2/logs.html
Instance Attribute Summary
Attributes inherited from Parser
Instance Method Summary collapse
- #each ⇒ Object
-
#initialize(source, options = {}) ⇒ ApacheCombinedLogParser
constructor
A new instance of ApacheCombinedLogParser.
- #parse(line) ⇒ Object
Methods included from HttpTools
Methods inherited from Parser
Constructor Details
#initialize(source, options = {}) ⇒ ApacheCombinedLogParser
Returns a new instance of ApacheCombinedLogParser.
7 8 9 |
# File 'lib/etl/parser/apache_combined_log_parser.rb', line 7 def initialize(source, ={}) super end |
Instance Method Details
#each ⇒ Object
11 12 13 14 15 16 17 |
# File 'lib/etl/parser/apache_combined_log_parser.rb', line 11 def each Dir.glob(file).each do |file| File.open(file).each_line do |line| yield parse(line) end end end |
#parse(line) ⇒ Object
19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 |
# File 'lib/etl/parser/apache_combined_log_parser.rb', line 19 def parse(line) # example line: 127.0.0.1 - frank [10/Oct/2000:13:55:36 -0700] "GET /apache_pb.gif HTTP/1.0" 200 2326 "http://www.example.com/start.html" "Mozilla/4.08 [en] (Win98; I ;Nav)" line =~ /^(\S+)\s(\S+)\s(\S+)\s\[([^\]]*)\]\s"([^"]*)"\s(\d*)\s(\d*)\s"([^"]*)"\s"([^"]*)"/ fields = { :ip_address => $1, :identd => $2, :user => $3, :timestamp => $4, :request => $5, :response_code => $6, :bytes => $7, :referrer => $8, :user_agent => $9, } #fields[:timestamp] =~ r%{(\d\d)/(\w\w\w)/(\d\d\d\d):(\d\d):(\d\d):(\d\d) -(\d\d\d\d)} d = Date._strptime(fields[:timestamp], '%d/%b/%Y:%H:%M:%S') unless fields[:timestamp].nil? fields[:timestamp] = Time.mktime(d[:year], d[:mon], d[:mday], d[:hour], d[:min], d[:sec], d[:sec_fraction]) unless d.nil? fields[:method], fields[:path] = fields[:request].split(/\s/) fields.merge!(parse_user_agent(fields[:user_agent])) unless fields[:user_agent].nil? fields.merge!(parse_uri(fields[:referrer], :prefix => 'referrer_')) fields.each do |key, value| fields[key] = nil if value == '-' end end |