Class: Fluent::Plugin::SolrOutput

Inherits:
Output
  • Object
show all
Defined in:
lib/fluent/plugin/out_solr.rb

Constant Summary collapse

DEFAULT_COLLECTION =
'collection1'
DEFAULT_IGNORE_UNDEFINED_FIELDS =
false
DEFAULT_STRING_FIELD_VALUE_MAX_LENGTH =
-1
DEFAULT_TAG_FIELD =
'tag'
DEFAULT_TIMESTAMP_FIELD =
'time'
DEFAULT_FLUSH_SIZE =
100
DEFAULT_BUFFER_TYPE =
"memory"
DEFAULT_COMMIT_WITH_FLUSH =
true
MODE_STANDALONE =
'Standalone'
MODE_SOLRCLOUD =
'SolrCloud'

Instance Method Summary collapse

Constructor Details

#initialize ⇒ SolrOutput

Returns a new instance of SolrOutput.



61
62
63
# File 'lib/fluent/plugin/out_solr.rb', line 61

# Returns a new instance of SolrOutput.
#
# All real setup is deferred: configuration is handled in #configure and
# connections are established in #start; this only delegates to the base
# class constructor.
def initialize
  super
end

Instance Method Details

#configure(conf) ⇒ Object

Raises:

  • (Fluent::ConfigError)


65
66
67
68
69
# File 'lib/fluent/plugin/out_solr.rb', line 65

# Configures the plugin from the parsed Fluentd configuration.
#
# Converts legacy (v0.12-style) inject parameters before delegating to
# the base class.
#
# @param conf [Fluent::Config::Element] parsed plugin configuration
# @raise [Fluent::ConfigError] when 'tag' is missing from chunk_keys —
#   #write reads the tag from each chunk's metadata, so per-tag chunking
#   is mandatory.
def configure(conf)
  compat_parameters_convert(conf, :inject)
  super
  # `unless` is the idiomatic form of `if not`.
  raise Fluent::ConfigError, "'tag' in chunk_keys is required." unless @chunk_key_tag
end

#format(tag, time, record) ⇒ Object



101
102
103
# File 'lib/fluent/plugin/out_solr.rb', line 101

# Serializes one event for buffering as a msgpack-encoded [time, record]
# pair; the tag is not stored per event (it is carried in the chunk key).
def format(tag, time, record)
  entry = [time, record]
  entry.to_msgpack
end

#formatted_to_msgpack_binary ⇒ Object



105
106
107
# File 'lib/fluent/plugin/out_solr.rb', line 105

# Tells Fluentd's buffering layer that #format already emits msgpack
# binary, so chunks can be consumed with msgpack_each (see #write).
def formatted_to_msgpack_binary
  true
end

#get_fields ⇒ Object



214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
# File 'lib/fluent/plugin/out_solr.rb', line 214

# Fetches the list of field names defined in the Solr schema, querying
# the per-collection endpoint when running in SolrCloud mode.
#
# @return [Array<String>, nil] schema field names, or nil when the
#   request fails (the error is logged as a warning).
def get_fields
  response = nil

  if @mode == MODE_STANDALONE then
    response = @solr.get 'schema/fields'
  elsif @mode == MODE_SOLRCLOUD then
    response = @solr.get 'schema/fields', collection: @collection
  end

  fields = response['fields'].map { |field| field['name'] }
  log.debug "Fields: #{fields}"

  return fields

  # Rescue StandardError, not Exception: rescuing Exception would also
  # swallow SignalException/SystemExit and prevent clean shutdown.
  rescue StandardError => e
    log.warn "An error occurred: #{e.message}"
end

#get_unique_key ⇒ Object



196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
# File 'lib/fluent/plugin/out_solr.rb', line 196

# Looks up the schema's unique key field name from Solr, querying the
# per-collection endpoint when running in SolrCloud mode.
#
# @return [String, nil] the uniqueKey field name, or nil when the
#   request fails (the error is logged as a warning).
def get_unique_key
  response = nil

  if @mode == MODE_STANDALONE then
    response = @solr.get 'schema/uniquekey'
  elsif @mode == MODE_SOLRCLOUD then
    response = @solr.get 'schema/uniquekey', collection: @collection
  end

  unique_key = response['uniqueKey']
  log.debug "Unique key: #{unique_key}"

  return unique_key

  # Rescue StandardError, not Exception: rescuing Exception would also
  # swallow SignalException/SystemExit and prevent clean shutdown.
  rescue StandardError => e
    log.warn "An error occurred: #{e.message}"
end

#multi_workers_ready? ⇒ Boolean

Returns:

  • (Boolean)


109
110
111
# File 'lib/fluent/plugin/out_solr.rb', line 109

# Declares that this plugin is safe to run under Fluentd multi-worker
# deployments.
#
# @return [Boolean] always true
def multi_workers_ready?
  true
end

#shutdown ⇒ Object



93
94
95
96
97
98
99
# File 'lib/fluent/plugin/out_solr.rb', line 93

# Shuts the plugin down, closing the ZooKeeper connection when one was
# opened for SolrCloud mode (it stays nil in standalone mode).
def shutdown
  super

  @zk.close unless @zk.nil?
end

#start ⇒ Object



71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
# File 'lib/fluent/plugin/out_solr.rb', line 71

# Starts the plugin and opens the Solr connection.
#
# The operating mode is inferred from which connection parameter is set:
# a direct Solr URL selects standalone mode, a ZooKeeper host selects
# SolrCloud mode (URL wins when both are configured).
def start
  super

  # `if @url` replaces the non-idiomatic `if ! @url.nil?`; the config
  # values are strings or nil, so truthiness is equivalent here.
  @mode = nil
  if @url then
    @mode = MODE_STANDALONE
  elsif @zk_host
    @mode = MODE_SOLRCLOUD
  end

  @solr = nil
  @zk = nil

  if @mode == MODE_STANDALONE then
    @solr = RSolr.connect :url => @url
  elsif @mode == MODE_SOLRCLOUD then
    # SolrCloud: discover live nodes via ZooKeeper; @zk is closed in
    # #shutdown.
    @zk = ZK.new(@zk_host)
    cloud_connection = RSolr::Cloud::Connection.new(@zk)
    @solr = RSolr::Client.new(cloud_connection, read_timeout: 60, open_timeout: 60)
  end
end

#update(documents) ⇒ Object



184
185
186
187
188
189
190
191
192
193
194
# File 'lib/fluent/plugin/out_solr.rb', line 184

# Indexes a batch of documents into Solr, optionally committing with the
# flush (controlled by @commit_with_flush).
#
# @param documents [Array<Hash>] Solr documents to add
def update(documents)
  if @mode == MODE_STANDALONE then
    @solr.add documents, :params => {:commit => @commit_with_flush}
    # Interpolation for consistency with the SolrCloud branch (the
    # original mixed `%`-formatting and interpolation).
    log.debug "Added #{documents.count} document(s) to Solr"
  elsif @mode == MODE_SOLRCLOUD then
    @solr.add documents, collection: @collection, :params => {:commit => @commit_with_flush}
    log.debug "Added #{documents.count} document(s) to Solr"
  end
  # Rescue StandardError, not Exception: rescuing Exception would also
  # swallow SignalException/SystemExit and prevent clean shutdown.
  rescue StandardError => e
    log.warn "Update: An error occurred while indexing: #{e.message}"
end

#write(chunk) ⇒ Object



113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
# File 'lib/fluent/plugin/out_solr.rb', line 113

# Writes a buffered chunk to Solr.
#
# Resolves the target schema (field list and unique key) from explicit
# configuration or by querying Solr, normalizes each buffered event into
# a Solr document, and indexes in batches of @flush_size.
#
# @param chunk [Fluent::Plugin::Buffer::Chunk] buffer chunk; 'tag' must
#   be among the chunk keys (enforced in #configure), so the tag is read
#   from the chunk metadata.
def write(chunk)
  documents = []

  # Explicit configuration wins; otherwise ask Solr for the schema.
  @fields = @defined_fields.nil? ? get_fields : @defined_fields
  @unique_key = @unique_key_field.nil? ? get_unique_key : @unique_key_field

  # FIX: original read `chunk..tag` (a Range literal — a NameError at
  # runtime); per-tag chunking means the tag lives in chunk.metadata.
  tag = chunk.metadata.tag
  chunk.msgpack_each do |time, record|
    record = inject_values_to_record(tag, time, record)

    # Every document needs a unique key; generate one when absent.
    record[@unique_key] = SecureRandom.uuid unless record.key?(@unique_key)

    # Preserve the originating tag on the document.
    record[@tag_field] = tag unless record.key?(@tag_field)

    # Normalize the timestamp field to Solr's ISO-8601 UTC format. An
    # existing value is expected in Apache common-log format
    # ("%d/%b/%Y:%H:%M:%S %z"); if parsing fails, or the field is
    # missing, fall back to the event time.
    if record.key?(@timestamp_field)
      begin
        event_timestamp_dt = DateTime.strptime(record[@timestamp_field], "%d/%b/%Y:%H:%M:%S %z").to_s
        record[@timestamp_field] = Time.parse(event_timestamp_dt.to_s).utc.strftime('%FT%TZ')
      rescue StandardError
        record[@timestamp_field] = Time.at(time).utc.strftime('%FT%TZ')
      end
    else
      record[@timestamp_field] = Time.at(time).utc.strftime('%FT%TZ')
    end

    # Drop fields not present in the Solr schema when requested.
    # keep_if avoids the original's delete-while-iterating on the hash.
    record.keep_if { |key, _| @fields.include?(key) } if @ignore_undefined_fields

    # Truncate over-long string values, including string elements inside
    # array-valued fields.
    # NOTE(review): as in the original, non-String elements of an array
    # value are silently dropped here — confirm that is intended.
    if @string_field_value_max_length >= 0
      record.keys.each do |key|
        value = record[key]
        if value.instance_of?(Array)
          kept = []
          value.each do |element|
            next unless element.instance_of?(String)
            if element.length > @string_field_value_max_length
              log.warn "#{key} is too long (#{element.length}, max is #{@string_field_value_max_length})."
              kept.push(element.slice(0, @string_field_value_max_length))
            else
              kept.push(element)
            end
          end
          record[key] = kept
        elsif value.instance_of?(String)
          if value.length > @string_field_value_max_length
            log.warn "#{key} is too long (#{value.length}, max is #{@string_field_value_max_length})."
            record[key] = value.slice(0, @string_field_value_max_length)
          end
        end
      end
    end

    documents << record

    # Index in batches to bound memory usage.
    if documents.count >= @flush_size
      update documents
      documents.clear
    end
  end

  update documents unless documents.empty?
end