# encoding: utf-8
require "logstash/namespace"
require "logstash/environment"
require "logstash/outputs/base"
require "logstash/outputs/amazon_es/http_client"
require "logstash/json"
require "concurrent"
require "stud/buffer"
require "socket"
require "thread"
require "uri"

# This output plugin emits data to Amazon Elasticsearch and supports signing requests with AWS Signature Version 4.
#
# The configuration and experience are similar to the logstash-output-elasticsearch plugin, with Signature V4 signing added on top.
# Some of the defaults, such as connection timeouts, have been tuned for optimal performance with Amazon Elasticsearch.
#
# ==== Retry Policy
#
# This plugin uses the same retry policy as logstash-output-elasticsearch. It uses the bulk API to optimize its
# imports into Elasticsearch. These requests may experience either partial or total failures.
# Events are retried if they fail due to either a network error or one of the status codes
# 429 (the server is busy), 409 (version conflict), or 503 (temporary overloading/maintenance).
#
# The retry policy's logic can be described as follows:
#
# - Block and retry all events in the bulk response that experience transient network exceptions until
#   a successful submission is received by Elasticsearch.
# - Retry the subset of sent events which resulted in ES errors of a retryable nature.
# - Events which returned retryable error codes will be pushed onto a separate queue for
#   retrying. Events in this queue will be retried a maximum of 3 times by default (configurable through :max_retries).
#   The size of this queue is capped by the value set in :retry_max_items.
# - Events from the retry queue are submitted again either when the queue reaches its max size or when
#   the max interval time is reached. The max interval time is configurable via :retry_max_interval.
# - Events which are not retryable or have reached their max retry count are logged to stderr.
class LogStash::Outputs::AmazonES < LogStash::Outputs::Base
  attr_reader :client

  include Stud::Buffer
  RETRYABLE_CODES = [409, 429, 503]
  SUCCESS_CODES = [200, 201]

  config_name "amazon_es"

  # The index to write events to. This can be dynamic using the `%{foo}` syntax.
  # The default value will partition your indices by day so you can more easily
  # delete old data or only search specific date ranges.
  # Indexes may not contain uppercase characters.
  # For weekly indexes ISO 8601 format is recommended, e.g. logstash-%{+xxxx.ww}
  config :index, :validate => :string, :default => "logstash-%{+YYYY.MM.dd}"

  # The index type to write events to. Generally you should try to write only
  # similar events to the same 'type'. String expansion `%{foo}` works here.
  #
  # Deprecated in favor of the `document_type` field.
  config :index_type, :validate => :string, :deprecated => "Please use the 'document_type' setting instead. It has the same effect, but is more appropriately named."

  # The document type to write events to. Generally you should try to write only
  # similar events to the same 'type'. String expansion `%{foo}` works here.
  # Unless you set 'document_type', the event 'type' will be used if it exists;
  # otherwise the document type will be assigned the value of 'logs'.
  config :document_type, :validate => :string
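  # As a sketch of the `%{foo}` expansion described above (the field names and
  # values are illustrative, not defaults):
  #
  #     output {
  #       amazon_es {
  #         index => "%{appname}-%{+xxxx.ww}"            # weekly index per application
  #         document_type => "%{[@metadata][doc_type]}"  # per-event document type
  #       }
  #     }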
  # Starting in Logstash 1.3 (unless you set option `manage_template` to false)
  # a default mapping template for Elasticsearch will be applied, if you do not
  # already have one set to match the index pattern defined (default of
  # `logstash-%{+YYYY.MM.dd}`), minus any variables. For example, in this case
  # the template will be applied to all indices starting with `logstash-*`.
  #
  # If you have dynamic templating (e.g. creating indices based on field names)
  # then you should set `manage_template` to false and use the REST API to upload
  # your templates manually.
  config :manage_template, :validate => :boolean, :default => true

  # This configuration option defines how the template is named inside Elasticsearch.
  # Note that if you have used the template management features and subsequently
  # change this, you will need to prune the old template manually, e.g.
  #
  # `curl -XDELETE `
  #
  # where `OldTemplateName` is whatever the former setting was.
  config :template_name, :validate => :string, :default => "logstash"

  # You can set the path to your own template here, if you so desire.
  # If not set, the included template will be used.
  config :template, :validate => :path

  # Overwrite the current template with whatever is configured
  # in the `template` and `template_name` directives.
  config :template_overwrite, :validate => :boolean, :default => false

  # The document ID for the index. Useful for overwriting existing entries in
  # Elasticsearch with the same ID.
  config :document_id, :validate => :string

  # A routing override to be applied to all processed events.
  # This can be dynamic using the `%{foo}` syntax.
  config :routing, :validate => :string

  # Set the endpoint of your Amazon Elasticsearch domain. This will always be an array
  # of size 1, e.g. ["foo.us-east-1.es.amazonaws.com"]
  config :hosts, :validate => :array

  # You can set the remote port as part of the host, or explicitly here as well
  config :port, :validate => :string, :default => 80

  # Signing-specific details
  config :region, :validate => :string, :default => "us-east-1"

  # aws_access_key_id and aws_secret_access_key.
  # The credential resolution logic is as follows:
  #
  # - User-supplied aws_access_key_id and aws_secret_access_key in the plugin configuration
  # - Environment variables AWS_ACCESS_KEY_ID and AWS_SECRET_ACCESS_KEY
  #   (RECOMMENDED since they are recognized by all the AWS SDKs and the CLI except for .NET),
  #   or AWS_ACCESS_KEY and AWS_SECRET_KEY (only recognized by the Java SDK)
  # - Credential profiles file at the default location (~/.aws/credentials) shared by all AWS SDKs and the AWS CLI
  # - Instance profile credentials delivered through the Amazon EC2 metadata service
  config :aws_access_key_id, :validate => :string
  config :aws_secret_access_key, :validate => :string

  # This plugin uses the bulk index API for improved indexing performance.
  # To make efficient bulk API calls, we buffer a certain number of
  # events before flushing them to Elasticsearch. This setting
  # controls how many events will be buffered before sending a batch
  # of events.
  config :flush_size, :validate => :number, :default => 500

  # The amount of time since the last flush before a flush is forced.
  #
  # This setting helps ensure slow event rates don't get stuck in Logstash.
  # For example, if your `flush_size` is 100, and you have received 10 events,
  # and it has been more than `idle_flush_time` seconds since the last flush,
  # Logstash will flush those 10 events automatically.
  #
  # This helps keep both fast and slow log streams moving along in
  # near-real-time.
  config :idle_flush_time, :validate => :number, :default => 1
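  # A minimal end-to-end example of this output (every value below is
  # illustrative, not a default; the static credentials can be omitted to fall
  # back on the resolution chain described above):
  #
  #     output {
  #       amazon_es {
  #         hosts => ["foo.us-east-1.es.amazonaws.com"]
  #         region => "us-east-1"
  #         aws_access_key_id => "ACCESS_KEY"
  #         aws_secret_access_key => "SECRET_KEY"
  #         index => "production-logs-%{+YYYY.MM.dd}"
  #         flush_size => 500
  #       }
  #     }
  #
  # With the defaults above, a bulk request is sent as soon as 500 events have
  # accumulated, or roughly one second after the last flush, whichever comes first.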
  # The Elasticsearch action to perform. Valid actions are: `index`, `delete`, `create`, `update`.
  #
  # Use of this setting *REQUIRES* you also configure the `document_id` setting
  # because `delete` actions all require a document id.
  #
  # What does each action do?
  #
  # - index: indexes a document (an event from Logstash).
  # - delete: deletes a document by id
  # - create: indexes a document, fails if a document by that id already exists in the index.
  # - update: updates a document by id
  #
  # For more details on actions, check out the http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/docs-bulk.html[Elasticsearch bulk API documentation]
  config :action, :validate => %w(index delete create update), :default => "index"

  # Username and password for HTTP basic authentication (works with both HTTP and HTTPS).
  config :user, :validate => :string
  config :password, :validate => :password

  # HTTP path at which the Elasticsearch server lives. Use this if you must run ES behind a proxy
  # that remaps the root path of the Elasticsearch HTTP API.
  config :path, :validate => :string, :default => "/"

  # Set the maximum number of retries for each event
  config :max_retries, :validate => :number, :default => 3

  # Set the maximum number of events allowed in the retry queue (see the Retry Policy above)
  config :retry_max_items, :validate => :number, :default => 5000

  # Set the maximum interval between bulk retries
  config :retry_max_interval, :validate => :number, :default => 5

  # Set the address of a forward HTTP proxy. Must be used with the 'http' protocol.
  # Can be either a string, such as 'http://localhost:123', or a hash in the form
  # {host: 'proxy.org', port: 80, scheme: 'http'}.
  # Note, this is NOT a SOCKS proxy, but a plain HTTP proxy.
  config :proxy

  # Enable doc_as_upsert for update mode:
  # create a new document from the event source if document_id doesn't exist
  config :doc_as_upsert, :validate => :boolean, :default => false

  # Set upsert content for update mode:
  # create a new document with this parameter as its JSON string if document_id doesn't exist
  config :upsert, :validate => :string, :default => ""
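  # As a sketch of `update` mode (the document_id field below is illustrative):
  # each event is applied as an update to the document with that id, and with
  # doc_as_upsert enabled the event is indexed as a new document when no
  # document with that id exists yet:
  #
  #     output {
  #       amazon_es {
  #         hosts => ["foo.us-east-1.es.amazonaws.com"]
  #         action => "update"
  #         document_id => "%{request_id}"
  #         doc_as_upsert => true
  #       }
  #     }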
  public
  def register
    @hosts = Array(@hosts)
    # retry-specific variables
    @retry_flush_mutex = Mutex.new
    @retry_teardown_requested = Concurrent::AtomicBoolean.new(false)
    # signaled when the retry queue needs flushing (on the retry interval or when full)
    @retry_queue_needs_flushing = ConditionVariable.new
    @retry_queue_not_full = ConditionVariable.new
    @retry_queue = Queue.new
    @submit_mutex = Mutex.new

    client_settings = {}
    common_options = {
      :client_settings => client_settings
    }

    client_settings[:path] = "/#{@path}/".gsub(/\/+/, "/") # Normalize slashes
    @logger.debug? && @logger.debug("Normalizing http path", :path => @path, :normalized => client_settings[:path])

    if @hosts.nil? || @hosts.empty?
      @logger.info("No 'hosts' set in elasticsearch output. Defaulting to localhost")
      @hosts = ["localhost"]
    end

    client_settings.merge! setup_proxy()
    common_options.merge! setup_basic_auth()

    # Update API setup; these options only apply when the action is 'update'
    update_options = {
      :upsert => @upsert,
      :doc_as_upsert => @doc_as_upsert
    }
    common_options.merge! update_options if @action == 'update'

    @client = LogStash::Outputs::AES::HttpClient.new(
      common_options.merge(:hosts => @hosts,
                           :port => @port,
                           :region => @region,
                           :aws_access_key_id => @aws_access_key_id,
                           :aws_secret_access_key => @aws_secret_access_key)
    )

    if @manage_template
      begin
        @logger.info("Automatic template management enabled", :manage_template => @manage_template.to_s)
        @client.template_install(@template_name, get_template, @template_overwrite)
      rescue => e
        @logger.error("Failed to install template: #{e.message}")
      end
    end

    @logger.info("New Elasticsearch output", :hosts => @hosts, :port => @port)

    @client_idx = 0

    buffer_initialize(
      :max_items => @flush_size,
      :max_interval => @idle_flush_time,
      :logger => @logger
    )

    # Periodically signal the retry thread so queued events are flushed even
    # when the retry queue never fills up.
    @retry_timer_thread = Thread.new do
      loop do
        sleep(@retry_max_interval)
        @retry_flush_mutex.synchronize { @retry_queue_needs_flushing.signal }
      end
    end

    @retry_thread = Thread.new do
      while @retry_teardown_requested.false?
        @retry_flush_mutex.synchronize { @retry_queue_needs_flushing.wait(@retry_flush_mutex) }
        retry_flush
      end
    end
  end # def register

  public
  def get_template
    if @template.nil?
      @template = ::File.expand_path('amazon_es/elasticsearch-template.json', ::File.dirname(__FILE__))
      if !File.exists?(@template)
        raise "You must specify 'template => ...' in your elasticsearch output (I looked for '#{@template}')"
      end
    end
    template_json = IO.read(@template).gsub(/\n/, '')
    template = LogStash::Json.load(template_json)
    @logger.info("Using mapping template", :template => template)
    return template
  end # def get_template

  public
  def receive(event)
    return unless output?(event)

    # Block until we have not maxed out our
    # retry queue. This is applying back-pressure
    # to slow down the receive-rate.
    @retry_flush_mutex.synchronize {
      @retry_queue_not_full.wait(@retry_flush_mutex) while @retry_queue.size > @retry_max_items
    }

    event['@metadata']['retry_count'] = 0

    # Set the 'type' value for the index.
    type = if @document_type
             event.sprintf(@document_type)
           elsif @index_type # deprecated
             event.sprintf(@index_type)
           else
             event["type"] || "logs"
           end

    params = {
      :_id => @document_id ? event.sprintf(@document_id) : nil,
      :_index => event.sprintf(@index),
      :_type => type,
      :_routing => @routing ? event.sprintf(@routing) : nil
    }

    params[:_upsert] = LogStash::Json.load(event.sprintf(@upsert)) if @action == 'update' && @upsert != ""

    buffer_receive([event.sprintf(@action), params, event])
  end # def receive

  public
  # The submit method can be called from both the
  # Stud::Buffer flush thread and from our own retry thread.
  def submit(actions)
    @submit_mutex.synchronize do
      es_actions = actions.map { |a, doc, event| [a, doc, event.to_hash] }

      bulk_response = @client.bulk(es_actions)

      if bulk_response["errors"] && bulk_response["items"]
        actions_to_retry = []

        bulk_response['items'].each_with_index do |item, idx|
          action = es_actions[idx]
          action_type, props = item.first # These are all hashes with one value, so we destructure them here

          status = props['status']
          error = props['error']

          if RETRYABLE_CODES.include?(status)
            @logger.warn "retrying failed action with response code: #{status}"
            actions_to_retry << action
          elsif not SUCCESS_CODES.include?(status)
            @logger.warn "failed action", status: status, error: error, action: action
          end
        end

        retry_push(actions_to_retry) unless actions_to_retry.empty?
      end
    end
  end # def submit
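  # For reference, each entry in bulk_response['items'] consumed above is a
  # one-key hash keyed by the action name, roughly of the form (values are
  # illustrative):
  #
  #   { "index" => { "_index" => "logstash-2015.06.01", "_type" => "logs",
  #                  "_id" => "...", "status" => 429,
  #                  "error" => "EsRejectedExecutionException[...]" } }
  #
  # Only entries whose status is in RETRYABLE_CODES are pushed back onto the
  # retry queue; other non-success statuses are logged and dropped.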
  # When there are exceptions raised upon submission, we raise an exception so that
  # Stud::Buffer will retry the flush.
  public
  def flush(actions, teardown = false)
    begin
      submit(actions)
    rescue Manticore::SocketException => e
      # If we can't even connect to the server let's just print out the URL (:hosts is actually a URL)
      # and let the user sort it out from there
      @logger.error(
        "Attempted to send a bulk request to Elasticsearch configured at '#{@client.client_options[:hosts]}'," +
          " but Elasticsearch appears to be unreachable or down!",
        :client_config => @client.client_options,
        :error_message => e.message
      )
      @logger.debug("Failed actions for last bad bulk request!", :actions => actions)
    rescue => e
      # For all other errors print out full connection issues
      @logger.error(
        "Attempted to send a bulk request to Elasticsearch configured at '#{@client.client_options[:hosts]}'," +
          " but an error occurred and it failed! Are you sure you can reach elasticsearch from this machine using " +
          "the configuration provided?",
        :client_config => @client.client_options,
        :error_message => e.message,
        :error_class => e.class.name,
        :backtrace => e.backtrace
      )
      @logger.debug("Failed actions for last bad bulk request!", :actions => actions)
      raise e
    end
  end # def flush

  public
  def teardown
    @retry_teardown_requested.make_true
    # First, make sure retry_timer_thread is stopped
    # to ensure we do not signal a retry based on
    # the retry interval.
    Thread.kill(@retry_timer_thread)
    @retry_timer_thread.join
    # Signal flushing in the case that #retry_flush is in
    # the process of waiting for a signal.
    @retry_flush_mutex.synchronize { @retry_queue_needs_flushing.signal }
    # Now, #retry_flush is ensured to not be in a state of
    # waiting and can be safely joined into the main thread
    # for further final execution of any in-process remaining call.
    @retry_thread.join

    # Execute any final actions along with a subsequent retry for any
    # final actions that did not succeed.
    buffer_flush(:final => true)
    retry_flush
  end

  private
  def setup_proxy
    return {} unless @proxy

    # Symbolize keys
    proxy = if @proxy.is_a?(Hash)
              Hash[@proxy.map { |k, v| [k.to_sym, v] }]
            elsif @proxy.is_a?(String)
              @proxy
            else
              raise LogStash::ConfigurationError, "Expected 'proxy' to be a string or hash, not '#{@proxy}'!"
            end

    return {:proxy => proxy}
  end

  private
  def setup_basic_auth
    return {} unless @user && @password

    {
      :user => ::URI.escape(@user, "@:"),
      :password => ::URI.escape(@password.value, "@:")
    }
  end
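  # For reference, the two helpers above contribute to the client options
  # roughly as follows (values illustrative):
  #
  #   setup_proxy      # => {} or {:proxy => "http://localhost:123"}
  #                    #    or {:proxy => {:host => "proxy.org", :port => 80, :scheme => "http"}}
  #   setup_basic_auth # => {} or {:user => "user%40example.org", :password => "..."}
  #                    #    ('@' and ':' are URI-escaped)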
  private
  # In charge of submitting any actions in @retry_queue that need to be
  # retried.
  #
  # This method is not called concurrently. It is only called by @retry_thread
  # and once that thread is ended during the teardown process, a final call
  # to this method is done upon teardown in the main thread.
  def retry_flush()
    unless @retry_queue.empty?
      buffer = @retry_queue.size.times.map do
        next_action, next_doc, next_event = @retry_queue.pop
        next_event['@metadata']['retry_count'] += 1

        if next_event['@metadata']['retry_count'] > @max_retries
          @logger.error "too many attempts at sending event. dropping: #{next_event}"
          nil
        else
          [next_action, next_doc, next_event]
        end
      end.compact

      submit(buffer) unless buffer.empty?
    end

    @retry_flush_mutex.synchronize {
      @retry_queue_not_full.signal if @retry_queue.size < @retry_max_items
    }
  end

  private
  def retry_push(actions)
    Array(actions).each { |action| @retry_queue << action }
    @retry_flush_mutex.synchronize {
      @retry_queue_needs_flushing.signal if @retry_queue.size >= @retry_max_items
    }
  end

  @@plugins = Gem::Specification.find_all { |spec| spec.name =~ /logstash-output-amazon_es-/ }

  @@plugins.each do |plugin|
    name = plugin.name.split('-')[-1]
    require "logstash/outputs/amazon_es/#{name}"
  end

end # class LogStash::Outputs::AmazonES