module Fluent class S3Output < Fluent::TimeSlicedOutput Fluent::Plugin.register_output('s3', self) def initialize super require 'aws-sdk' require 'zlib' require 'time' require 'tempfile' end config_param :path, :string, :default => "" config_param :time_format, :string, :default => nil include SetTagKeyMixin config_set_default :include_tag_key, false include SetTimeKeyMixin config_set_default :include_time_key, false config_param :aws_key_id, :string, :default => nil config_param :aws_sec_key, :string, :default => nil config_param :s3_bucket, :string config_param :s3_endpoint, :string, :default => nil def configure(conf) super if format_json = conf['format_json'] @format_json = true else @format_json = false end @timef = TimeFormatter.new(@time_format, @localtime) end def start super options = {} if @aws_key_id && @aws_sec_key options[:access_key_id] = @aws_key_id options[:secret_access_key] = @aws_sec_key end options[:s3_endpoint] = @s3_endpoint if @s3_endpoint @s3 = AWS::S3.new(options) @bucket = @s3.buckets[@s3_bucket] end def format(tag, time, record) if @include_time_key || !@format_json time_str = @timef.format(time) end # copied from each mixin because current TimeSlicedOutput can't support mixins. if @include_tag_key record[@tag_key] = tag end if @include_time_key record[@time_key] = time_str end if @format_json Yajl.dump(record) + "\n" else "#{time_str}\t#{tag}\t#{Yajl.dump(record)}\n" end end def write(chunk) i = 0 begin s3path = "#{@path}#{chunk.key}_#{i}.gz" i += 1 end while @bucket.objects[s3path].exists? tmp = Tempfile.new("s3-") w = Zlib::GzipWriter.new(tmp) begin chunk.write_to(w) w.close @bucket.objects[s3path].write(Pathname.new(tmp.path), :content_type => 'application/x-gzip') ensure w.close rescue nil end end end end