require_relative '../helper' require 'fluent/test/driver/input' require 'fluent/plugin/in_tail' require 'fluent/plugin/buffer' require 'fluent/system_config' require 'net/http' require 'flexmock/test_unit' require 'timecop' class TailInputTest < Test::Unit::TestCase include FlexMock::TestCase def setup Fluent::Test.setup cleanup_directory(TMP_DIR) end def teardown super Fluent::Engine.stop end def cleanup_directory(path) FileUtils.rm_rf(path, secure: true) if File.exist?(path) # ensure files are closed for Windows, on which deleted files # are still visible from filesystem GC.start(full_mark: true, immediate_mark: true, immediate_sweep: true) FileUtils.remove_entry_secure(path, true) end FileUtils.mkdir_p(path) end TMP_DIR = File.dirname(__FILE__) + "/../tmp/tail#{ENV['TEST_ENV_NUMBER']}" CONFIG = config_element("ROOT", "", { "path" => "#{TMP_DIR}/tail.txt", "tag" => "t1", "rotate_wait" => "2s" }) COMMON_CONFIG = CONFIG + config_element("", "", { "pos_file" => "#{TMP_DIR}/tail.pos" }) CONFIG_READ_FROM_HEAD = config_element("", "", { "read_from_head" => true }) CONFIG_ENABLE_WATCH_TIMER = config_element("", "", { "enable_watch_timer" => false }) CONFIG_DISABLE_STAT_WATCHER = config_element("", "", { "enable_stat_watcher" => false }) CONFIG_OPEN_ON_EVERY_UPDATE = config_element("", "", { "open_on_every_update" => true }) SINGLE_LINE_CONFIG = config_element("", "", { "format" => "/(?.*)/" }) PARSE_SINGLE_LINE_CONFIG = config_element("", "", {}, [config_element("parse", "", { "@type" => "/(?.*)/" })]) MULTILINE_CONFIG = config_element( "", "", { "format" => "multiline", "format1" => "/^s (?[^\\n]+)(\\nf (?[^\\n]+))?(\\nf (?.*))?/", "format_firstline" => "/^[s]/" }) PARSE_MULTILINE_CONFIG = config_element( "", "", {}, [config_element("parse", "", { "@type" => "multiline", "format1" => "/^s (?[^\\n]+)(\\nf (?[^\\n]+))?(\\nf (?.*))?/", "format_firstline" => "/^[s]/" }) ]) def create_driver(conf = SINGLE_LINE_CONFIG, use_common_conf = true) config = use_common_conf ? COMMON_CONFIG + conf : conf Fluent::Test::Driver::Input.new(Fluent::Plugin::TailInput).configure(config) end sub_test_case "configure" do test "plain single line" do d = create_driver assert_equal ["#{TMP_DIR}/tail.txt"], d.instance.paths assert_equal "t1", d.instance.tag assert_equal 2, d.instance.rotate_wait assert_equal "#{TMP_DIR}/tail.pos", d.instance.pos_file assert_equal 1000, d.instance.read_lines_limit assert_equal false, d.instance.ignore_repeated_permission_error end data("empty" => config_element, "w/o @type" => config_element("", "", {}, [config_element("parse", "", {})])) test "w/o parse section" do |conf| assert_raise(Fluent::ConfigError) do create_driver(conf) end end test "both enable_watch_timer and enable_stat_watcher are false" do assert_raise(Fluent::ConfigError) do create_driver(CONFIG_ENABLE_WATCH_TIMER + CONFIG_DISABLE_STAT_WATCHER + PARSE_SINGLE_LINE_CONFIG) end end sub_test_case "encoding" do test "valid" do conf = SINGLE_LINE_CONFIG + config_element("", "", { "encoding" => "utf-8" }) d = create_driver(conf) assert_equal Encoding::UTF_8, d.instance.encoding end test "invalid" do conf = SINGLE_LINE_CONFIG + config_element("", "", { "encoding" => "no-such-encoding" }) assert_raise(Fluent::ConfigError) do create_driver(conf) end end end sub_test_case "from_encoding" do test "only specified from_encoding raise ConfigError" do conf = SINGLE_LINE_CONFIG + config_element("", "", { "from_encoding" => "utf-8" }) assert_raise(Fluent::ConfigError) do create_driver(conf) end end test "valid" do conf = SINGLE_LINE_CONFIG + config_element("", "", { "from_encoding" => "utf-8", "encoding" => "utf-8" }) d = create_driver(conf) assert_equal(Encoding::UTF_8, d.instance.from_encoding) end test "invalid" do conf = SINGLE_LINE_CONFIG + config_element("", "", { "from_encoding" => "no-such-encoding", "encoding" => "utf-8" }) assert_raise(Fluent::ConfigError) do create_driver(conf) end end end end sub_test_case "singleline" do data(flat: SINGLE_LINE_CONFIG, parse: PARSE_SINGLE_LINE_CONFIG) def test_emit(data) config = data File.open("#{TMP_DIR}/tail.txt", "wb") {|f| f.puts "test1" f.puts "test2" } d = create_driver(config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts "test3\ntest4" } end events = d.events assert_equal(true, events.length > 0) assert_equal({"message" => "test3"}, events[0][2]) assert_equal({"message" => "test4"}, events[1][2]) assert(events[0][1].is_a?(Fluent::EventTime)) assert(events[1][1].is_a?(Fluent::EventTime)) assert_equal(1, d.emit_count) end def test_emit_with_emit_unmatched_lines_true config = config_element("", "", { "format" => "/^(?test.*)/", "emit_unmatched_lines" => true }) File.open("#{TMP_DIR}/tail.txt", "wb") { |f| } d = create_driver(config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts "test line 1" f.puts "test line 2" f.puts "bad line 1" f.puts "test line 3" } end events = d.events assert_equal(4, events.length) assert_equal({"message" => "test line 1"}, events[0][2]) assert_equal({"message" => "test line 2"}, events[1][2]) assert_equal({"unmatched_line" => "bad line 1"}, events[2][2]) assert_equal({"message" => "test line 3"}, events[3][2]) end data('flat 1' => [:flat, 1, 2], 'flat 10' => [:flat, 10, 1], 'parse 1' => [:parse, 1, 2], 'parse 10' => [:parse, 10, 1]) def test_emit_with_read_lines_limit(data) config_style, limit, num_events = data case config_style when :flat config = CONFIG_READ_FROM_HEAD + SINGLE_LINE_CONFIG + config_element("", "", { "read_lines_limit" => limit }) when :parse config = CONFIG_READ_FROM_HEAD + config_element("", "", { "read_lines_limit" => limit }) + PARSE_SINGLE_LINE_CONFIG end d = create_driver(config) msg = 'test' * 2000 # in_tail reads 8192 bytes at once. d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts msg f.puts msg } end events = d.events assert_equal(true, events.length > 0) assert_equal({"message" => msg}, events[0][2]) assert_equal({"message" => msg}, events[1][2]) assert_equal(num_events, d.emit_count) end data(flat: CONFIG_READ_FROM_HEAD + SINGLE_LINE_CONFIG, parse: CONFIG_READ_FROM_HEAD + PARSE_SINGLE_LINE_CONFIG) def test_emit_with_read_from_head(data) config = data File.open("#{TMP_DIR}/tail.txt", "wb") {|f| f.puts "test1" f.puts "test2" } d = create_driver(config) d.run(expect_emits: 2) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts "test3" f.puts "test4" } end events = d.events assert(events.length > 0) assert_equal({"message" => "test1"}, events[0][2]) assert_equal({"message" => "test2"}, events[1][2]) assert_equal({"message" => "test3"}, events[2][2]) assert_equal({"message" => "test4"}, events[3][2]) end data(flat: CONFIG_ENABLE_WATCH_TIMER + SINGLE_LINE_CONFIG, parse: CONFIG_ENABLE_WATCH_TIMER + PARSE_SINGLE_LINE_CONFIG) def test_emit_with_enable_watch_timer(data) config = data File.open("#{TMP_DIR}/tail.txt", "wb") {|f| f.puts "test1" f.puts "test2" } d = create_driver(config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts "test3" f.puts "test4" } # according to cool.io's stat_watcher.c, systems without inotify will use # an "automatic" value, typically around 5 seconds end events = d.events assert(events.length > 0) assert_equal({"message" => "test3"}, events[0][2]) assert_equal({"message" => "test4"}, events[1][2]) end data(flat: CONFIG_DISABLE_STAT_WATCHER + SINGLE_LINE_CONFIG, parse: CONFIG_DISABLE_STAT_WATCHER + PARSE_SINGLE_LINE_CONFIG) def test_emit_with_disable_stat_watcher(data) config = data File.open("#{TMP_DIR}/tail.txt", "wb") {|f| f.puts "test1" f.puts "test2" } d = create_driver(config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts "test3" f.puts "test4" } end events = d.events assert(events.length > 0) assert_equal({"message" => "test3"}, events[0][2]) assert_equal({"message" => "test4"}, events[1][2]) end end class TestWithSystem < self include Fluent::SystemConfig::Mixin OVERRIDE_FILE_PERMISSION = 0620 CONFIG_SYSTEM = %[ file_permission #{OVERRIDE_FILE_PERMISSION} ] def setup omit "NTFS doesn't support UNIX like permissions" if Fluent.windows? # Store default permission @default_permission = system_config.instance_variable_get(:@file_permission) end def teardown # Restore default permission system_config.instance_variable_set(:@file_permission, @default_permission) end def parse_system(text) basepath = File.expand_path(File.dirname(__FILE__) + '/../../') Fluent::Config.parse(text, '(test)', basepath, true).elements.find { |e| e.name == 'system' } end def test_emit_with_system system_conf = parse_system(CONFIG_SYSTEM) sc = Fluent::SystemConfig.new(system_conf) Fluent::Engine.init(sc) File.open("#{TMP_DIR}/tail.txt", "wb") {|f| f.puts "test1" f.puts "test2" } d = create_driver d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts "test3" f.puts "test4" } end events = d.events assert_equal(true, events.length > 0) assert_equal({"message" => "test3"}, events[0][2]) assert_equal({"message" => "test4"}, events[1][2]) assert(events[0][1].is_a?(Fluent::EventTime)) assert(events[1][1].is_a?(Fluent::EventTime)) assert_equal(1, d.emit_count) pos = d.instance.instance_variable_get(:@pf_file) mode = "%o" % File.stat(pos).mode assert_equal OVERRIDE_FILE_PERMISSION, mode[-3, 3].to_i end end sub_test_case "rotate file" do data(flat: SINGLE_LINE_CONFIG, parse: PARSE_SINGLE_LINE_CONFIG) def test_rotate_file(data) config = data events = sub_test_rotate_file(config, expect_emits: 2) assert_equal(4, events.length) assert_equal({"message" => "test3"}, events[0][2]) assert_equal({"message" => "test4"}, events[1][2]) assert_equal({"message" => "test5"}, events[2][2]) assert_equal({"message" => "test6"}, events[3][2]) end data(flat: CONFIG_READ_FROM_HEAD + SINGLE_LINE_CONFIG, parse: CONFIG_READ_FROM_HEAD + PARSE_SINGLE_LINE_CONFIG) def test_rotate_file_with_read_from_head(data) config = data events = sub_test_rotate_file(config, expect_records: 6) assert_equal(6, events.length) assert_equal({"message" => "test1"}, events[0][2]) assert_equal({"message" => "test2"}, events[1][2]) assert_equal({"message" => "test3"}, events[2][2]) assert_equal({"message" => "test4"}, events[3][2]) assert_equal({"message" => "test5"}, events[4][2]) assert_equal({"message" => "test6"}, events[5][2]) end data(flat: CONFIG_OPEN_ON_EVERY_UPDATE + CONFIG_READ_FROM_HEAD + SINGLE_LINE_CONFIG, parse: CONFIG_OPEN_ON_EVERY_UPDATE + CONFIG_READ_FROM_HEAD + PARSE_SINGLE_LINE_CONFIG) def test_rotate_file_with_open_on_every_update(data) config = data events = sub_test_rotate_file(config, expect_records: 6) assert_equal(6, events.length) assert_equal({"message" => "test1"}, events[0][2]) assert_equal({"message" => "test2"}, events[1][2]) assert_equal({"message" => "test3"}, events[2][2]) assert_equal({"message" => "test4"}, events[3][2]) assert_equal({"message" => "test5"}, events[4][2]) assert_equal({"message" => "test6"}, events[5][2]) end data(flat: SINGLE_LINE_CONFIG, parse: PARSE_SINGLE_LINE_CONFIG) def test_rotate_file_with_write_old(data) config = data events = sub_test_rotate_file(config, expect_emits: 3) { |rotated_file| File.open("#{TMP_DIR}/tail.txt", "wb") { |f| } rotated_file.puts "test7" rotated_file.puts "test8" rotated_file.flush sleep 1 File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "test5" f.puts "test6" } } # This test sometimes fails and it shows a potential bug of in_tail # https://github.com/fluent/fluentd/issues/1434 assert_equal(6, events.length) assert_equal({"message" => "test3"}, events[0][2]) assert_equal({"message" => "test4"}, events[1][2]) assert_equal({"message" => "test7"}, events[2][2]) assert_equal({"message" => "test8"}, events[3][2]) assert_equal({"message" => "test5"}, events[4][2]) assert_equal({"message" => "test6"}, events[5][2]) end data(flat: SINGLE_LINE_CONFIG, parse: PARSE_SINGLE_LINE_CONFIG) def test_rotate_file_with_write_old_and_no_new_file(data) config = data events = sub_test_rotate_file(config, expect_emits: 2) { |rotated_file| rotated_file.puts "test7" rotated_file.puts "test8" rotated_file.flush } assert_equal(4, events.length) assert_equal({"message" => "test3"}, events[0][2]) assert_equal({"message" => "test4"}, events[1][2]) assert_equal({"message" => "test7"}, events[2][2]) assert_equal({"message" => "test8"}, events[3][2]) end def sub_test_rotate_file(config = nil, expect_emits: nil, expect_records: nil, timeout: nil) file = Fluent::FileWrapper.open("#{TMP_DIR}/tail.txt", "wb") file.puts "test1" file.puts "test2" file.flush d = create_driver(config) d.run(expect_emits: expect_emits, expect_records: expect_records, timeout: timeout) do size = d.emit_count file.puts "test3" file.puts "test4" file.flush sleep(0.1) until d.emit_count >= size + 1 size = d.emit_count if Fluent.windows? file.close FileUtils.mv("#{TMP_DIR}/tail.txt", "#{TMP_DIR}/tail2.txt", force: true) file = File.open("#{TMP_DIR}/tail.txt", "ab") else FileUtils.mv("#{TMP_DIR}/tail.txt", "#{TMP_DIR}/tail2.txt") end if block_given? yield file else File.open("#{TMP_DIR}/tail.txt", "wb") { |f| } sleep 1 File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "test5" f.puts "test6" } end end d.events ensure file.close if file && !file.closed? end end def test_truncate_file omit "Permission denied error happen on Windows. Need fix" if Fluent.windows? config = SINGLE_LINE_CONFIG File.open("#{TMP_DIR}/tail.txt", "wb") {|f| f.puts "test1" f.puts "test2" } d = create_driver(config) d.run(expect_emits: 2) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts "test3\ntest4" f.flush } sleep 1 File.truncate("#{TMP_DIR}/tail.txt", 6) end events = d.events assert_equal(3, events.length) assert_equal({"message" => "test3"}, events[0][2]) assert_equal({"message" => "test4"}, events[1][2]) assert_equal({"message" => "test1"}, events[2][2]) assert(events[0][1].is_a?(Fluent::EventTime)) assert(events[1][1].is_a?(Fluent::EventTime)) assert(events[2][1].is_a?(Fluent::EventTime)) assert_equal(2, d.emit_count) end def test_move_truncate_move_back omit "Permission denied error happen on Windows. Need fix" if Fluent.windows? config = SINGLE_LINE_CONFIG File.open("#{TMP_DIR}/tail.txt", "wb") {|f| f.puts "test1" f.puts "test2" } d = create_driver(config) d.run(expect_emits: 1) do if Fluent.windows? FileUtils.mv("#{TMP_DIR}/tail.txt", "#{TMP_DIR}/tail2.txt", force: true) else FileUtils.mv("#{TMP_DIR}/tail.txt", "#{TMP_DIR}/tail2.txt") end sleep(1) File.truncate("#{TMP_DIR}/tail2.txt", 6) sleep(1) if Fluent.windows? FileUtils.mv("#{TMP_DIR}/tail2.txt", "#{TMP_DIR}/tail.txt", force: true) else FileUtils.mv("#{TMP_DIR}/tail2.txt", "#{TMP_DIR}/tail.txt") end end events = d.events assert_equal(1, events.length) assert_equal({"message" => "test1"}, events[0][2]) assert(events[0][1].is_a?(Fluent::EventTime)) assert_equal(1, d.emit_count) end def test_lf File.open("#{TMP_DIR}/tail.txt", "wb") {|f| } d = create_driver d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.print "test3" } sleep 1 File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts "test4" } end events = d.events assert_equal(true, events.length > 0) assert_equal({"message" => "test3test4"}, events[0][2]) end def test_whitespace File.open("#{TMP_DIR}/tail.txt", "wb") {|f| } d = create_driver d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts " " # 4 spaces f.puts " 4 spaces" f.puts "4 spaces " f.puts " " # tab f.puts " tab" f.puts "tab " } end events = d.events assert_equal(true, events.length > 0) assert_equal({"message" => " "}, events[0][2]) assert_equal({"message" => " 4 spaces"}, events[1][2]) assert_equal({"message" => "4 spaces "}, events[2][2]) assert_equal({"message" => " "}, events[3][2]) assert_equal({"message" => " tab"}, events[4][2]) assert_equal({"message" => "tab "}, events[5][2]) end data( 'flat default encoding' => [SINGLE_LINE_CONFIG, Encoding::ASCII_8BIT], 'flat explicit encoding config' => [SINGLE_LINE_CONFIG + config_element("", "", { "encoding" => "utf-8" }), Encoding::UTF_8], 'parse default encoding' => [PARSE_SINGLE_LINE_CONFIG, Encoding::ASCII_8BIT], 'parse explicit encoding config' => [PARSE_SINGLE_LINE_CONFIG + config_element("", "", { "encoding" => "utf-8" }), Encoding::UTF_8]) def test_encoding(data) encoding_config, encoding = data d = create_driver(CONFIG_READ_FROM_HEAD + encoding_config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "wb") {|f| f.puts "test" } end events = d.events assert_equal(encoding, events[0][2]['message'].encoding) end def test_from_encoding conf = config_element( "", "", { "format" => "/(?.*)/", "read_from_head" => "true", "from_encoding" => "cp932", "encoding" => "utf-8" }) d = create_driver(conf) cp932_message = "\x82\xCD\x82\xEB\x81\x5B\x82\xED\x81\x5B\x82\xE9\x82\xC7".force_encoding(Encoding::CP932) utf8_message = cp932_message.encode(Encoding::UTF_8) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "w:cp932") {|f| f.puts cp932_message } end events = d.events assert_equal(utf8_message, events[0][2]['message']) assert_equal(Encoding::UTF_8, events[0][2]['message'].encoding) end def test_from_encoding_utf16 conf = config_element( "", "", { "format" => "/(?.*)/", "read_from_head" => "true", "from_encoding" => "utf-16le", "encoding" => "utf-8" }) d = create_driver(conf) utf16_message = "\u306F\u308D\u30FC\u308F\u30FC\u308B\u3069\n".encode(Encoding::UTF_16LE) utf8_message = utf16_message.encode(Encoding::UTF_8).strip d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "w:utf-16le") { |f| f.write utf16_message } end events = d.events assert_equal(utf8_message, events[0][2]['message']) assert_equal(Encoding::UTF_8, events[0][2]['message'].encoding) end def test_encoding_with_bad_character conf = config_element( "", "", { "format" => "/(?.*)/", "read_from_head" => "true", "from_encoding" => "ASCII-8BIT", "encoding" => "utf-8" }) d = create_driver(conf) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "w") { |f| f.write "te\x86st\n" } end events = d.events assert_equal("te\uFFFDst", events[0][2]['message']) assert_equal(Encoding::UTF_8, events[0][2]['message'].encoding) end sub_test_case "multiline" do data(flat: MULTILINE_CONFIG, parse: PARSE_MULTILINE_CONFIG) def test_multiline(data) config = data File.open("#{TMP_DIR}/tail.txt", "wb") { |f| } d = create_driver(config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "f test1" f.puts "s test2" f.puts "f test3" f.puts "f test4" f.puts "s test5" f.puts "s test6" f.puts "f test7" f.puts "s test8" } end events = d.events assert_equal(4, events.length) assert_equal({"message1" => "test2", "message2" => "test3", "message3" => "test4"}, events[0][2]) assert_equal({"message1" => "test5"}, events[1][2]) assert_equal({"message1" => "test6", "message2" => "test7"}, events[2][2]) assert_equal({"message1" => "test8"}, events[3][2]) end data(flat: MULTILINE_CONFIG, parse: PARSE_MULTILINE_CONFIG) def test_multiline_with_emit_unmatched_lines_true(data) config = data + config_element("", "", { "emit_unmatched_lines" => true }) File.open("#{TMP_DIR}/tail.txt", "wb") { |f| } d = create_driver(config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "f test1" f.puts "s test2" f.puts "f test3" f.puts "f test4" f.puts "s test5" f.puts "s test6" f.puts "f test7" f.puts "s test8" } end events = d.events assert_equal(5, events.length) assert_equal({"unmatched_line" => "f test1"}, events[0][2]) assert_equal({"message1" => "test2", "message2" => "test3", "message3" => "test4"}, events[1][2]) assert_equal({"message1" => "test5"}, events[2][2]) assert_equal({"message1" => "test6", "message2" => "test7"}, events[3][2]) assert_equal({"message1" => "test8"}, events[4][2]) end data(flat: MULTILINE_CONFIG, parse: PARSE_MULTILINE_CONFIG) def test_multiline_with_flush_interval(data) File.open("#{TMP_DIR}/tail.txt", "wb") { |f| } config = data + config_element("", "", { "multiline_flush_interval" => "2s" }) d = create_driver(config) assert_equal 2, d.instance.multiline_flush_interval d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "f test1" f.puts "s test2" f.puts "f test3" f.puts "f test4" f.puts "s test5" f.puts "s test6" f.puts "f test7" f.puts "s test8" } end events = d.events assert_equal(4, events.length) assert_equal({"message1" => "test2", "message2" => "test3", "message3" => "test4"}, events[0][2]) assert_equal({"message1" => "test5"}, events[1][2]) assert_equal({"message1" => "test6", "message2" => "test7"}, events[2][2]) assert_equal({"message1" => "test8"}, events[3][2]) end data( 'flat default encoding' => [MULTILINE_CONFIG, Encoding::ASCII_8BIT], 'flat explicit encoding config' => [MULTILINE_CONFIG + config_element("", "", { "encoding" => "utf-8" }), Encoding::UTF_8], 'parse default encoding' => [PARSE_MULTILINE_CONFIG, Encoding::ASCII_8BIT], 'parse explicit encoding config' => [PARSE_MULTILINE_CONFIG + config_element("", "", { "encoding" => "utf-8" }), Encoding::UTF_8]) def test_multiline_encoding_of_flushed_record(data) encoding_config, encoding = data config = config_element("", "", { "multiline_flush_interval" => "2s", "read_from_head" => "true", }) d = create_driver(config + encoding_config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "wb") { |f| f.puts "s test" } end events = d.events assert_equal(1, events.length) assert_equal(encoding, events[0][2]['message1'].encoding) end def test_multiline_from_encoding_of_flushed_record conf = MULTILINE_CONFIG + config_element( "", "", { "multiline_flush_interval" => "1s", "read_from_head" => "true", "from_encoding" => "cp932", "encoding" => "utf-8" }) d = create_driver(conf) cp932_message = "s \x82\xCD\x82\xEB\x81\x5B\x82\xED\x81\x5B\x82\xE9\x82\xC7".force_encoding(Encoding::CP932) utf8_message = "\x82\xCD\x82\xEB\x81\x5B\x82\xED\x81\x5B\x82\xE9\x82\xC7".encode(Encoding::UTF_8, Encoding::CP932) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "w:cp932") { |f| f.puts cp932_message } end events = d.events assert_equal(1, events.length) assert_equal(utf8_message, events[0][2]['message1']) assert_equal(Encoding::UTF_8, events[0][2]['message1'].encoding) end data(flat: config_element( "", "", { "format" => "multiline", "format1" => "/^s (?[^\\n]+)\\n?/", "format2" => "/(f (?[^\\n]+)\\n?)?/", "format3" => "/(f (?.*))?/", "format_firstline" => "/^[s]/" }), parse: config_element( "", "", {}, [config_element("parse", "", { "@type" => "multiline", "format1" => "/^s (?[^\\n]+)\\n?/", "format2" => "/(f (?[^\\n]+)\\n?)?/", "format3" => "/(f (?.*))?/", "format_firstline" => "/^[s]/" }) ]) ) def test_multiline_with_multiple_formats(data) config = data File.open("#{TMP_DIR}/tail.txt", "wb") { |f| } d = create_driver(config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "f test1" f.puts "s test2" f.puts "f test3" f.puts "f test4" f.puts "s test5" f.puts "s test6" f.puts "f test7" f.puts "s test8" } end events = d.events assert(events.length > 0) assert_equal({"message1" => "test2", "message2" => "test3", "message3" => "test4"}, events[0][2]) assert_equal({"message1" => "test5"}, events[1][2]) assert_equal({"message1" => "test6", "message2" => "test7"}, events[2][2]) assert_equal({"message1" => "test8"}, events[3][2]) end data(flat: config_element( "", "", { "format" => "multiline", "format1" => "/^[s|f] (?.*)/", "format_firstline" => "/^[s]/" }), parse: config_element( "", "", {}, [config_element("parse", "", { "@type" => "multiline", "format1" => "/^[s|f] (?.*)/", "format_firstline" => "/^[s]/" }) ]) ) def test_multilinelog_with_multiple_paths(data) files = ["#{TMP_DIR}/tail1.txt", "#{TMP_DIR}/tail2.txt"] files.each { |file| File.open(file, "wb") { |f| } } config = data + config_element("", "", { "path" => "#{files[0]},#{files[1]}", "tag" => "t1", }) d = create_driver(config, false) d.run(expect_emits: 2) do files.each do |file| File.open(file, 'ab') { |f| f.puts "f #{file} line should be ignored" f.puts "s test1" f.puts "f test2" f.puts "f test3" f.puts "s test4" } end end events = d.events assert_equal({"message" => "test1\nf test2\nf test3"}, events[0][2]) assert_equal({"message" => "test1\nf test2\nf test3"}, events[1][2]) # "test4" events are here because these events are flushed at shutdown phase assert_equal({"message" => "test4"}, events[2][2]) assert_equal({"message" => "test4"}, events[3][2]) end data(flat: config_element("", "", { "format" => "multiline", "format1" => "/(?foo \\d)\\n/", "format2" => "/(?bar \\d)\\n/", "format3" => "/(?baz \\d)/" }), parse: config_element( "", "", {}, [config_element("parse", "", { "@type" => "multiline", "format1" => "/(?foo \\d)\\n/", "format2" => "/(?bar \\d)\\n/", "format3" => "/(?baz \\d)/" }) ]) ) def test_multiline_without_firstline(data) File.open("#{TMP_DIR}/tail.txt", "wb") { |f| } config = data d = create_driver(config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "foo 1" f.puts "bar 1" f.puts "baz 1" f.puts "foo 2" f.puts "bar 2" f.puts "baz 2" } end events = d.events assert_equal(2, events.length) assert_equal({"var1" => "foo 1", "var2" => "bar 1", "var3" => "baz 1"}, events[0][2]) assert_equal({"var1" => "foo 2", "var2" => "bar 2", "var3" => "baz 2"}, events[1][2]) end end sub_test_case "path" do # * path test # TODO: Clean up tests EX_ROTATE_WAIT = 0 EX_CONFIG = config_element("", "", { "tag" => "tail", "path" => "test/plugin/*/%Y/%m/%Y%m%d-%H%M%S.log,test/plugin/data/log/**/*.log", "format" => "none", "pos_file" => "#{TMP_DIR}/tail.pos", "read_from_head" => true, "refresh_interval" => 30, "rotate_wait" => "#{EX_ROTATE_WAIT}s", }) EX_PATHS = [ 'test/plugin/data/2010/01/20100102-030405.log', 'test/plugin/data/log/foo/bar.log', 'test/plugin/data/log/test.log' ] def test_expand_paths plugin = create_driver(EX_CONFIG, false).instance flexstub(Time) do |timeclass| timeclass.should_receive(:now).with_no_args.and_return(Time.new(2010, 1, 2, 3, 4, 5)) assert_equal EX_PATHS, plugin.expand_paths.sort end # Test exclusion exclude_config = EX_CONFIG + config_element("", "", { "exclude_path" => %Q(["#{EX_PATHS.last}"]) }) plugin = create_driver(exclude_config, false).instance assert_equal EX_PATHS - [EX_PATHS.last], plugin.expand_paths.sort end def test_expand_paths_with_timezone ['Asia/Taipei', '+08'].each do |tz_type| taipei_config = EX_CONFIG + config_element("", "", {"path_timezone" => tz_type}) plugin = create_driver(taipei_config, false).instance # Test exclude exclude_config = taipei_config + config_element("", "", { "exclude_path" => %Q(["test/plugin/**/%Y%m%d-%H%M%S.log"]) }) exclude_plugin = create_driver(exclude_config, false).instance with_timezone('utc') do flexstub(Time) do |timeclass| # env : 2010-01-01 19:04:05 (UTC), tail path : 2010-01-02 03:04:05 (Asia/Taipei) timeclass.should_receive(:now).with_no_args.and_return(Time.new(2010, 1, 1, 19, 4, 5)) assert_equal EX_PATHS, plugin.expand_paths.sort assert_equal EX_PATHS - [EX_PATHS.first], exclude_plugin.expand_paths.sort end end end end def test_log_file_without_extension expected_files = [ 'test/plugin/data/log/bar', 'test/plugin/data/log/foo/bar.log', 'test/plugin/data/log/foo/bar2', 'test/plugin/data/log/test.log' ] config = config_element("", "", { "tag" => "tail", "path" => "test/plugin/data/log/**/*", "format" => "none", "pos_file" => "#{TMP_DIR}/tail.pos" }) plugin = create_driver(config, false).instance assert_equal expected_files, plugin.expand_paths.sort end # For https://github.com/fluent/fluentd/issues/1455 # This test is fragile because test content depends on internal implementation. # So if you modify in_tail internal, this test may break. def test_unwatched_files_should_be_removed config = config_element("", "", { "tag" => "tail", "path" => "#{TMP_DIR}/*.txt", "format" => "none", "pos_file" => "#{TMP_DIR}/tail.pos", "read_from_head" => true, "refresh_interval" => 1, }) d = create_driver(config, false) d.run(expect_emits: 1, shutdown: false) do File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "test3\n" } end assert_equal 1, d.instance.instance_variable_get(:@tails).keys.size cleanup_directory(TMP_DIR) waiting(20) { sleep 0.1 until Dir.glob("#{TMP_DIR}/*.txt").size == 0 } # Ensure file is deleted on Windows waiting(5) { sleep 0.1 until d.instance.instance_variable_get(:@tails).keys.size == 0 } # Previous implementation has an infinite watcher creation bug. # Following code checks such unexpected bug by counting actual object allocation. base_num = count_timer_object 2.times { sleep 1 num = count_timer_object assert_equal base_num, num } d.instance_shutdown end def count_timer_object num = 0 ObjectSpace.each_object(Fluent::PluginHelper::Timer::TimerWatcher) { |obj| num += 1 } num end end def test_pos_file_dir_creation config = config_element("", "", { "tag" => "tail", "path" => "#{TMP_DIR}/*.txt", "format" => "none", "pos_file" => "#{TMP_DIR}/pos/tail.pos", "read_from_head" => true, "refresh_interval" => 1 }) d = create_driver(config, false) d.run(expect_emits: 1, shutdown: false) do File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "test3\n" } end assert_path_exist("#{TMP_DIR}/pos/tail.pos") cleanup_directory(TMP_DIR) d.instance_shutdown end def test_z_refresh_watchers plugin = create_driver(EX_CONFIG, false).instance sio = StringIO.new plugin.instance_eval do @pf = Fluent::Plugin::TailInput::PositionFile.parse(sio) @loop = Coolio::Loop.new end Timecop.freeze(2010, 1, 2, 3, 4, 5) do flexstub(Fluent::Plugin::TailInput::TailWatcher) do |watcherclass| EX_PATHS.each do |path| watcherclass.should_receive(:new).with(path, EX_ROTATE_WAIT, Fluent::Plugin::TailInput::FilePositionEntry, any, true, true, true, 1000, any, any, any, any, any, any).once.and_return do flexmock('TailWatcher') { |watcher| watcher.should_receive(:attach).once watcher.should_receive(:unwatched=).zero_or_more_times watcher.should_receive(:line_buffer).zero_or_more_times } end end plugin.refresh_watchers end end plugin.instance_eval do @tails['test/plugin/data/2010/01/20100102-030405.log'].should_receive(:close).zero_or_more_times end Timecop.freeze(2010, 1, 2, 3, 4, 6) do flexstub(Fluent::Plugin::TailInput::TailWatcher) do |watcherclass| watcherclass.should_receive(:new).with('test/plugin/data/2010/01/20100102-030406.log', EX_ROTATE_WAIT, Fluent::Plugin::TailInput::FilePositionEntry, any, true, true, true, 1000, any, any, any, any, any, any).once.and_return do flexmock('TailWatcher') do |watcher| watcher.should_receive(:attach).once watcher.should_receive(:unwatched=).zero_or_more_times watcher.should_receive(:line_buffer).zero_or_more_times end end plugin.refresh_watchers end flexstub(Fluent::Plugin::TailInput::TailWatcher) do |watcherclass| watcherclass.should_receive(:new).never plugin.refresh_watchers end end end sub_test_case "receive_lines" do DummyWatcher = Struct.new("DummyWatcher", :tag) def test_tag d = create_driver(EX_CONFIG, false) d.run {} plugin = d.instance mock(plugin.router).emit_stream('tail', anything).once plugin.receive_lines(['foo', 'bar'], DummyWatcher.new('foo.bar.log')) end def test_tag_with_only_star config = config_element("", "", { "tag" => "*", "path" => "test/plugin/*/%Y/%m/%Y%m%d-%H%M%S.log,test/plugin/data/log/**/*.log", "format" => "none", "read_from_head" => true }) d = create_driver(config, false) d.run {} plugin = d.instance mock(plugin.router).emit_stream('foo.bar.log', anything).once plugin.receive_lines(['foo', 'bar'], DummyWatcher.new('foo.bar.log')) end def test_tag_prefix config = config_element("", "", { "tag" => "pre.*", "path" => "test/plugin/*/%Y/%m/%Y%m%d-%H%M%S.log,test/plugin/data/log/**/*.log", "format" => "none", "read_from_head" => true }) d = create_driver(config, false) d.run {} plugin = d.instance mock(plugin.router).emit_stream('pre.foo.bar.log', anything).once plugin.receive_lines(['foo', 'bar'], DummyWatcher.new('foo.bar.log')) end def test_tag_suffix config = config_element("", "", { "tag" => "*.post", "path" => "test/plugin/*/%Y/%m/%Y%m%d-%H%M%S.log,test/plugin/data/log/**/*.log", "format" => "none", "read_from_head" => true }) d = create_driver(config, false) d.run {} plugin = d.instance mock(plugin.router).emit_stream('foo.bar.log.post', anything).once plugin.receive_lines(['foo', 'bar'], DummyWatcher.new('foo.bar.log')) end def test_tag_prefix_and_suffix config = config_element("", "", { "tag" => "pre.*.post", "path" => "test/plugin/*/%Y/%m/%Y%m%d-%H%M%S.log,test/plugin/data/log/**/*.log", "format" => "none", "read_from_head" => true }) d = create_driver(config, false) d.run {} plugin = d.instance mock(plugin.router).emit_stream('pre.foo.bar.log.post', anything).once plugin.receive_lines(['foo', 'bar'], DummyWatcher.new('foo.bar.log')) end def test_tag_prefix_and_suffix_ignore config = config_element("", "", { "tag" => "pre.*.post*ignore", "path" => "test/plugin/*/%Y/%m/%Y%m%d-%H%M%S.log,test/plugin/data/log/**/*.log", "format" => "none", "read_from_head" => true }) d = create_driver(config, false) d.run {} plugin = d.instance mock(plugin.router).emit_stream('pre.foo.bar.log.post', anything).once plugin.receive_lines(['foo', 'bar'], DummyWatcher.new('foo.bar.log')) end end # Ensure that no fatal exception is raised when a file is missing and that # files that do exist are still tailed as expected. def test_missing_file File.open("#{TMP_DIR}/tail.txt", "wb") {|f| f.puts "test1" f.puts "test2" } # Try two different configs - one with read_from_head and one without, # since their interactions with the filesystem differ. config1 = config_element("", "", { "tag" => "t1", "path" => "#{TMP_DIR}/non_existent_file.txt,#{TMP_DIR}/tail.txt", "format" => "none", "rotate_wait" => "2s", "pos_file" => "#{TMP_DIR}/tail.pos" }) config2 = config1 + config_element("", "", { "read_from_head" => true }) [config1, config2].each do |config| d = create_driver(config, false) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts "test3" f.puts "test4" } end # This test sometimes fails and it shows a potential bug of in_tail # https://github.com/fluent/fluentd/issues/1434 events = d.events assert_equal(2, events.length) assert_equal({"message" => "test3"}, events[0][2]) assert_equal({"message" => "test4"}, events[1][2]) end end sub_test_case "tail_path" do def test_tail_path_with_singleline File.open("#{TMP_DIR}/tail.txt", "wb") {|f| f.puts "test1" f.puts "test2" } d = create_driver(SINGLE_LINE_CONFIG + config_element("", "", { "path_key" => "path" })) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") {|f| f.puts "test3" f.puts "test4" } end events = d.events assert_equal(true, events.length > 0) events.each do |emit| assert_equal("#{TMP_DIR}/tail.txt", emit[2]["path"]) end end def test_tail_path_with_multiline_with_firstline File.open("#{TMP_DIR}/tail.txt", "wb") { |f| } config = config_element("", "", { "path_key" => "path", "format" => "multiline", "format1" => "/^s (?[^\\n]+)(\\nf (?[^\\n]+))?(\\nf (?.*))?/", "format_firstline" => "/^[s]/" }) d = create_driver(config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "f test1" f.puts "s test2" f.puts "f test3" f.puts "f test4" f.puts "s test5" f.puts "s test6" f.puts "f test7" f.puts "s test8" } end events = d.events assert_equal(4, events.length) events.each do |emit| assert_equal("#{TMP_DIR}/tail.txt", emit[2]["path"]) end end def test_tail_path_with_multiline_without_firstline File.open("#{TMP_DIR}/tail.txt", "wb") { |f| } config = config_element("", "", { "path_key" => "path", "format" => "multiline", "format1" => "/(?foo \\d)\\n/", "format2" => "/(?bar \\d)\\n/", "format3" => "/(?baz \\d)/", }) d = create_driver(config) d.run(expect_emits: 1) do File.open("#{TMP_DIR}/tail.txt", "ab") { |f| f.puts "foo 1" f.puts "bar 1" f.puts "baz 1" } end events = d.events assert(events.length > 0) events.each do |emit| assert_equal("#{TMP_DIR}/tail.txt", emit[2]["path"]) end end def test_tail_path_with_multiline_with_multiple_paths files = ["#{TMP_DIR}/tail1.txt", "#{TMP_DIR}/tail2.txt"] files.each { |file| File.open(file, "wb") { |f| } } config = config_element("", "", { "path" => "#{files[0]},#{files[1]}", "path_key" => "path", "tag" => "t1", "format" => "multiline", "format1" => "/^[s|f] (?.*)/", "format_firstline" => "/^[s]/" }) d = create_driver(config, false) d.run(expect_emits: 2) do files.each do |file| File.open(file, 'ab') { |f| f.puts "f #{file} line should be ignored" f.puts "s test1" f.puts "f test2" f.puts "f test3" f.puts "s test4" } end end events = d.events assert_equal(4, events.length) assert_equal(files, [events[0][2]["path"], events[1][2]["path"]].sort) # "test4" events are here because these events are flushed at shutdown phase assert_equal(files, [events[2][2]["path"], events[3][2]["path"]].sort) end end def test_limit_recently_modified now = Time.new(2010, 1, 2, 3, 4, 5) FileUtils.touch("#{TMP_DIR}/tail_unwatch.txt", mtime: (now - 3601)) FileUtils.touch("#{TMP_DIR}/tail_watch1.txt", mtime: (now - 3600)) FileUtils.touch("#{TMP_DIR}/tail_watch2.txt", mtime: now) config = config_element('', '', { 'tag' => 'tail', 'path' => "#{TMP_DIR}/*.txt", 'format' => 'none', 'limit_recently_modified' => '3600s' }) expected_files = [ "#{TMP_DIR}/tail_watch1.txt", "#{TMP_DIR}/tail_watch2.txt" ] Timecop.freeze(now) do plugin = create_driver(config, false).instance assert_equal expected_files, plugin.expand_paths.sort end end def test_skip_refresh_on_startup FileUtils.touch("#{TMP_DIR}/tail.txt") config = config_element('', '', { 'format' => 'none', 'refresh_interval' => 1, 'skip_refresh_on_startup' => true }) d = create_driver(config) d.run(shutdown: false) {} assert_equal 0, d.instance.instance_variable_get(:@tails).keys.size # detect a file at first execution of in_tail_refresh_watchers timer waiting(5) { sleep 0.1 until d.instance.instance_variable_get(:@tails).keys.size == 1 } d.instance_shutdown end end