# encoding: utf-8 require "logstash/devutils/rspec/spec_helper" require "logstash/filters/xml" describe LogStash::Filters::Xml do describe "parse standard xml (Deprecated checks)" do config <<-CONFIG filter { xml { source => "raw" target => "data" } } CONFIG sample("raw" => '') do insist { subject.get("tags") }.nil? insist { subject.get("data")} == {"key" => "value"} end #From parse xml with array as a value sample("raw" => 'value1value2') do insist { subject.get("tags") }.nil? insist { subject.get("data")} == {"key" => ["value1", "value2"]} end #From parse xml with hash as a value sample("raw" => 'value') do insist { subject.get("tags") }.nil? insist { subject.get("data")} == {"key1" => [{"key2" => ["value"]}]} end # parse xml in single item array sample("raw" => [""]) do insist { subject.get("tags") }.nil? insist { subject.get("data")} == {"bar" => "baz"} end # fail in multi items array sample("raw" => ["", "jojoba"]) do insist { subject.get("tags") }.include?("_xmlparsefailure") insist { subject.get("data")} == nil end # fail in empty array sample("raw" => []) do insist { subject.get("tags") }.include?("_xmlparsefailure") insist { subject.get("data")} == nil end # fail for non string field sample("raw" => {"foo" => "bar"}) do insist { subject.get("tags") }.include?("_xmlparsefailure") insist { subject.get("data")} == nil end # fail for non string single item array sample("raw" => [{"foo" => "bar"}]) do insist { subject.get("tags") }.include?("_xmlparsefailure") insist { subject.get("data")} == nil end #From bad xml sample("raw" => ' "raw" target => "data" store_xml => false } } CONFIG sample("raw" => '') do insist { subject.get("tags") }.nil? insist { subject.get("data")} == nil end end describe "parse xml and store values with xpath (Deprecated checks)" do config <<-CONFIG filter { xml { source => "raw" target => "data" xpath => [ "/foo/key/text()", "xpath_field" ] } } CONFIG # Single value sample("raw" => 'value') do insist { subject.get("tags") }.nil? insist { subject.get("xpath_field")} == ["value"] end #Multiple values sample("raw" => 'value1value2') do insist { subject.get("tags") }.nil? insist { subject.get("xpath_field")} == ["value1","value2"] end end ## New tests describe "parse standard xml" do config <<-CONFIG filter { xml { source => "xmldata" target => "data" } } CONFIG sample("xmldata" => '') do insist { subject.get("tags") }.nil? insist { subject.get("data") } == {"key" => "value"} end #From parse xml with array as a value sample("xmldata" => 'value1value2') do insist { subject.get("tags") }.nil? insist { subject.get("data") } == {"key" => ["value1", "value2"]} end #From parse xml with hash as a value sample("xmldata" => 'value') do insist { subject.get("tags") }.nil? insist { subject.get("data") } == {"key1" => [{"key2" => ["value"]}]} end #From bad xml sample("xmldata" => ' "xmldata" target => "data" store_xml => false } } CONFIG sample("xmldata" => '') do insist { subject.get("tags") }.nil? insist { subject.get("data")} == nil end end describe "parse xml and store values with xpath" do config <<-CONFIG filter { xml { source => "xmldata" target => "data" xpath => [ "/foo/key/text()", "xpath_field" ] } } CONFIG # Single value sample("xmldata" => 'value') do insist { subject.get("tags") }.nil? insist { subject.get("xpath_field") } == ["value"] end #Multiple values sample("xmldata" => 'value1value2') do insist { subject.get("tags") }.nil? insist { subject.get("xpath_field") } == ["value1","value2"] end end describe "parse correctly non ascii content with xpath" do config <<-CONFIG filter { xml { source => "xmldata" target => "data" xpath => [ "/foo/key/text()", "xpath_field" ] } } CONFIG # Single value sample("xmldata" => 'Français') do insist { subject.get("tags") }.nil? insist { subject.get("xpath_field")} == ["Français"] end end describe "parse including namespaces" do config <<-CONFIG filter { xml { source => "xmldata" xpath => [ "/foo/h:div", "xpath_field" ] remove_namespaces => false } } CONFIG # Single value sample("xmldata" => 'Content') do insist { subject.get("xpath_field") } == ["Content"] end end describe "parse including namespaces declarations on root" do config <<-CONFIG filter { xml { source => "xmldata" xpath => [ "/foo/h:div", "xpath_field" ] namespaces => {"h" => "http://www.w3.org/TR/html4/"} remove_namespaces => false } } CONFIG # Single value sample("xmldata" => 'Content') do insist { subject.get("xpath_field") } == ["Content"] end end describe "parse including namespaces declarations on child" do config <<-CONFIG filter { xml { source => "xmldata" xpath => [ "/foo/h:div", "xpath_field" ] namespaces => {"h" => "http://www.w3.org/TR/html4/"} remove_namespaces => false } } CONFIG # Single value sample("xmldata" => 'Content') do insist { subject.get("xpath_field") } == ["Content"] end end describe "parse removing namespaces" do config <<-CONFIG filter { xml { source => "xmldata" xpath => [ "/foo/div", "xpath_field" ] remove_namespaces => true } } CONFIG # Single value sample("xmldata" => 'Content') do insist { subject.get("xpath_field") } == ["
Content
"] end end describe "parse with forcing array (Default)" do config <<-CONFIG filter { xml { source => "xmldata" target => "parseddata" } } CONFIG # Single value sample("xmldata" => 'Content') do insist { subject.get("parseddata") } == { "bar" => ["Content"] } end end describe "parse disabling forcing array" do config <<-CONFIG filter { xml { source => "xmldata" target => "parseddata" force_array => false } } CONFIG # Single value sample("xmldata" => 'Content') do insist { subject.get("parseddata") } == { "bar" => "Content" } end end end