require 'spec_helper' describe Riak::MapReduce do before :each do @client = Riak::Client.new @backend = mock("Backend") @client.stub!(:backend).and_yield(@backend) @mr = Riak::MapReduce.new(@client) end it "should require a client" do lambda { Riak::MapReduce.new }.should raise_error lambda { Riak::MapReduce.new(@client) }.should_not raise_error end it "should initialize the inputs and query to empty arrays" do @mr.inputs.should == [] @mr.query.should == [] end it "should yield itself when given a block on initializing" do @mr2 = nil @mr = Riak::MapReduce.new(@client) do |mr| @mr2 = mr end @mr2.should == @mr end describe "adding inputs" do it "should return self for chaining" do @mr.add("foo", "bar").should == @mr end it "should add bucket/key pairs to the inputs" do @mr.add("foo","bar") @mr.inputs.should == [["foo","bar"]] end it "should add an array containing a bucket/key pair to the inputs" do @mr.add(["foo","bar"]) @mr.inputs.should == [["foo","bar"]] end it "should add an object to the inputs by its bucket and key" do bucket = Riak::Bucket.new(@client, "foo") obj = Riak::RObject.new(bucket, "bar") @mr.add(obj) @mr.inputs.should == [["foo", "bar"]] end it "should add an array containing a bucket/key/key-data triple to the inputs" do @mr.add(["foo","bar",1000]) @mr.inputs.should == [["foo","bar",1000]] end it "should use a bucket name as the single input" do @mr.add(Riak::Bucket.new(@client, "foo")) @mr.inputs.should == "foo" @mr.add("docs") @mr.inputs.should == "docs" end it "should accept a list of key-filters along with a bucket" do @mr.add("foo", [[:tokenize, "-", 3], [:string_to_int], [:between, 2009, 2010]]) @mr.inputs.should == {:bucket => "foo", :key_filters => [[:tokenize, "-", 3], [:string_to_int], [:between, 2009, 2010]]} end it "should add a bucket and filter list via a builder block" do @mr.filter("foo") do tokenize "-", 3 string_to_int between 2009, 2010 end @mr.inputs.should == {:bucket => "foo", :key_filters => [[:tokenize, "-", 3], [:string_to_int], [:between, 2009, 2010]]} end context "using secondary indexes as inputs" do it "should set the inputs for equality" do @mr.index("foo", "email_bin", "sean@basho.com").should == @mr @mr.inputs.should == {:bucket => "foo", :index => "email_bin", :key => "sean@basho.com"} end it "should set the inputs for a range" do @mr.index("foo", "rank_int", 10..20).should == @mr @mr.inputs.should == {:bucket => "foo", :index => "rank_int", :start => 10, :end => 20} end it "should raise an error when given an invalid query" do expect { @mr.index("foo", "rank_int", 1.0348) }.to raise_error(ArgumentError) expect { @mr.index("foo", "rank_int", Range.new(1.03, 1.05)) }.to raise_error(ArgumentError) end end describe "escaping" do before { @oldesc, Riak.escaper = Riak.escaper, CGI } after { Riak.escaper = @oldesc } context "when url_decoding is false" do before { @urldecode, Riak.url_decoding = Riak.url_decoding, false } after { Riak.url_decoding = @urldecode } it "should add bucket/key pairs to the inputs with bucket and key escaped" do @mr.add("[foo]","(bar)") @mr.inputs.should == [["%5Bfoo%5D","%28bar%29"]] end it "should add an escaped array containing a bucket/key pair to the inputs" do @mr.add(["[foo]","(bar)"]) @mr.inputs.should == [["%5Bfoo%5D","%28bar%29"]] end it "should add an object to the inputs by its escaped bucket and key" do bucket = Riak::Bucket.new(@client, "[foo]") obj = Riak::RObject.new(bucket, "(bar)") @mr.add(obj) @mr.inputs.should == [["%5Bfoo%5D", "%28bar%29"]] end it "should add an escaped array containing a bucket/key/key-data triple to the inputs" do @mr.add(["[foo]","(bar)","[]()"]) @mr.inputs.should == [["%5Bfoo%5D", "%28bar%29","[]()"]] end it "should use an escaped bucket name as the single input" do @mr.add(Riak::Bucket.new(@client, "[foo]")) @mr.inputs.should == "%5Bfoo%5D" @mr.add("docs") @mr.inputs.should == "docs" end end context "when url_decoding is true" do before { @urldecode, Riak.url_decoding = Riak.url_decoding, true } after { Riak.url_decoding = @urldecode } it "should add bucket/key pairs to the inputs with bucket and key unescaped" do @mr.add("[foo]","(bar)") @mr.inputs.should == [["[foo]","(bar)"]] end it "should add an unescaped array containing a bucket/key pair to the inputs" do @mr.add(["[foo]","(bar)"]) @mr.inputs.should == [["[foo]","(bar)"]] end it "should add an object to the inputs by its unescaped bucket and key" do bucket = Riak::Bucket.new(@client, "[foo]") obj = Riak::RObject.new(bucket, "(bar)") @mr.add(obj) @mr.inputs.should == [["[foo]","(bar)"]] end it "should add an unescaped array containing a bucket/key/key-data triple to the inputs" do @mr.add(["[foo]","(bar)","[]()"]) @mr.inputs.should == [["[foo]","(bar)","[]()"]] end it "should use an unescaped bucket name as the single input" do @mr.add(Riak::Bucket.new(@client, "[foo]")) @mr.inputs.should == "[foo]" @mr.add("docs") @mr.inputs.should == "docs" end end end context "escaping" do before { @oldesc, Riak.escaper = Riak.escaper, CGI } after { Riak.escaper = @oldesc } it "should add bucket/key pairs to the inputs with bucket and key escaped" do @mr.add("[foo]","(bar)") @mr.inputs.should == [["%5Bfoo%5D","%28bar%29"]] end it "should add an escaped array containing a bucket/key pair to the inputs" do @mr.add(["[foo]","(bar)"]) @mr.inputs.should == [["%5Bfoo%5D","%28bar%29"]] end it "should add an object to the inputs by its escaped bucket and key" do bucket = Riak::Bucket.new(@client, "[foo]") obj = Riak::RObject.new(bucket, "(bar)") @mr.add(obj) @mr.inputs.should == [["%5Bfoo%5D", "%28bar%29"]] end it "should add an escaped array containing a bucket/key/key-data triple to the inputs" do @mr.add(["[foo]","(bar)","[]()"]) @mr.inputs.should == [["%5Bfoo%5D", "%28bar%29","[]()"]] end it "should use an escaped bucket name as the single input" do @mr.add(Riak::Bucket.new(@client, "[foo]")) @mr.inputs.should == "%5Bfoo%5D" @mr.add("docs") @mr.inputs.should == "docs" end end context "when adding an input that will result in full-bucket mapreduce" do before { Riak.disable_list_keys_warnings = false } after { Riak.disable_list_keys_warnings = true } it "should warn about list-keys on buckets" do @mr.should_receive(:warn).twice @mr.add("foo") @mr.add(Riak::Bucket.new(@client, "foo")) end it "should warn about list-keys on key-filters" do @mr.should_receive(:warn) @mr.filter("foo") { matches "bar" } end end end [:map, :reduce].each do |type| describe "adding #{type} phases" do it "should return self for chaining" do @mr.send(type, "function(){}").should == @mr end it "should accept a function string" do @mr.send(type, "function(){}") @mr.query.should have(1).items phase = @mr.query.first phase.function.should == "function(){}" phase.type.should == type end it "should accept a function and options" do @mr.send(type, "function(){}", :keep => true) @mr.query.should have(1).items phase = @mr.query.first phase.function.should == "function(){}" phase.type.should == type phase.keep.should be_true end it "should accept a module/function pair" do @mr.send(type, ["riak","mapsomething"]) @mr.query.should have(1).items phase = @mr.query.first phase.function.should == ["riak", "mapsomething"] phase.type.should == type phase.language.should == "erlang" end it "should accept a module/function pair with extra options" do @mr.send(type, ["riak", "mapsomething"], :arg => [1000]) @mr.query.should have(1).items phase = @mr.query.first phase.function.should == ["riak", "mapsomething"] phase.type.should == type phase.language.should == "erlang" phase.arg.should == [1000] end end end describe "adding link phases" do it "should return self for chaining" do @mr.link({}).should == @mr end it "should accept a WalkSpec" do @mr.link(Riak::WalkSpec.new(:tag => "next")) @mr.query.should have(1).items phase = @mr.query.first phase.type.should == :link phase.function.should be_kind_of(Riak::WalkSpec) phase.function.tag.should == "next" end it "should accept a WalkSpec and a hash of options" do @mr.link(Riak::WalkSpec.new(:bucket => "foo"), :keep => true) @mr.query.should have(1).items phase = @mr.query.first phase.type.should == :link phase.function.should be_kind_of(Riak::WalkSpec) phase.function.bucket.should == "foo" phase.keep.should be_true end it "should accept a hash of options intermingled with the walk spec options" do @mr.link(:tag => "snakes", :arg => [1000]) @mr.query.should have(1).items phase = @mr.query.first phase.arg.should == [1000] phase.function.should be_kind_of(Riak::WalkSpec) phase.function.tag.should == "snakes" end end describe "converting to JSON for the job" do it "should include the inputs and query keys" do @mr.to_json.should =~ /"inputs":/ end it "should map phases to their JSON equivalents" do phase = Riak::MapReduce::Phase.new(:type => :map, :function => "function(){}") @mr.query << phase @mr.to_json.should include('"source":"function(){}"') @mr.to_json.should include('"query":[{"map":{') end it "should emit only the bucket name when the input is the whole bucket" do @mr.add("foo") @mr.to_json.should include('"inputs":"foo"') end it "should emit an array of inputs when there are multiple inputs" do @mr.add("foo","bar",1000).add("foo","baz") @mr.to_json.should include('"inputs":[["foo","bar",1000],["foo","baz"]]') end it "should add the timeout value when set" do @mr.timeout(50000) @mr.to_json.should include('"timeout":50000') end end it "should return self from setting the timeout" do @mr.timeout(5000).should == @mr end describe "executing the map reduce job" do before :each do @mr.map("Riak.mapValues",:keep => true) end it "should raise an exception when no phases are defined" do @mr.query.clear lambda { @mr.run }.should raise_error(Riak::MapReduceError) end it "should submit the query to the backend" do @backend.should_receive(:mapred).with(@mr).and_return([]) @mr.run.should == [] end it "should pass the given block to the backend for streaming" do arr = [] @backend.should_receive(:mapred).with(@mr).and_yield("foo").and_yield("bar") @mr.run {|v| arr << v } arr.should == ["foo", "bar"] end it "should interpret failed requests with JSON content-types as map reduce errors" do @backend.stub!(:mapred).and_raise(Riak::HTTPFailedRequest.new(:post, 200, 500, {"content-type" => ["application/json"]}, '{"error":"syntax error"}')) lambda { @mr.run }.should raise_error(Riak::MapReduceError) begin @mr.run rescue Riak::MapReduceError => mre mre.message.should include('{"error":"syntax error"}') else fail "No exception raised!" end end it "should re-raise non-JSON error responses" do @backend.stub!(:mapred).and_raise(Riak::HTTPFailedRequest.new(:post, 200, 500, {"content-type" => ["text/plain"]}, 'Oops, you bwoke it.')) lambda { @mr.run }.should raise_error(Riak::FailedRequest) end end end