Sha256: 2ba7c08b2e592c30c72cb60d1a62e0fc870e613ad52cbcce3a76ba48da85adb7

Contents?: true

Size: 770 Bytes

Versions: 3

Compression:

Stored size: 770 Bytes

Contents

#! /usr/bin/env jruby
$: << File.join(File.dirname(__FILE__), '..', 'lib')

require 'cascading'
require 'samples/cascading'

# Sample script: declares a cascade named 'union' containing a single flow of
# the same name, then calls #complete on it with sample_properties.
# NOTE(review): sample_properties is not defined in this file; presumably it
# comes from samples/cascading -- confirm.
union_cascade = cascade('union') do
  flow('union') do
    # Source tap registered under the name 'input', matching the assembly below.
    source('input', tap('http://www.census.gov/genealogy/names/dist.all.last'))

    assembly('input') do
      split('line', ['name', 'score1', 'score2', 'id'])

      # The two branches are declared identically except for the score field
      # they group on; each renames that field to 'score'.
      # NOTE(review): presumably this is so both branches expose the same
      # field names for the union -- confirm against the DSL.
      branch('branch1') do
        group_by('score1', 'name') { count }
        rename('score1' => 'score')
      end

      branch('branch2') do
        group_by('score2', 'name') { count }
        rename('score2' => 'score')
      end
    end

    # Combines the two branches declared above under the name 'union'.
    assembly('union') do
      union('branch1', 'branch2')
    end

    # Sink tap registered under the name 'union', matching the assembly above.
    sink('union', tap('output/union', :sink_mode => :replace))
  end
end

union_cascade.complete(sample_properties)

Version data entries

3 entries across 3 versions & 1 rubygem

Version Path
cascading.jruby-0.0.6 samples/union.rb
cascading.jruby-0.0.5 samples/union.rb
cascading.jruby-0.0.4 samples/union.rb