Sha256: 4634a5206506fd6822d8108c09578a381c25836f07a19726003b5f28a3cbe1a8
Contents?: true
Size: 1.13 KB
Versions: 2
Compression:
Stored size: 1.13 KB
Contents
# Spike: a Pig Latin script rewritten statement by statement in a Ruby DSL.
# Each Pig statement is kept as a comment directly above its Ruby counterpart.

# Pig Latin:
#
#   raw_ads =
#     LOAD '$INPUT/ads*'
#     USING PigStorage AS (
#       ad_id:chararray,
#       api_key:chararray,
#       name:chararray,
#       dimensions:chararray,
#       destination:chararray,
#       agent_version:chararray
#     );
#
# All six columns share the chararray type, so the schema pairs are derived
# from the column list and splatted into `as`.
ad_columns = [:ad_id, :api_key, :name, :dimensions, :destination, :agent_version]

raw_ads << load('$INPUT/ads*').using(:pig_storage).as(
  *ad_columns.map { |column| [column, :chararray] }
)

# Pig Latin:
#
#   ads =
#     FOREACH
#       (GROUP raw_ads BY ad_id PARALLEL $PARALLELISM)
#     GENERATE
#       $0 AS ad_id,
#       MAX($1.api_key) AS api_key,
#       MAX($1.name) AS name,
#       MAX($1.dimensions) AS dimensions,
#       MAX($1.destination) AS destination,
#       MAX($1.agent_version) AS agent_version
#     ;
#
# NOTE(review): the PARALLEL $PARALLELISM clause of the Pig statement has no
# counterpart in the Ruby expression below.
ads << raw_ads.group(:ad_id).foreach do |grouped|
  group_key = grouped[0] # $0 in the Pig statement
  rows = grouped[1]      # $1 in the Pig statement

  [
    group_key.as(:ad_id),
    rows.api_key.max.as(:api_key),
    rows.name.max.as(:name),
    rows.dimensions.max.as(:dimensions),
    rows.destination.max.as(:destination),
    rows.agent_version.max.as(:agent_version)
  ]
end

# Pig Latin:
#
#   STORE ads INTO '$OUTPUT/ads' USING PigStorage;
ads.store('$OUTPUT/ads').using(:pig_storage)
Version data entries
2 entries across 2 versions & 1 rubygems
Version | Path |
---|---|
piglet-0.1.1 | examples/spike1.rb |
piglet-0.1.0 | examples/spike1.rb |