Sha256: 8b764260a6b663e573f2e722e73b19e22ee5887b07923daa7615d0b9f95e30dd

Contents?: true

Size: 1.13 KB

Versions: 7

Compression:

Stored size: 1.13 KB

Contents

/**
 * <%= script_name %>
 */
 
/** 
 * Parameters - set default values here; you can override with -p on the command-line.
 *
 * INPUT_PATH  - location read by the LOAD statement below.
 * OUTPUT_PATH - location written by the STORE statement below; anything already
 *               there is removed with rmf before the results are stored.
 *               $MORTAR_EMAIL_S3_ESCAPED is not defined in this script
 *               (presumably supplied at run time - confirm).
 */
 
<%= '%default'%> INPUT_PATH 's3n://hawk-example-data/tutorial/excite.log.bz2'
<%= '%default'%> OUTPUT_PATH 's3n://my-output-bucket/$MORTAR_EMAIL_S3_ESCAPED/<%= script_name %>'

<% unless options[:skip_udf] %>
/**
 * User-Defined Functions (UDFs)
 *
 * Registers this script's Python UDF file; its functions are then called
 * through the alias given after AS.
 */

REGISTER '../udfs/python/<%= script_name %>.py' USING streaming_python AS <%= script_name %>;
<% end %>

-- Example: read the tab-delimited input and declare three chararray fields
my_input_data = LOAD '$INPUT_PATH'
    USING PigStorage('\t')
    AS (
        field0:chararray,
        field1:chararray,
        field2:chararray
    );

-- Example operation: keep only the records whose field0 is not null
filtered = FILTER my_input_data BY field0 IS NOT NULL;

<% if not options[:skip_udf] %>
-- This is an example call to a python user-defined function
with_udf_output = FOREACH filtered
                 GENERATE field0..field2,
                          <%= script_name %>.example_udf(field0) AS example_udf_field;
<% else %>
-- No UDF was generated for this script, so the fields are passed through unchanged.
-- Replace this projection with your own transformation.
with_udf_output = FOREACH filtered
                 GENERATE field0..field2;
<% end %>

-- Delete whatever already exists at the output location
rmf $OUTPUT_PATH;

-- Write the results out as tab-delimited text
STORE with_udf_output INTO '$OUTPUT_PATH' USING PigStorage('\t');

Version data entries

7 entries across 7 versions & 1 rubygem

Version Path
mortar-0.7.1 lib/mortar/templates/pigscript/pigscript.pig
mortar-0.7.0 lib/mortar/templates/pigscript/pigscript.pig
mortar-0.6.2 lib/mortar/templates/pigscript/pigscript.pig
mortar-0.6.1 lib/mortar/templates/pigscript/pigscript.pig
mortar-0.6.0 lib/mortar/templates/pigscript/pigscript.pig
mortar-0.5.1 lib/mortar/templates/pigscript/pigscript.pig
mortar-0.5.0 lib/mortar/templates/pigscript/pigscript.pig