Sha256: 014e2521324ec3b4655773929ab2f951547fd1077473916060afe24cd1887e22

Contents?: true

Size: 1.08 KB

Versions: 5

Compression:

Stored size: 1.08 KB

Contents

/**
 * <%= script_name %>
 *
 * Required parameters:
 *
 * - INPUT_PATH Input path for script data (e.g. s3n://hawk-example-data/tutorial/excite.log.bz2)
 * - OUTPUT_PATH Output path for script data (e.g. s3n://my-output-bucket/<%= script_name %>)
 */

<% unless options[:skip_udf] %>
/**
 * User-Defined Functions (UDFs)
 *
 * Registers this script's Python UDF file so its functions can be called
 * below through the <%= script_name %> namespace.
 */
REGISTER '../udfs/python/<%= script_name %>.py' USING streaming_python AS <%= script_name %>;
<% end %>

-- Example load step: read tab-delimited records from $INPUT_PATH
-- into three chararray fields.
my_input_data =
    LOAD '$INPUT_PATH'
    USING PigStorage('\t')
    AS (field0:chararray, field1:chararray, field2:chararray);

-- Example Pig operation: keep only the records whose first field is present.
filtered = FILTER my_input_data BY field0 IS NOT NULL;

<% if not options[:skip_udf] %>
-- Example call to a Python user-defined function. The <%= script_name %> namespace
-- only exists when the REGISTER statement above is emitted, so this call is
-- guarded by the same skip_udf condition.
with_udf_output = FOREACH filtered
                 GENERATE field0..field2,
                          <%= script_name %>.example_udf(field0) AS example_udf_field;
<% else %>
-- UDFs were skipped for this script, so nothing is registered to call.
-- Pass the filtered fields through unchanged; the alias name is kept so the
-- STORE statement below works whether or not UDFs are generated.
with_udf_output = FOREACH filtered
                 GENERATE field0..field2;
<% end %>

-- Clear out anything already present at the output path before storing.
rmf $OUTPUT_PATH;

-- Write the final relation to $OUTPUT_PATH as tab-delimited text.
STORE with_udf_output INTO '$OUTPUT_PATH' USING PigStorage('\t');

Version data entries

5 entries across 5 versions & 1 rubygem

Version Path
mortar-0.4.4 lib/mortar/templates/pigscript/pigscript.pig
mortar-0.4.3 lib/mortar/templates/pigscript/pigscript.pig
mortar-0.4.2 lib/mortar/templates/pigscript/pigscript.pig
mortar-0.4.1 lib/mortar/templates/pigscript/pigscript.pig
mortar-0.4.0 lib/mortar/templates/pigscript/pigscript.pig