blob: 4f823708252e3c79202113386df1d0bfe698aeae [file] [log] [blame]
-- PigMix L2: exercises a join in which one input is small enough for the
-- join to be executed as a fragment-replicate join.
register $PIGMIX_JAR

-- Page view records, read through the PigMix performance loader.
page_views = load '$HDFS_ROOT/page_views'
    using org.apache.pig.test.pigmix.udf.PigPerformanceLoader()
    as (user, action, timespent, query_term, ip_addr, timestamp,
        estimated_revenue, page_info, page_links);

-- Only the join key and the revenue column are carried into the join.
view_revenue = foreach page_views generate user, estimated_revenue;

-- Power user records, with fields delimited by the U+0001 character.
power_users = load '$HDFS_ROOT/power_users'
    using PigStorage('\u0001')
    as (name, phone, address, city, state, zip);

-- Only the name column is needed as the join key on this side.
power_names = foreach power_users generate name;

-- Replicated join of page views against the power user names.
-- NOTE(review): a replicated join is expected to run map-side, so the
-- parallel clause below probably has no effect here -- confirm.
joined = join view_revenue by user, power_names by name
    using 'replicated' parallel $PARALLEL;

-- Write the joined rows to the L2 output directory.
store joined into '$PIGMIX_OUTPUT/L2out';