| -- This script tests using a join small enough to do in fragment and replicate. |
| register $PIGMIX_JAR |
| A = load '$HDFS_ROOT/page_views' using org.apache.pig.test.pigmix.udf.PigPerformanceLoader() |
| as (user, action, timespent, query_term, ip_addr, timestamp, |
| estimated_revenue, page_info, page_links); |
| B = foreach A generate user, estimated_revenue; |
| alpha = load '$HDFS_ROOT/power_users' using PigStorage('\u0001') as (name, phone, |
| address, city, state, zip); |
| beta = foreach alpha generate name; |
| C = join B by user, beta by name using 'replicated' parallel $PARALLEL; |
| store C into '$PIGMIX_OUTPUT/L2out'; |
| |