register $PIGMIX_JAR | |
A = load '$HDFS_ROOT/page_views' using org.apache.pig.test.pigmix.udf.PigPerformanceLoader() | |
as (user, action, timespent, query_term, ip_addr, timestamp, estimated_revenue, page_info, page_links); | |
B = foreach A generate user, estimated_revenue; | |
C = group B by user parallel $PARALLEL; | |
D = foreach C { | |
E = order B by estimated_revenue; | |
F = E.estimated_revenue; | |
generate group, SUM(F); | |
} | |
store D into '$PIGMIX_OUTPUT/L16out'; | |