| register $PIGMIX_JAR |
| A = load '$HDFS_ROOT/page_views' using org.apache.pig.test.pigmix.udf.PigPerformanceLoader() |
| as (user, action, timespent, query_term, ip_addr, timestamp, estimated_revenue, page_info, page_links); |
| B = foreach A generate user, action, estimated_revenue, timespent; |
| C = group B by user parallel $PARALLEL; |
| D = foreach C { |
| beth = distinct B.action; |
| rev = distinct B.estimated_revenue; |
| ts = distinct B.timespent; |
| generate group, COUNT(beth), SUM(rev), (int)AVG(ts); |
| } |
| store D into '$PIGMIX_OUTPUT/L15out'; |
| |