blob: 97c4b76f507eaf02d9806913bcab71dc04ee24fb [file] [log] [blame]
-- Per-user aggregates over DISTINCT values of three page_views columns.
-- The jar path, HDFS root, reducer parallelism and output root are all
-- supplied through Pig parameter substitution.
REGISTER $PIGMIX_JAR

-- Read the page_views data set through the PigPerformanceLoader UDF.
-- No field types are declared in the AS clause.
page_views = LOAD '$HDFS_ROOT/page_views'
    USING org.apache.pig.test.pigmix.udf.PigPerformanceLoader()
    AS (user, action, timespent, query_term, ip_addr, timestamp,
        estimated_revenue, page_info, page_links);

-- Keep only the grouping key and the three columns that get aggregated.
projected = FOREACH page_views GENERATE user, action, estimated_revenue, timespent;

-- One group per user, with the reduce-side parallelism taken from a parameter.
by_user = GROUP projected BY user PARALLEL $PARALLEL;

-- Within each user group, de-duplicate every column independently and then
-- aggregate the de-duplicated bags.
per_user = FOREACH by_user {
    uniq_actions   = DISTINCT projected.action;
    uniq_revenue   = DISTINCT projected.estimated_revenue;
    uniq_timespent = DISTINCT projected.timespent;
    -- Emits: user, number of distinct actions, sum of distinct revenues,
    -- and the average of distinct timespent values cast to int.
    GENERATE group, COUNT(uniq_actions), SUM(uniq_revenue), (int)AVG(uniq_timespent);
}

STORE per_user INTO '$PIGMIX_OUTPUT/L15out';