-- blob: a868ca0c7741ee784916f76c09c989b4703c0596 [file] [log] [blame]
-- Exercises a nested FOREACH plan that splits each group's bag with two filters.
-- Parameters supplied at invocation: $PIGMIX_JAR, $HDFS_ROOT, $PARALLEL, $PIGMIX_OUTPUT.
register $PIGMIX_JAR

-- Read the page_views data set through the PigMix loader UDF; fields are left untyped.
page_views = LOAD '$HDFS_ROOT/page_views'
    USING org.apache.pig.test.pigmix.udf.PigPerformanceLoader()
    AS (user, action, timespent, query_term, ip_addr, timestamp,
        estimated_revenue, page_info, page_links);

-- Only user and timestamp are needed downstream, so project them early.
user_times = FOREACH page_views GENERATE user, timestamp;

-- Collect every (user, timestamp) row of a user into one bag.
by_user = GROUP user_times BY user PARALLEL $PARALLEL;

-- For each user, partition the bag around the 43200 threshold and count both sides.
-- NOTE(review): 43200 is presumably the number of seconds in half a day -- confirm
-- against the data generator.
half_day_counts = FOREACH by_user {
    before_noon = FILTER user_times BY timestamp < 43200;
    after_noon = FILTER user_times BY timestamp >= 43200;
    GENERATE group, COUNT(before_noon), COUNT(after_noon);
}

-- Emit one row per user: (user, count below threshold, count at or above threshold).
STORE half_day_counts INTO '$PIGMIX_OUTPUT/L7out';