-- blob: f660800bf132b3fbd7a3cdd378abfefc219a83cc [file] [log] [blame]
---------------------------------------------------------------------
-- Top N Queries.
---------------------------------------------------------------------
-- Parameters (supplied through Pig parameter substitution):
--   input    : location of the records to load, read as (query, count) pairs
--   output   : location the final top-N relation is stored to
--   reducers : PARALLEL setting for the GROUP and ORDER stages
--   n        : number of rows kept by the final LIMIT

-- Load the raw records. No USING clause is given, so Pig's default load
-- function is used; each record is read as a query string and an integer count.
data =
    LOAD '$input'
    AS (query:CHARARRAY, count:INT);

-- Gather every record that shares the same query string into one group.
queries_group =
    GROUP data
    BY query
    PARALLEL $reducers;

-- Collapse each group into a single row: the query and the sum of its counts.
queries_sum =
    FOREACH queries_group
    GENERATE
        group AS query,
        SUM(data.count) AS count;

-- Sort by total, largest first. The secondary key on query breaks ties on
-- count, so the rows that survive the LIMIT below are the same on every run
-- instead of depending on how equal-count rows happened to be ordered.
queries_ordered =
    ORDER queries_sum
    BY count DESC, query ASC
    PARALLEL $reducers;

-- Keep only the first n rows of the ordered relation.
queries_limit = LIMIT queries_ordered $n;

STORE queries_limit INTO '$output';