---------------------------------------------------------------------
-- Top N Queries: sums the counts per query and keeps the $n largest.
-- Parameters: $input, $output, $reducers, $n.
---------------------------------------------------------------------
-- Pipeline: load (query, count) records, total the counts per distinct
-- query, sort by total descending, keep the first $n rows, store them.
--
-- Parameters substituted by Pig before execution:
--   $input    - location of the input records
--   $output   - location the result is stored to
--   $reducers - PARALLEL level for the GROUP and ORDER steps
--   $n        - number of rows to keep

-- No USING clause is given, so Pig's default load function is used.
data =
    LOAD '$input'
    AS (query:CHARARRAY, count:INT);

-- Collect all records that share the same query string.
queries_group =
    GROUP data
    BY query
    PARALLEL $reducers;

-- One output row per query: the group key and the total of its counts.
queries_sum =
    FOREACH queries_group
    GENERATE
        group AS query,
        SUM(data.count) AS count;

-- Largest totals first. The secondary key on query breaks ties, so the
-- rows kept by the LIMIT below are the same on every run when several
-- queries share the same total.
queries_ordered =
    ORDER queries_sum
    BY count DESC, query ASC
    PARALLEL $reducers;

-- Keep only the first $n rows of the ordered relation.
queries_limit = LIMIT queries_ordered $n;

STORE queries_limit INTO '$output';