blob: d10fee577c70b6b5cfc83f3a86edd4c94b975d1a [file] [log] [blame]
PREHOOK: query: DESCRIBE FUNCTION percentile_disc
PREHOOK: type: DESCFUNCTION
POSTHOOK: query: DESCRIBE FUNCTION percentile_disc
POSTHOOK: type: DESCFUNCTION
percentile_disc(input, pc) - Returns the percentile of expr at pc (range: [0,1]) without interpolation.
PREHOOK: query: DESCRIBE FUNCTION EXTENDED percentile_disc
PREHOOK: type: DESCFUNCTION
POSTHOOK: query: DESCRIBE FUNCTION EXTENDED percentile_disc
POSTHOOK: type: DESCFUNCTION
percentile_disc(input, pc) - Returns the percentile of expr at pc (range: [0,1]) without interpolation.
Function class:org.apache.hadoop.hive.ql.udf.generic.GenericUDAFPercentileDisc
Function type:BUILTIN
PREHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(CAST(substr(value, 5) AS INT), 0.0),
percentile_disc(CAST(substr(value, 5) AS DOUBLE), 0.5),
percentile_disc(0.5) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS INT)),
percentile_disc(CAST(substr(value, 5) AS DECIMAL), 1.0),
percentile_disc(array(0.0, 0.5, 1.0)) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS DOUBLE))
FROM src
GROUP BY CAST(key AS INT) DIV 10
PREHOOK: type: QUERY
PREHOOK: Input: default@src
#### A masked pattern was here ####
POSTHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(CAST(substr(value, 5) AS INT), 0.0),
percentile_disc(CAST(substr(value, 5) AS DOUBLE), 0.5),
percentile_disc(0.5) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS INT)),
percentile_disc(CAST(substr(value, 5) AS DECIMAL), 1.0),
percentile_disc(array(0.0, 0.5, 1.0)) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS DOUBLE))
FROM src
GROUP BY CAST(key AS INT) DIV 10
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
#### A masked pattern was here ####
0 0.0 5.0 5.0 9.0 [0.0,5.0,9.0]
1 10.0 15.0 15.0 19.0 [10.0,15.0,19.0]
10 100.0 103.0 103.0 105.0 [100.0,103.0,105.0]
11 111.0 118.0 118.0 119.0 [111.0,118.0,119.0]
12 120.0 128.0 128.0 129.0 [120.0,128.0,129.0]
13 131.0 137.0 137.0 138.0 [131.0,137.0,138.0]
14 143.0 146.0 146.0 149.0 [143.0,146.0,149.0]
15 150.0 155.0 155.0 158.0 [150.0,155.0,158.0]
16 160.0 167.0 167.0 169.0 [160.0,167.0,169.0]
17 170.0 175.0 175.0 179.0 [170.0,175.0,179.0]
18 180.0 187.0 187.0 189.0 [180.0,187.0,189.0]
19 190.0 195.0 195.0 199.0 [190.0,195.0,199.0]
2 20.0 26.0 26.0 28.0 [20.0,26.0,28.0]
20 200.0 205.0 205.0 209.0 [200.0,205.0,209.0]
21 213.0 217.0 217.0 219.0 [213.0,217.0,219.0]
22 221.0 224.0 224.0 229.0 [221.0,224.0,229.0]
23 230.0 235.0 235.0 239.0 [230.0,235.0,239.0]
24 241.0 244.0 244.0 249.0 [241.0,244.0,249.0]
25 252.0 256.0 256.0 258.0 [252.0,256.0,258.0]
26 260.0 265.0 265.0 266.0 [260.0,265.0,266.0]
27 272.0 275.0 275.0 278.0 [272.0,275.0,278.0]
28 280.0 284.0 284.0 289.0 [280.0,284.0,289.0]
29 291.0 298.0 298.0 298.0 [291.0,298.0,298.0]
3 30.0 35.0 35.0 37.0 [30.0,35.0,37.0]
30 302.0 307.0 307.0 309.0 [302.0,307.0,309.0]
31 310.0 316.0 316.0 318.0 [310.0,316.0,318.0]
32 321.0 325.0 325.0 327.0 [321.0,325.0,327.0]
33 331.0 333.0 333.0 339.0 [331.0,333.0,339.0]
34 341.0 345.0 345.0 348.0 [341.0,345.0,348.0]
35 351.0 353.0 353.0 356.0 [351.0,353.0,356.0]
36 360.0 367.0 367.0 369.0 [360.0,367.0,369.0]
37 373.0 377.0 377.0 379.0 [373.0,377.0,379.0]
38 382.0 384.0 384.0 389.0 [382.0,384.0,389.0]
39 392.0 396.0 396.0 399.0 [392.0,396.0,399.0]
4 41.0 43.0 43.0 47.0 [41.0,43.0,47.0]
40 400.0 404.0 404.0 409.0 [400.0,404.0,409.0]
41 411.0 417.0 417.0 419.0 [411.0,417.0,419.0]
42 421.0 427.0 427.0 429.0 [421.0,427.0,429.0]
43 430.0 435.0 435.0 439.0 [430.0,435.0,439.0]
44 443.0 446.0 446.0 449.0 [443.0,446.0,449.0]
45 452.0 455.0 455.0 459.0 [452.0,455.0,459.0]
46 460.0 468.0 468.0 469.0 [460.0,468.0,469.0]
47 470.0 477.0 477.0 479.0 [470.0,477.0,479.0]
48 480.0 484.0 484.0 489.0 [480.0,484.0,489.0]
49 490.0 495.0 495.0 498.0 [490.0,495.0,498.0]
5 51.0 54.0 54.0 58.0 [51.0,54.0,58.0]
6 64.0 67.0 67.0 69.0 [64.0,67.0,69.0]
7 70.0 74.0 74.0 78.0 [70.0,74.0,78.0]
8 80.0 84.0 84.0 87.0 [80.0,84.0,87.0]
9 90.0 95.0 95.0 98.0 [90.0,95.0,98.0]
PREHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(CAST(substr(value, 5) AS INT), 0.0),
percentile_disc(CAST(substr(value, 5) AS DOUBLE), 0.5),
percentile_disc(0.5) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS INT)),
percentile_disc(CAST(substr(value, 5) AS DECIMAL), 1.0),
percentile_disc(array(0.0, 0.5, 1.0)) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS DOUBLE))
FROM src
GROUP BY CAST(key AS INT) DIV 10
PREHOOK: type: QUERY
PREHOOK: Input: default@src
#### A masked pattern was here ####
POSTHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(CAST(substr(value, 5) AS INT), 0.0),
percentile_disc(CAST(substr(value, 5) AS DOUBLE), 0.5),
percentile_disc(0.5) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS INT)),
percentile_disc(CAST(substr(value, 5) AS DECIMAL), 1.0),
percentile_disc(array(0.0, 0.5, 1.0)) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS DOUBLE))
FROM src
GROUP BY CAST(key AS INT) DIV 10
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
#### A masked pattern was here ####
0 0.0 5.0 5.0 9.0 [0.0,5.0,9.0]
1 10.0 15.0 15.0 19.0 [10.0,15.0,19.0]
10 100.0 103.0 103.0 105.0 [100.0,103.0,105.0]
11 111.0 118.0 118.0 119.0 [111.0,118.0,119.0]
12 120.0 128.0 128.0 129.0 [120.0,128.0,129.0]
13 131.0 137.0 137.0 138.0 [131.0,137.0,138.0]
14 143.0 146.0 146.0 149.0 [143.0,146.0,149.0]
15 150.0 155.0 155.0 158.0 [150.0,155.0,158.0]
16 160.0 167.0 167.0 169.0 [160.0,167.0,169.0]
17 170.0 175.0 175.0 179.0 [170.0,175.0,179.0]
18 180.0 187.0 187.0 189.0 [180.0,187.0,189.0]
19 190.0 195.0 195.0 199.0 [190.0,195.0,199.0]
2 20.0 26.0 26.0 28.0 [20.0,26.0,28.0]
20 200.0 205.0 205.0 209.0 [200.0,205.0,209.0]
21 213.0 217.0 217.0 219.0 [213.0,217.0,219.0]
22 221.0 224.0 224.0 229.0 [221.0,224.0,229.0]
23 230.0 235.0 235.0 239.0 [230.0,235.0,239.0]
24 241.0 244.0 244.0 249.0 [241.0,244.0,249.0]
25 252.0 256.0 256.0 258.0 [252.0,256.0,258.0]
26 260.0 265.0 265.0 266.0 [260.0,265.0,266.0]
27 272.0 275.0 275.0 278.0 [272.0,275.0,278.0]
28 280.0 284.0 284.0 289.0 [280.0,284.0,289.0]
29 291.0 298.0 298.0 298.0 [291.0,298.0,298.0]
3 30.0 35.0 35.0 37.0 [30.0,35.0,37.0]
30 302.0 307.0 307.0 309.0 [302.0,307.0,309.0]
31 310.0 316.0 316.0 318.0 [310.0,316.0,318.0]
32 321.0 325.0 325.0 327.0 [321.0,325.0,327.0]
33 331.0 333.0 333.0 339.0 [331.0,333.0,339.0]
34 341.0 345.0 345.0 348.0 [341.0,345.0,348.0]
35 351.0 353.0 353.0 356.0 [351.0,353.0,356.0]
36 360.0 367.0 367.0 369.0 [360.0,367.0,369.0]
37 373.0 377.0 377.0 379.0 [373.0,377.0,379.0]
38 382.0 384.0 384.0 389.0 [382.0,384.0,389.0]
39 392.0 396.0 396.0 399.0 [392.0,396.0,399.0]
4 41.0 43.0 43.0 47.0 [41.0,43.0,47.0]
40 400.0 404.0 404.0 409.0 [400.0,404.0,409.0]
41 411.0 417.0 417.0 419.0 [411.0,417.0,419.0]
42 421.0 427.0 427.0 429.0 [421.0,427.0,429.0]
43 430.0 435.0 435.0 439.0 [430.0,435.0,439.0]
44 443.0 446.0 446.0 449.0 [443.0,446.0,449.0]
45 452.0 455.0 455.0 459.0 [452.0,455.0,459.0]
46 460.0 468.0 468.0 469.0 [460.0,468.0,469.0]
47 470.0 477.0 477.0 479.0 [470.0,477.0,479.0]
48 480.0 484.0 484.0 489.0 [480.0,484.0,489.0]
49 490.0 495.0 495.0 498.0 [490.0,495.0,498.0]
5 51.0 54.0 54.0 58.0 [51.0,54.0,58.0]
6 64.0 67.0 67.0 69.0 [64.0,67.0,69.0]
7 70.0 74.0 74.0 78.0 [70.0,74.0,78.0]
8 80.0 84.0 84.0 87.0 [80.0,84.0,87.0]
9 90.0 95.0 95.0 98.0 [90.0,95.0,98.0]
PREHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(CAST(substr(value, 5) AS INT), 0.0),
percentile_disc(CAST(substr(value, 5) AS DOUBLE), 0.5),
percentile_disc(0.5) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS INT)),
percentile_disc(CAST(substr(value, 5) AS DECIMAL), 1.0),
percentile_disc(array(0.0, 0.5, 1.0)) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS DOUBLE))
FROM src
GROUP BY CAST(key AS INT) DIV 10
PREHOOK: type: QUERY
PREHOOK: Input: default@src
#### A masked pattern was here ####
POSTHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(CAST(substr(value, 5) AS INT), 0.0),
percentile_disc(CAST(substr(value, 5) AS DOUBLE), 0.5),
percentile_disc(0.5) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS INT)),
percentile_disc(CAST(substr(value, 5) AS DECIMAL), 1.0),
percentile_disc(array(0.0, 0.5, 1.0)) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS DOUBLE))
FROM src
GROUP BY CAST(key AS INT) DIV 10
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
#### A masked pattern was here ####
0 0.0 5.0 5.0 9.0 [0.0,5.0,9.0]
1 10.0 15.0 15.0 19.0 [10.0,15.0,19.0]
10 100.0 103.0 103.0 105.0 [100.0,103.0,105.0]
11 111.0 118.0 118.0 119.0 [111.0,118.0,119.0]
12 120.0 128.0 128.0 129.0 [120.0,128.0,129.0]
13 131.0 137.0 137.0 138.0 [131.0,137.0,138.0]
14 143.0 146.0 146.0 149.0 [143.0,146.0,149.0]
15 150.0 155.0 155.0 158.0 [150.0,155.0,158.0]
16 160.0 167.0 167.0 169.0 [160.0,167.0,169.0]
17 170.0 175.0 175.0 179.0 [170.0,175.0,179.0]
18 180.0 187.0 187.0 189.0 [180.0,187.0,189.0]
19 190.0 195.0 195.0 199.0 [190.0,195.0,199.0]
2 20.0 26.0 26.0 28.0 [20.0,26.0,28.0]
20 200.0 205.0 205.0 209.0 [200.0,205.0,209.0]
21 213.0 217.0 217.0 219.0 [213.0,217.0,219.0]
22 221.0 224.0 224.0 229.0 [221.0,224.0,229.0]
23 230.0 235.0 235.0 239.0 [230.0,235.0,239.0]
24 241.0 244.0 244.0 249.0 [241.0,244.0,249.0]
25 252.0 256.0 256.0 258.0 [252.0,256.0,258.0]
26 260.0 265.0 265.0 266.0 [260.0,265.0,266.0]
27 272.0 275.0 275.0 278.0 [272.0,275.0,278.0]
28 280.0 284.0 284.0 289.0 [280.0,284.0,289.0]
29 291.0 298.0 298.0 298.0 [291.0,298.0,298.0]
3 30.0 35.0 35.0 37.0 [30.0,35.0,37.0]
30 302.0 307.0 307.0 309.0 [302.0,307.0,309.0]
31 310.0 316.0 316.0 318.0 [310.0,316.0,318.0]
32 321.0 325.0 325.0 327.0 [321.0,325.0,327.0]
33 331.0 333.0 333.0 339.0 [331.0,333.0,339.0]
34 341.0 345.0 345.0 348.0 [341.0,345.0,348.0]
35 351.0 353.0 353.0 356.0 [351.0,353.0,356.0]
36 360.0 367.0 367.0 369.0 [360.0,367.0,369.0]
37 373.0 377.0 377.0 379.0 [373.0,377.0,379.0]
38 382.0 384.0 384.0 389.0 [382.0,384.0,389.0]
39 392.0 396.0 396.0 399.0 [392.0,396.0,399.0]
4 41.0 43.0 43.0 47.0 [41.0,43.0,47.0]
40 400.0 404.0 404.0 409.0 [400.0,404.0,409.0]
41 411.0 417.0 417.0 419.0 [411.0,417.0,419.0]
42 421.0 427.0 427.0 429.0 [421.0,427.0,429.0]
43 430.0 435.0 435.0 439.0 [430.0,435.0,439.0]
44 443.0 446.0 446.0 449.0 [443.0,446.0,449.0]
45 452.0 455.0 455.0 459.0 [452.0,455.0,459.0]
46 460.0 468.0 468.0 469.0 [460.0,468.0,469.0]
47 470.0 477.0 477.0 479.0 [470.0,477.0,479.0]
48 480.0 484.0 484.0 489.0 [480.0,484.0,489.0]
49 490.0 495.0 495.0 498.0 [490.0,495.0,498.0]
5 51.0 54.0 54.0 58.0 [51.0,54.0,58.0]
6 64.0 67.0 67.0 69.0 [64.0,67.0,69.0]
7 70.0 74.0 74.0 78.0 [70.0,74.0,78.0]
8 80.0 84.0 84.0 87.0 [80.0,84.0,87.0]
9 90.0 95.0 95.0 98.0 [90.0,95.0,98.0]
PREHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(CAST(substr(value, 5) AS INT), 0.0),
percentile_disc(CAST(substr(value, 5) AS DOUBLE), 0.5),
percentile_disc(0.5) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS INT)),
percentile_disc(CAST(substr(value, 5) AS DECIMAL), 1.0),
percentile_disc(array(0.0, 0.5, 1.0)) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS DOUBLE))
FROM src
GROUP BY CAST(key AS INT) DIV 10
PREHOOK: type: QUERY
PREHOOK: Input: default@src
#### A masked pattern was here ####
POSTHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(CAST(substr(value, 5) AS INT), 0.0),
percentile_disc(CAST(substr(value, 5) AS DOUBLE), 0.5),
percentile_disc(0.5) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS INT)),
percentile_disc(CAST(substr(value, 5) AS DECIMAL), 1.0),
percentile_disc(array(0.0, 0.5, 1.0)) WITHIN GROUP (ORDER BY CAST(substr(value, 5) AS DOUBLE))
FROM src
GROUP BY CAST(key AS INT) DIV 10
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
#### A masked pattern was here ####
0 0.0 5.0 5.0 9.0 [0.0,5.0,9.0]
1 10.0 15.0 15.0 19.0 [10.0,15.0,19.0]
10 100.0 103.0 103.0 105.0 [100.0,103.0,105.0]
11 111.0 118.0 118.0 119.0 [111.0,118.0,119.0]
12 120.0 128.0 128.0 129.0 [120.0,128.0,129.0]
13 131.0 137.0 137.0 138.0 [131.0,137.0,138.0]
14 143.0 146.0 146.0 149.0 [143.0,146.0,149.0]
15 150.0 155.0 155.0 158.0 [150.0,155.0,158.0]
16 160.0 167.0 167.0 169.0 [160.0,167.0,169.0]
17 170.0 175.0 175.0 179.0 [170.0,175.0,179.0]
18 180.0 187.0 187.0 189.0 [180.0,187.0,189.0]
19 190.0 195.0 195.0 199.0 [190.0,195.0,199.0]
2 20.0 26.0 26.0 28.0 [20.0,26.0,28.0]
20 200.0 205.0 205.0 209.0 [200.0,205.0,209.0]
21 213.0 217.0 217.0 219.0 [213.0,217.0,219.0]
22 221.0 224.0 224.0 229.0 [221.0,224.0,229.0]
23 230.0 235.0 235.0 239.0 [230.0,235.0,239.0]
24 241.0 244.0 244.0 249.0 [241.0,244.0,249.0]
25 252.0 256.0 256.0 258.0 [252.0,256.0,258.0]
26 260.0 265.0 265.0 266.0 [260.0,265.0,266.0]
27 272.0 275.0 275.0 278.0 [272.0,275.0,278.0]
28 280.0 284.0 284.0 289.0 [280.0,284.0,289.0]
29 291.0 298.0 298.0 298.0 [291.0,298.0,298.0]
3 30.0 35.0 35.0 37.0 [30.0,35.0,37.0]
30 302.0 307.0 307.0 309.0 [302.0,307.0,309.0]
31 310.0 316.0 316.0 318.0 [310.0,316.0,318.0]
32 321.0 325.0 325.0 327.0 [321.0,325.0,327.0]
33 331.0 333.0 333.0 339.0 [331.0,333.0,339.0]
34 341.0 345.0 345.0 348.0 [341.0,345.0,348.0]
35 351.0 353.0 353.0 356.0 [351.0,353.0,356.0]
36 360.0 367.0 367.0 369.0 [360.0,367.0,369.0]
37 373.0 377.0 377.0 379.0 [373.0,377.0,379.0]
38 382.0 384.0 384.0 389.0 [382.0,384.0,389.0]
39 392.0 396.0 396.0 399.0 [392.0,396.0,399.0]
4 41.0 43.0 43.0 47.0 [41.0,43.0,47.0]
40 400.0 404.0 404.0 409.0 [400.0,404.0,409.0]
41 411.0 417.0 417.0 419.0 [411.0,417.0,419.0]
42 421.0 427.0 427.0 429.0 [421.0,427.0,429.0]
43 430.0 435.0 435.0 439.0 [430.0,435.0,439.0]
44 443.0 446.0 446.0 449.0 [443.0,446.0,449.0]
45 452.0 455.0 455.0 459.0 [452.0,455.0,459.0]
46 460.0 468.0 468.0 469.0 [460.0,468.0,469.0]
47 470.0 477.0 477.0 479.0 [470.0,477.0,479.0]
48 480.0 484.0 484.0 489.0 [480.0,484.0,489.0]
49 490.0 495.0 495.0 498.0 [490.0,495.0,498.0]
5 51.0 54.0 54.0 58.0 [51.0,54.0,58.0]
6 64.0 67.0 67.0 69.0 [64.0,67.0,69.0]
7 70.0 74.0 74.0 78.0 [70.0,74.0,78.0]
8 80.0 84.0 84.0 87.0 [80.0,84.0,87.0]
9 90.0 95.0 95.0 98.0 [90.0,95.0,98.0]
PREHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(NULL, 0.0),
percentile_disc(0.0) WITHIN GROUP (ORDER BY NULL)
FROM src
GROUP BY CAST(key AS INT) DIV 10
PREHOOK: type: QUERY
PREHOOK: Input: default@src
#### A masked pattern was here ####
POSTHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(NULL, 0.0),
percentile_disc(0.0) WITHIN GROUP (ORDER BY NULL)
FROM src
GROUP BY CAST(key AS INT) DIV 10
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
#### A masked pattern was here ####
0 NULL NULL
1 NULL NULL
10 NULL NULL
11 NULL NULL
12 NULL NULL
13 NULL NULL
14 NULL NULL
15 NULL NULL
16 NULL NULL
17 NULL NULL
18 NULL NULL
19 NULL NULL
2 NULL NULL
20 NULL NULL
21 NULL NULL
22 NULL NULL
23 NULL NULL
24 NULL NULL
25 NULL NULL
26 NULL NULL
27 NULL NULL
28 NULL NULL
29 NULL NULL
3 NULL NULL
30 NULL NULL
31 NULL NULL
32 NULL NULL
33 NULL NULL
34 NULL NULL
35 NULL NULL
36 NULL NULL
37 NULL NULL
38 NULL NULL
39 NULL NULL
4 NULL NULL
40 NULL NULL
41 NULL NULL
42 NULL NULL
43 NULL NULL
44 NULL NULL
45 NULL NULL
46 NULL NULL
47 NULL NULL
48 NULL NULL
49 NULL NULL
5 NULL NULL
6 NULL NULL
7 NULL NULL
8 NULL NULL
9 NULL NULL
PREHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(IF(CAST(key AS INT) DIV 10 < 5, 1, NULL), 0.5),
percentile_disc(0.5) WITHIN GROUP (ORDER BY IF(CAST(key AS INT) DIV 10 < 5, 1, NULL))
FROM src
GROUP BY CAST(key AS INT) DIV 10
PREHOOK: type: QUERY
PREHOOK: Input: default@src
#### A masked pattern was here ####
POSTHOOK: query: SELECT CAST(key AS INT) DIV 10,
percentile_disc(IF(CAST(key AS INT) DIV 10 < 5, 1, NULL), 0.5),
percentile_disc(0.5) WITHIN GROUP (ORDER BY IF(CAST(key AS INT) DIV 10 < 5, 1, NULL))
FROM src
GROUP BY CAST(key AS INT) DIV 10
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
#### A masked pattern was here ####
0 1.0 1.0
1 1.0 1.0
10 NULL NULL
11 NULL NULL
12 NULL NULL
13 NULL NULL
14 NULL NULL
15 NULL NULL
16 NULL NULL
17 NULL NULL
18 NULL NULL
19 NULL NULL
2 1.0 1.0
20 NULL NULL
21 NULL NULL
22 NULL NULL
23 NULL NULL
24 NULL NULL
25 NULL NULL
26 NULL NULL
27 NULL NULL
28 NULL NULL
29 NULL NULL
3 1.0 1.0
30 NULL NULL
31 NULL NULL
32 NULL NULL
33 NULL NULL
34 NULL NULL
35 NULL NULL
36 NULL NULL
37 NULL NULL
38 NULL NULL
39 NULL NULL
4 1.0 1.0
40 NULL NULL
41 NULL NULL
42 NULL NULL
43 NULL NULL
44 NULL NULL
45 NULL NULL
46 NULL NULL
47 NULL NULL
48 NULL NULL
49 NULL NULL
5 NULL NULL
6 NULL NULL
7 NULL NULL
8 NULL NULL
9 NULL NULL
PREHOOK: query: select percentile_disc(cast(key as bigint), 0.5),
percentile_disc(0.5) within group (order by cast(key as bigint))
from src where false
PREHOOK: type: QUERY
PREHOOK: Input: default@src
#### A masked pattern was here ####
POSTHOOK: query: select percentile_disc(cast(key as bigint), 0.5),
percentile_disc(0.5) within group (order by cast(key as bigint))
from src where false
POSTHOOK: type: QUERY
POSTHOOK: Input: default@src
#### A masked pattern was here ####
NULL NULL
PREHOOK: query: CREATE TABLE t_test (value int)
PREHOOK: type: CREATETABLE
PREHOOK: Output: database:default
PREHOOK: Output: default@t_test
POSTHOOK: query: CREATE TABLE t_test (value int)
POSTHOOK: type: CREATETABLE
POSTHOOK: Output: database:default
POSTHOOK: Output: default@t_test
PREHOOK: query: INSERT INTO t_test VALUES (NULL), (3), (8), (13), (7), (6), (20), (NULL), (NULL), (10), (7), (15), (16), (8), (7), (8), (NULL)
PREHOOK: type: QUERY
PREHOOK: Input: _dummy_database@_dummy_table
PREHOOK: Output: default@t_test
POSTHOOK: query: INSERT INTO t_test VALUES (NULL), (3), (8), (13), (7), (6), (20), (NULL), (NULL), (10), (7), (15), (16), (8), (7), (8), (NULL)
POSTHOOK: type: QUERY
POSTHOOK: Input: _dummy_database@_dummy_table
POSTHOOK: Output: default@t_test
POSTHOOK: Lineage: t_test.value SCRIPT []
PREHOOK: query: EXPLAIN SELECT
percentile_disc(value, 0.0),
percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value NULLS FIRST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value NULLS LAST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value) = percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value ASC),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value ASC) = percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC NULLS FIRST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC NULLS LAST)
FROM t_test
PREHOOK: type: QUERY
PREHOOK: Input: default@t_test
#### A masked pattern was here ####
POSTHOOK: query: EXPLAIN SELECT
percentile_disc(value, 0.0),
percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value NULLS FIRST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value NULLS LAST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value) = percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value ASC),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value ASC) = percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC NULLS FIRST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC NULLS LAST)
FROM t_test
POSTHOOK: type: QUERY
POSTHOOK: Input: default@t_test
#### A masked pattern was here ####
STAGE DEPENDENCIES:
Stage-1 is a root stage
Stage-0 depends on stages: Stage-1
STAGE PLANS:
Stage: Stage-1
Map Reduce
Map Operator Tree:
TableScan
alias: t_test
Statistics: Num rows: 17 Data size: 56 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: value (type: int)
outputColumnNames: _col0
Statistics: Num rows: 17 Data size: 56 Basic stats: COMPLETE Column stats: COMPLETE
Group By Operator
aggregations: percentile_disc(_col0, 0), percentile_disc(_col0, 0.2), percentile_disc(_col0, 0.2, 1), percentile_disc(_col0, 0.2, 0)
minReductionHashAggr: 0.99
mode: hash
outputColumnNames: _col0, _col1, _col2, _col3
Statistics: Num rows: 1 Data size: 3152 Basic stats: COMPLETE Column stats: COMPLETE
Reduce Output Operator
sort order:
Statistics: Num rows: 1 Data size: 3152 Basic stats: COMPLETE Column stats: COMPLETE
value expressions: _col0 (type: struct<counts:map<bigint,bigint>,percentiles:array<double>,isascending:boolean>), _col1 (type: struct<counts:map<bigint,bigint>,percentiles:array<double>,isascending:boolean>), _col2 (type: struct<counts:map<bigint,bigint>,percentiles:array<double>,isascending:boolean>), _col3 (type: struct<counts:map<bigint,bigint>,percentiles:array<double>,isascending:boolean>)
Reduce Operator Tree:
Group By Operator
aggregations: percentile_disc(VALUE._col0), percentile_disc(VALUE._col1), percentile_disc(VALUE._col2), percentile_disc(VALUE._col3)
mode: mergepartial
outputColumnNames: _col0, _col1, _col2, _col3
Statistics: Num rows: 1 Data size: 32 Basic stats: COMPLETE Column stats: COMPLETE
Select Operator
expressions: _col0 (type: double), _col1 (type: double), _col2 (type: double), _col2 (type: double), _col2 (type: double), (_col2 = _col1) (type: boolean), _col2 (type: double), (_col2 = _col1) (type: boolean), _col3 (type: double), _col3 (type: double), _col3 (type: double)
outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10
Statistics: Num rows: 1 Data size: 80 Basic stats: COMPLETE Column stats: COMPLETE
File Output Operator
compressed: false
Statistics: Num rows: 1 Data size: 80 Basic stats: COMPLETE Column stats: COMPLETE
table:
input format: org.apache.hadoop.mapred.SequenceFileInputFormat
output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
Stage: Stage-0
Fetch Operator
limit: -1
Processor Tree:
ListSink
PREHOOK: query: SELECT
percentile_disc(value, 0.0),
percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value NULLS FIRST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value NULLS LAST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value) = percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value ASC),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value ASC) = percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC NULLS FIRST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC NULLS LAST)
FROM t_test
PREHOOK: type: QUERY
PREHOOK: Input: default@t_test
#### A masked pattern was here ####
POSTHOOK: query: SELECT
percentile_disc(value, 0.0),
percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value NULLS FIRST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value NULLS LAST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value) = percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value ASC),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value ASC) = percentile_disc(value, 0.2),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC NULLS FIRST),
percentile_disc(0.2) WITHIN GROUP (ORDER BY value DESC NULLS LAST)
FROM t_test
POSTHOOK: type: QUERY
POSTHOOK: Input: default@t_test
#### A masked pattern was here ####
3.0 7.0 7.0 7.0 7.0 true 7.0 true 13.0 13.0 13.0
PREHOOK: query: DROP TABLE t_test
PREHOOK: type: DROPTABLE
PREHOOK: Input: default@t_test
PREHOOK: Output: default@t_test
POSTHOOK: query: DROP TABLE t_test
POSTHOOK: type: DROPTABLE
POSTHOOK: Input: default@t_test
POSTHOOK: Output: default@t_test