tests/integration_tests/viz_tests.py - superset - Git at Google

 # Licensed to the Apache Software Foundation (ASF) under one
 # or more contributor license agreements.  See the NOTICE file
 # distributed with this work for additional information
 # regarding copyright ownership.  The ASF licenses this file
 # to you under the Apache License, Version 2.0 (the
 # "License"); you may not use this file except in compliance
 # with the License.  You may obtain a copy of the License at
 #
 #   http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing,
 # software distributed under the License is distributed on an
 # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 # KIND, either express or implied.  See the License for the
 # specific language governing permissions and limitations
 # under the License.
 # isort:skip_file
 from datetime import date, datetime, timezone
 import logging
 from math import nan
 from unittest.mock import Mock, patch
 from typing import Any, Dict, List, Set

 import numpy as np
 import pandas as pd
 import pytest

 import tests.integration_tests.test_app
 import superset.viz as viz
 from superset import app
 from superset.constants import NULL_STRING
 from superset.exceptions import QueryObjectValidationError, SpatialException
 from superset.utils.core import DTTM_ALIAS

 from .base_tests import SupersetTestCase
 from .utils import load_fixture

 logger = logging.getLogger(__name__)


 class TestBaseViz(SupersetTestCase):
     def test_constructor_exception_no_datasource(self):
         form_data = {}
         datasource = None
         with self.assertRaises(Exception):
             viz.BaseViz(datasource, form_data)

     def test_process_metrics(self):
         # test TableViz metrics in correct order
         form_data = {
             "url_params": {},
             "row_limit": 500,
             "metric": "sum__SP_POP_TOTL",
             "entity": "country_code",
             "secondary_metric": "sum__SP_POP_TOTL",
             "granularity_sqla": "year",
             "page_length": 0,
             "all_columns": [],
             "viz_type": "table",
             "since": "2014-01-01",
             "until": "2014-01-02",
             "metrics": ["sum__SP_POP_TOTL", "SUM(SE_PRM_NENR_MA)", "SUM(SP_URB_TOTL)"],
             "country_fieldtype": "cca3",
             "percent_metrics": ["count"],
             "slice_id": 74,
             "time_grain_sqla": None,
             "order_by_cols": [],
             "groupby": ["country_name"],
             "compare_lag": "10",
             "limit": "25",
             "datasource": "2__table",
             "table_timestamp_format": "%Y-%m-%d %H:%M:%S",
             "markup_type": "markdown",
             "where": "",
             "compare_suffix": "o10Y",
         }
         datasource = Mock()
         datasource.type = "table"
         test_viz = viz.BaseViz(datasource, form_data)
         expect_metric_labels = [
             "sum__SP_POP_TOTL",
             "SUM(SE_PRM_NENR_MA)",
             "SUM(SP_URB_TOTL)",
             "count",
         ]
         self.assertEqual(test_viz.metric_labels, expect_metric_labels)
         self.assertEqual(test_viz.all_metrics, expect_metric_labels)

     def test_get_df_returns_empty_df(self):
         form_data = {"dummy": 123}
         query_obj = {"granularity": "day"}
         datasource = self.get_datasource_mock()
         test_viz = viz.BaseViz(datasource, form_data)
         result = test_viz.get_df(query_obj)
         self.assertEqual(type(result), pd.DataFrame)
         self.assertTrue(result.empty)

     def test_get_df_handles_dttm_col(self):
         form_data = {"dummy": 123}
         query_obj = {"granularity": "day"}
         results = Mock()
         results.query = Mock()
         results.status = Mock()
         results.error_message = Mock()
         datasource = Mock()
         datasource.type = "table"
         datasource.query = Mock(return_value=results)
         mock_dttm_col = Mock()
         datasource.get_column = Mock(return_value=mock_dttm_col)

         test_viz = viz.BaseViz(datasource, form_data)
         test_viz.df_metrics_to_num = Mock()
         test_viz.get_fillna_for_columns = Mock(return_value=0)

         results.df = pd.DataFrame(data={DTTM_ALIAS: ["1960-01-01 05:00:00"]})
         datasource.offset = 0
         mock_dttm_col = Mock()
         datasource.get_column = Mock(return_value=mock_dttm_col)
         mock_dttm_col.python_date_format = "epoch_ms"
         result = test_viz.get_df(query_obj)
         import logging

         logger.info(result)
         pd.testing.assert_series_equal(
             result[DTTM_ALIAS], pd.Series([datetime(1960, 1, 1, 5, 0)], name=DTTM_ALIAS)
         )

         mock_dttm_col.python_date_format = None
         result = test_viz.get_df(query_obj)
         pd.testing.assert_series_equal(
             result[DTTM_ALIAS], pd.Series([datetime(1960, 1, 1, 5, 0)], name=DTTM_ALIAS)
         )

         datasource.offset = 1
         result = test_viz.get_df(query_obj)
         pd.testing.assert_series_equal(
             result[DTTM_ALIAS], pd.Series([datetime(1960, 1, 1, 6, 0)], name=DTTM_ALIAS)
         )

         datasource.offset = 0
         results.df = pd.DataFrame(data={DTTM_ALIAS: ["1960-01-01"]})
         mock_dttm_col.python_date_format = "%Y-%m-%d"
         result = test_viz.get_df(query_obj)
         pd.testing.assert_series_equal(
             result[DTTM_ALIAS], pd.Series([datetime(1960, 1, 1, 0, 0)], name=DTTM_ALIAS)
         )

     def test_cache_timeout(self):
         datasource = self.get_datasource_mock()
         datasource.cache_timeout = 0
         test_viz = viz.BaseViz(datasource, form_data={})
         self.assertEqual(0, test_viz.cache_timeout)

         datasource.cache_timeout = 156
         test_viz = viz.BaseViz(datasource, form_data={})
         self.assertEqual(156, test_viz.cache_timeout)

         datasource.cache_timeout = None
         datasource.database.cache_timeout = 0
         self.assertEqual(0, test_viz.cache_timeout)

         datasource.database.cache_timeout = 1666
         self.assertEqual(1666, test_viz.cache_timeout)

         datasource.database.cache_timeout = None
         test_viz = viz.BaseViz(datasource, form_data={})
         self.assertEqual(
             app.config["DATA_CACHE_CONFIG"]["CACHE_DEFAULT_TIMEOUT"],
             test_viz.cache_timeout,
         )

         data_cache_timeout = app.config["DATA_CACHE_CONFIG"]["CACHE_DEFAULT_TIMEOUT"]
         app.config["DATA_CACHE_CONFIG"]["CACHE_DEFAULT_TIMEOUT"] = None
         datasource.database.cache_timeout = None
         test_viz = viz.BaseViz(datasource, form_data={})
         self.assertEqual(app.config["CACHE_DEFAULT_TIMEOUT"], test_viz.cache_timeout)
         # restore DATA_CACHE_CONFIG timeout
         app.config["DATA_CACHE_CONFIG"]["CACHE_DEFAULT_TIMEOUT"] = data_cache_timeout


 class TestTableViz(SupersetTestCase):
     def test_get_data_applies_percentage(self):
         form_data = {
             "groupby": ["groupA", "groupB"],
             "metrics": [
                 {
                     "expressionType": "SIMPLE",
                     "aggregate": "SUM",
                     "label": "SUM(value1)",
                     "column": {"column_name": "value1", "type": "DOUBLE"},
                 },
                 "count",
                 "avg__C",
             ],
             "percent_metrics": [
                 {
                     "expressionType": "SIMPLE",
                     "aggregate": "SUM",
                     "label": "SUM(value1)",
                     "column": {"column_name": "value1", "type": "DOUBLE"},
                 },
                 "avg__B",
             ],
         }
         datasource = self.get_datasource_mock()

         df = pd.DataFrame(
             {
                 "SUM(value1)": [15, 20, 25, 40],
                 "avg__B": [10, 20, 5, 15],
                 "avg__C": [11, 22, 33, 44],
                 "count": [6, 7, 8, 9],
                 "groupA": ["A", "B", "C", "C"],
                 "groupB": ["x", "x", "y", "z"],
             }
         )

         test_viz = viz.TableViz(datasource, form_data)
         data = test_viz.get_data(df)
         # Check method correctly transforms data and computes percents
         self.assertEqual(
             [
                 "groupA",
                 "groupB",
                 "SUM(value1)",
                 "count",
                 "avg__C",
                 "%SUM(value1)",
                 "%avg__B",
             ],
             list(data["columns"]),
         )
         expected = [
             {
                 "groupA": "A",
                 "groupB": "x",
                 "SUM(value1)": 15,
                 "count": 6,
                 "avg__C": 11,
                 "%SUM(value1)": 0.15,
                 "%avg__B": 0.2,
             },
             {
                 "groupA": "B",
                 "groupB": "x",
                 "SUM(value1)": 20,
                 "count": 7,
                 "avg__C": 22,
                 "%SUM(value1)": 0.2,
                 "%avg__B": 0.4,
             },
             {
                 "groupA": "C",
                 "groupB": "y",
                 "SUM(value1)": 25,
                 "count": 8,
                 "avg__C": 33,
                 "%SUM(value1)": 0.25,
                 "%avg__B": 0.1,
             },
             {
                 "groupA": "C",
                 "groupB": "z",
                 "SUM(value1)": 40,
                 "count": 9,
                 "avg__C": 44,
                 "%SUM(value1)": 0.4,
                 "%avg__B": 0.3,
             },
         ]
         self.assertEqual(expected, data["records"])

     def test_parse_adhoc_filters(self):
         form_data = {
             "metrics": [
                 {
                     "expressionType": "SIMPLE",
                     "aggregate": "SUM",
                     "label": "SUM(value1)",
                     "column": {"column_name": "value1", "type": "DOUBLE"},
                 }
             ],
             "adhoc_filters": [
                 {
                     "expressionType": "SIMPLE",
                     "clause": "WHERE",
                     "subject": "value2",
                     "operator": ">",
                     "comparator": "100",
                 },
                 {
                     "expressionType": "SIMPLE",
                     "clause": "HAVING",
                     "subject": "SUM(value1)",
                     "operator": "<",
                     "comparator": "10",
                 },
                 {
                     "expressionType": "SQL",
                     "clause": "HAVING",
                     "sqlExpression": "SUM(value1) > 5",
                 },
                 {
                     "expressionType": "SQL",
                     "clause": "WHERE",
                     "sqlExpression": "value3 in ('North America')",
                 },
             ],
         }
         datasource = self.get_datasource_mock()
         test_viz = viz.TableViz(datasource, form_data)
         query_obj = test_viz.query_obj()
         self.assertEqual(
             [{"col": "value2", "val": "100", "op": ">"}], query_obj["filter"]
         )
         self.assertEqual(
             [{"op": "<", "val": "10", "col": "SUM(value1)"}],
             query_obj["extras"]["having_druid"],
         )
         self.assertEqual("(value3 in ('North America'))", query_obj["extras"]["where"])
         self.assertEqual("(SUM(value1) > 5)", query_obj["extras"]["having"])

     def test_adhoc_filters_overwrite_legacy_filters(self):
         form_data = {
             "metrics": [
                 {
                     "expressionType": "SIMPLE",
                     "aggregate": "SUM",
                     "label": "SUM(value1)",
                     "column": {"column_name": "value1", "type": "DOUBLE"},
                 }
             ],
             "adhoc_filters": [
                 {
                     "expressionType": "SIMPLE",
                     "clause": "WHERE",
                     "subject": "value2",
                     "operator": ">",
                     "comparator": "100",
                 },
                 {
                     "expressionType": "SQL",
                     "clause": "WHERE",
                     "sqlExpression": "value3 in ('North America')",
                 },
             ],
             "having": "SUM(value1) > 5",
         }
         datasource = self.get_datasource_mock()
         test_viz = viz.TableViz(datasource, form_data)
         query_obj = test_viz.query_obj()
         self.assertEqual(
             [{"col": "value2", "val": "100", "op": ">"}], query_obj["filter"]
         )
         self.assertEqual([], query_obj["extras"]["having_druid"])
         self.assertEqual("(value3 in ('North America'))", query_obj["extras"]["where"])
         self.assertEqual("", query_obj["extras"]["having"])

     def test_query_obj_merges_percent_metrics(self):
         datasource = self.get_datasource_mock()
         form_data = {
             "metrics": ["sum__A", "count", "avg__C"],
             "percent_metrics": ["sum__A", "avg__B", "max__Y"],
         }
         test_viz = viz.TableViz(datasource, form_data)
         query_obj = test_viz.query_obj()
         self.assertEqual(
             ["sum__A", "count", "avg__C", "avg__B", "max__Y"], query_obj["metrics"]
         )

     def test_query_obj_throws_columns_and_metrics(self):
         datasource = self.get_datasource_mock()
         form_data = {"all_columns": ["A", "B"], "metrics": ["x", "y"]}
         with self.assertRaises(Exception):
             test_viz = viz.TableViz(datasource, form_data)
             test_viz.query_obj()
         del form_data["metrics"]
         form_data["groupby"] = ["B", "C"]
         with self.assertRaises(Exception):
             test_viz = viz.TableViz(datasource, form_data)
             test_viz.query_obj()

     @patch("superset.viz.BaseViz.query_obj")
     def test_query_obj_merges_all_columns(self, super_query_obj):
         datasource = self.get_datasource_mock()
         form_data = {
             "all_columns": ["colA", "colB", "colC"],
             "order_by_cols": ['["colA", "colB"]', '["colC"]'],
         }
         super_query_obj.return_value = {
             "columns": ["colD", "colC"],
             "groupby": ["colA", "colB"],
         }
         test_viz = viz.TableViz(datasource, form_data)
         query_obj = test_viz.query_obj()
         self.assertEqual(form_data["all_columns"], query_obj["columns"])
         self.assertEqual([], query_obj["groupby"])
         self.assertEqual([["colA", "colB"], ["colC"]], query_obj["orderby"])

     def test_query_obj_uses_sortby(self):
         datasource = self.get_datasource_mock()
         form_data = {
             "metrics": ["colA", "colB"],
             "order_desc": False,
         }

         def run_test(metric):
             form_data["timeseries_limit_metric"] = metric
             test_viz = viz.TableViz(datasource, form_data)
             query_obj = test_viz.query_obj()
             self.assertEqual(["colA", "colB", metric], query_obj["metrics"])
             self.assertEqual([(metric, True)], query_obj["orderby"])

         run_test("simple_metric")
         run_test(
             {
                 "label": "adhoc_metric",
                 "expressionType": "SIMPLE",
                 "aggregate": "SUM",
                 "column": {"column_name": "sort_column",},
             }
         )

     def test_should_be_timeseries_raises_when_no_granularity(self):
         datasource = self.get_datasource_mock()
         form_data = {"include_time": True}
         with self.assertRaises(Exception):
             test_viz = viz.TableViz(datasource, form_data)
             test_viz.should_be_timeseries()

     def test_adhoc_metric_with_sortby(self):
         metrics = [
             {
                 "expressionType": "SIMPLE",
                 "aggregate": "SUM",
                 "label": "sum_value",
                 "column": {"column_name": "value1", "type": "DOUBLE"},
             }
         ]
         form_data = {
             "metrics": metrics,
             "timeseries_limit_metric": {
                 "expressionType": "SIMPLE",
                 "aggregate": "SUM",
                 "label": "SUM(value1)",
                 "column": {"column_name": "value1", "type": "DOUBLE"},
             },
             "order_desc": False,
         }

         df = pd.DataFrame({"SUM(value1)": [15], "sum_value": [15]})
         datasource = self.get_datasource_mock()
         test_viz = viz.TableViz(datasource, form_data)
         data = test_viz.get_data(df)
         self.assertEqual(["sum_value"], data["columns"])


 class TestDistBarViz(SupersetTestCase):
     def test_groupby_nulls(self):
         form_data = {
             "metrics": ["votes"],
             "adhoc_filters": [],
             "groupby": ["toppings"],
             "columns": [],
             "order_desc": True,
         }
         datasource = self.get_datasource_mock()
         df = pd.DataFrame(
             {
                 "toppings": ["cheese", "pepperoni", "anchovies", None],
                 "votes": [3, 5, 1, 2],
             }
         )
         test_viz = viz.DistributionBarViz(datasource, form_data)
         data = test_viz.get_data(df)[0]
         self.assertEqual("votes", data["key"])
         expected_values = [
             {"x": "pepperoni", "y": 5},
             {"x": "cheese", "y": 3},
             {"x": NULL_STRING, "y": 2},
             {"x": "anchovies", "y": 1},
         ]
         self.assertEqual(expected_values, data["values"])

     def test_groupby_nans(self):
         form_data = {
             "metrics": ["count"],
             "adhoc_filters": [],
             "groupby": ["beds"],
             "columns": [],
             "order_desc": True,
         }
         datasource = self.get_datasource_mock()
         df = pd.DataFrame({"beds": [0, 1, nan, 2], "count": [30, 42, 3, 29]})
         test_viz = viz.DistributionBarViz(datasource, form_data)
         data = test_viz.get_data(df)[0]
         self.assertEqual("count", data["key"])
         expected_values = [
             {"x": "1.0", "y": 42},
             {"x": "0.0", "y": 30},
             {"x": "2.0", "y": 29},
             {"x": NULL_STRING, "y": 3},
         ]

         self.assertEqual(expected_values, data["values"])

     def test_column_nulls(self):
         form_data = {
             "metrics": ["votes"],
             "adhoc_filters": [],
             "groupby": ["toppings"],
             "columns": ["role"],
             "order_desc": True,
         }
         datasource = self.get_datasource_mock()
         df = pd.DataFrame(
             {
                 "toppings": ["cheese", "pepperoni", "cheese", "pepperoni"],
                 "role": ["engineer", "engineer", None, None],
                 "votes": [3, 5, 1, 2],
             }
         )
         test_viz = viz.DistributionBarViz(datasource, form_data)
         data = test_viz.get_data(df)
         expected = [
             {
                 "key": NULL_STRING,
                 "values": [{"x": "pepperoni", "y": 2}, {"x": "cheese", "y": 1}],
             },
             {
                 "key": "engineer",
                 "values": [{"x": "pepperoni", "y": 5}, {"x": "cheese", "y": 3}],
             },
         ]
         self.assertEqual(expected, data)

     def test_column_metrics_in_order(self):
         form_data = {
             "metrics": ["z_column", "votes", "a_column"],
             "adhoc_filters": [],
             "groupby": ["toppings"],
             "columns": [],
             "order_desc": True,
         }
         datasource = self.get_datasource_mock()
         df = pd.DataFrame(
             {
                 "toppings": ["cheese", "pepperoni", "cheese", "pepperoni"],
                 "role": ["engineer", "engineer", None, None],
                 "votes": [3, 5, 1, 2],
                 "a_column": [3, 5, 1, 2],
                 "z_column": [3, 5, 1, 2],
             }
         )
         test_viz = viz.DistributionBarViz(datasource, form_data)
         data = test_viz.get_data(df)

         expected = [
             {
                 "key": "z_column",
                 "values": [{"x": "pepperoni", "y": 3.5}, {"x": "cheese", "y": 2.0}],
             },
             {
                 "key": "votes",
                 "values": [{"x": "pepperoni", "y": 3.5}, {"x": "cheese", "y": 2.0}],
             },
             {
                 "key": "a_column",
                 "values": [{"x": "pepperoni", "y": 3.5}, {"x": "cheese", "y": 2.0}],
             },
         ]

         self.assertEqual(expected, data)

     def test_column_metrics_in_order_with_breakdowns(self):
         form_data = {
             "metrics": ["z_column", "votes", "a_column"],
             "adhoc_filters": [],
             "groupby": ["toppings"],
             "columns": ["role"],
             "order_desc": True,
         }
         datasource = self.get_datasource_mock()
         df = pd.DataFrame(
             {
                 "toppings": ["cheese", "pepperoni", "cheese", "pepperoni"],
                 "role": ["engineer", "engineer", None, None],
                 "votes": [3, 5, 1, 2],
                 "a_column": [3, 5, 1, 2],
                 "z_column": [3, 5, 1, 2],
             }
         )
         test_viz = viz.DistributionBarViz(datasource, form_data)
         data = test_viz.get_data(df)

         expected = [
             {
                 "key": f"z_column, {NULL_STRING}",
                 "values": [{"x": "pepperoni", "y": 2}, {"x": "cheese", "y": 1}],
             },
             {
                 "key": "z_column, engineer",
                 "values": [{"x": "pepperoni", "y": 5}, {"x": "cheese", "y": 3}],
             },
             {
                 "key": f"votes, {NULL_STRING}",
                 "values": [{"x": "pepperoni", "y": 2}, {"x": "cheese", "y": 1}],
             },
             {
                 "key": "votes, engineer",
                 "values": [{"x": "pepperoni", "y": 5}, {"x": "cheese", "y": 3}],
             },
             {
                 "key": f"a_column, {NULL_STRING}",
                 "values": [{"x": "pepperoni", "y": 2}, {"x": "cheese", "y": 1}],
             },
             {
                 "key": "a_column, engineer",
                 "values": [{"x": "pepperoni", "y": 5}, {"x": "cheese", "y": 3}],
             },
         ]

         self.assertEqual(expected, data)


 class TestPairedTTest(SupersetTestCase):
     def test_get_data_transforms_dataframe(self):
         form_data = {
             "groupby": ["groupA", "groupB", "groupC"],
             "metrics": ["metric1", "metric2", "metric3"],
         }
         datasource = self.get_datasource_mock()
         # Test data
         raw = {}
         raw[DTTM_ALIAS] = [100, 200, 300, 100, 200, 300, 100, 200, 300]
         raw["groupA"] = ["a1", "a1", "a1", "b1", "b1", "b1", "c1", "c1", "c1"]
         raw["groupB"] = ["a2", "a2", "a2", "b2", "b2", "b2", "c2", "c2", "c2"]
         raw["groupC"] = ["a3", "a3", "a3", "b3", "b3", "b3", "c3", "c3", "c3"]
         raw["metric1"] = [1, 2, 3, 4, 5, 6, 7, 8, 9]
         raw["metric2"] = [10, 20, 30, 40, 50, 60, 70, 80, 90]
         raw["metric3"] = [100, 200, 300, 400, 500, 600, 700, 800, 900]
         df = pd.DataFrame(raw)
         pairedTTestViz = viz.viz_types["paired_ttest"](datasource, form_data)
         data = pairedTTestViz.get_data(df)
         # Check method correctly transforms data
         expected = {
             "metric1": [
                 {
                     "values": [
                         {"x": 100, "y": 1},
                         {"x": 200, "y": 2},
                         {"x": 300, "y": 3},
                     ],
                     "group": ("a1", "a2", "a3"),
                 },
                 {
                     "values": [
                         {"x": 100, "y": 4},
                         {"x": 200, "y": 5},
                         {"x": 300, "y": 6},
                     ],
                     "group": ("b1", "b2", "b3"),
                 },
                 {
                     "values": [
                         {"x": 100, "y": 7},
                         {"x": 200, "y": 8},
                         {"x": 300, "y": 9},
                     ],
                     "group": ("c1", "c2", "c3"),
                 },
             ],
             "metric2": [
                 {
                     "values": [
                         {"x": 100, "y": 10},
                         {"x": 200, "y": 20},
                         {"x": 300, "y": 30},
                     ],
                     "group": ("a1", "a2", "a3"),
                 },
                 {
                     "values": [
                         {"x": 100, "y": 40},
                         {"x": 200, "y": 50},
                         {"x": 300, "y": 60},
                     ],
                     "group": ("b1", "b2", "b3"),
                 },
                 {
                     "values": [
                         {"x": 100, "y": 70},
                         {"x": 200, "y": 80},
                         {"x": 300, "y": 90},
                     ],
                     "group": ("c1", "c2", "c3"),
                 },
             ],
             "metric3": [
                 {
                     "values": [
                         {"x": 100, "y": 100},
                         {"x": 200, "y": 200},
                         {"x": 300, "y": 300},
                     ],
                     "group": ("a1", "a2", "a3"),
                 },
                 {
                     "values": [
                         {"x": 100, "y": 400},
                         {"x": 200, "y": 500},
                         {"x": 300, "y": 600},
                     ],
                     "group": ("b1", "b2", "b3"),
                 },
                 {
                     "values": [
                         {"x": 100, "y": 700},
                         {"x": 200, "y": 800},
                         {"x": 300, "y": 900},
                     ],
                     "group": ("c1", "c2", "c3"),
                 },
             ],
         }
         self.assertEqual(data, expected)

     def test_get_data_empty_null_keys(self):
         form_data = {"groupby": [], "metrics": ["", None]}
         datasource = self.get_datasource_mock()
         # Test data
         raw = {}
         raw[DTTM_ALIAS] = [100, 200, 300]
         raw[""] = [1, 2, 3]
         raw[None] = [10, 20, 30]

         df = pd.DataFrame(raw)
         pairedTTestViz = viz.viz_types["paired_ttest"](datasource, form_data)
         data = pairedTTestViz.get_data(df)
         # Check method correctly transforms data
         expected = {
             "N/A": [
                 {
                     "values": [
                         {"x": 100, "y": 1},
                         {"x": 200, "y": 2},
                         {"x": 300, "y": 3},
                     ],
                     "group": "All",
                 }
             ],
             "NULL": [
                 {
                     "values": [
                         {"x": 100, "y": 10},
                         {"x": 200, "y": 20},
                         {"x": 300, "y": 30},
                     ],
                     "group": "All",
                 }
             ],
         }
         self.assertEqual(data, expected)


 class TestPartitionViz(SupersetTestCase):
     @patch("superset.viz.BaseViz.query_obj")
     def test_query_obj_time_series_option(self, super_query_obj):
         datasource = self.get_datasource_mock()
         form_data = {}
         test_viz = viz.PartitionViz(datasource, form_data)
         super_query_obj.return_value = {}
         query_obj = test_viz.query_obj()
         self.assertFalse(query_obj["is_timeseries"])
         test_viz.form_data["time_series_option"] = "agg_sum"
         query_obj = test_viz.query_obj()
         self.assertTrue(query_obj["is_timeseries"])

     def test_levels_for_computes_levels(self):
         raw = {}
         raw[DTTM_ALIAS] = [100, 200, 300, 100, 200, 300, 100, 200, 300]
         raw["groupA"] = ["a1", "a1", "a1", "b1", "b1", "b1", "c1", "c1", "c1"]
         raw["groupB"] = ["a2", "a2", "a2", "b2", "b2", "b2", "c2", "c2", "c2"]
         raw["groupC"] = ["a3", "a3", "a3", "b3", "b3", "b3", "c3", "c3", "c3"]
         raw["metric1"] = [1, 2, 3, 4, 5, 6, 7, 8, 9]
         raw["metric2"] = [10, 20, 30, 40, 50, 60, 70, 80, 90]
         raw["metric3"] = [100, 200, 300, 400, 500, 600, 700, 800, 900]
         df = pd.DataFrame(raw)
         groups = ["groupA", "groupB", "groupC"]
         time_op = "agg_sum"
         test_viz = viz.PartitionViz(Mock(), {})
         levels = test_viz.levels_for(time_op, groups, df)
         self.assertEqual(4, len(levels))
         expected = {DTTM_ALIAS: 1800, "metric1": 45, "metric2": 450, "metric3": 4500}
         self.assertEqual(expected, levels[0].to_dict())
         expected = {
             DTTM_ALIAS: {"a1": 600, "b1": 600, "c1": 600},
             "metric1": {"a1": 6, "b1": 15, "c1": 24},
             "metric2": {"a1": 60, "b1": 150, "c1": 240},
             "metric3": {"a1": 600, "b1": 1500, "c1": 2400},
         }
         self.assertEqual(expected, levels[1].to_dict())
         self.assertEqual(["groupA", "groupB"], levels[2].index.names)
         self.assertEqual(["groupA", "groupB", "groupC"], levels[3].index.names)
         time_op = "agg_mean"
         levels = test_viz.levels_for(time_op, groups, df)
         self.assertEqual(4, len(levels))
         expected = {
             DTTM_ALIAS: 200.0,
             "metric1": 5.0,
             "metric2": 50.0,
             "metric3": 500.0,
         }
         self.assertEqual(expected, levels[0].to_dict())
         expected = {
             DTTM_ALIAS: {"a1": 200, "c1": 200, "b1": 200},
             "metric1": {"a1": 2, "b1": 5, "c1": 8},
             "metric2": {"a1": 20, "b1": 50, "c1": 80},
             "metric3": {"a1": 200, "b1": 500, "c1": 800},
         }
         self.assertEqual(expected, levels[1].to_dict())
         self.assertEqual(["groupA", "groupB"], levels[2].index.names)
         self.assertEqual(["groupA", "groupB", "groupC"], levels[3].index.names)

     def test_levels_for_diff_computes_difference(self):
         raw = {}
         raw[DTTM_ALIAS] = [100, 200, 300, 100, 200, 300, 100, 200, 300]
         raw["groupA"] = ["a1", "a1", "a1", "b1", "b1", "b1", "c1", "c1", "c1"]
         raw["groupB"] = ["a2", "a2", "a2", "b2", "b2", "b2", "c2", "c2", "c2"]
         raw["groupC"] = ["a3", "a3", "a3", "b3", "b3", "b3", "c3", "c3", "c3"]
         raw["metric1"] = [1, 2, 3, 4, 5, 6, 7, 8, 9]
         raw["metric2"] = [10, 20, 30, 40, 50, 60, 70, 80, 90]
         raw["metric3"] = [100, 200, 300, 400, 500, 600, 700, 800, 900]
         df = pd.DataFrame(raw)
         groups = ["groupA", "groupB", "groupC"]
         test_viz = viz.PartitionViz(Mock(), {})
         time_op = "point_diff"
         levels = test_viz.levels_for_diff(time_op, groups, df)
         expected = {"metric1": 6, "metric2": 60, "metric3": 600}
         self.assertEqual(expected, levels[0].to_dict())
         expected = {
             "metric1": {"a1": 2, "b1": 2, "c1": 2},
             "metric2": {"a1": 20, "b1": 20, "c1": 20},
             "metric3": {"a1": 200, "b1": 200, "c1": 200},
         }
         self.assertEqual(expected, levels[1].to_dict())
         self.assertEqual(4, len(levels))
         self.assertEqual(["groupA", "groupB", "groupC"], levels[3].index.names)

     def test_levels_for_time_calls_process_data_and_drops_cols(self):
         raw = {}
         raw[DTTM_ALIAS] = [100, 200, 300, 100, 200, 300, 100, 200, 300]
         raw["groupA"] = ["a1", "a1", "a1", "b1", "b1", "b1", "c1", "c1", "c1"]
         raw["groupB"] = ["a2", "a2", "a2", "b2", "b2", "b2", "c2", "c2", "c2"]
         raw["groupC"] = ["a3", "a3", "a3", "b3", "b3", "b3", "c3", "c3", "c3"]
         raw["metric1"] = [1, 2, 3, 4, 5, 6, 7, 8, 9]
         raw["metric2"] = [10, 20, 30, 40, 50, 60, 70, 80, 90]
         raw["metric3"] = [100, 200, 300, 400, 500, 600, 700, 800, 900]
         df = pd.DataFrame(raw)
         groups = ["groupA", "groupB", "groupC"]
         test_viz = viz.PartitionViz(Mock(), {"groupby": groups})

         def return_args(df_drop, aggregate):
             return df_drop

         test_viz.process_data = Mock(side_effect=return_args)
         levels = test_viz.levels_for_time(groups, df)
         self.assertEqual(4, len(levels))
         cols = [DTTM_ALIAS, "metric1", "metric2", "metric3"]
         self.assertEqual(sorted(cols), sorted(levels[0].columns.tolist()))
         cols += ["groupA"]
         self.assertEqual(sorted(cols), sorted(levels[1].columns.tolist()))
         cols += ["groupB"]
         self.assertEqual(sorted(cols), sorted(levels[2].columns.tolist()))
         cols += ["groupC"]
         self.assertEqual(sorted(cols), sorted(levels[3].columns.tolist()))
         self.assertEqual(4, len(test_viz.process_data.mock_calls))

     def test_nest_values_returns_hierarchy(self):
         raw = {}
         raw["groupA"] = ["a1", "a1", "a1", "b1", "b1", "b1", "c1", "c1", "c1"]
         raw["groupB"] = ["a2", "a2", "a2", "b2", "b2", "b2", "c2", "c2", "c2"]
         raw["groupC"] = ["a3", "a3", "a3", "b3", "b3", "b3", "c3", "c3", "c3"]
         raw["metric1"] = [1, 2, 3, 4, 5, 6, 7, 8, 9]
         raw["metric2"] = [10, 20, 30, 40, 50, 60, 70, 80, 90]
         raw["metric3"] = [100, 200, 300, 400, 500, 600, 700, 800, 900]
         df = pd.DataFrame(raw)
         test_viz = viz.PartitionViz(Mock(), {})
         groups = ["groupA", "groupB", "groupC"]
         levels = test_viz.levels_for("agg_sum", groups, df)
         nest = test_viz.nest_values(levels)
         self.assertEqual(3, len(nest))
         for i in range(0, 3):
             self.assertEqual("metric" + str(i + 1), nest[i]["name"])
         self.assertEqual(3, len(nest[0]["children"]))
         self.assertEqual(1, len(nest[0]["children"][0]["children"]))
         self.assertEqual(1, len(nest[0]["children"][0]["children"][0]["children"]))

     def test_nest_procs_returns_hierarchy(self):
         raw = {}
         raw[DTTM_ALIAS] = [100, 200, 300, 100, 200, 300, 100, 200, 300]
         raw["groupA"] = ["a1", "a1", "a1", "b1", "b1", "b1", "c1", "c1", "c1"]
         raw["groupB"] = ["a2", "a2", "a2", "b2", "b2", "b2", "c2", "c2", "c2"]
         raw["groupC"] = ["a3", "a3", "a3", "b3", "b3", "b3", "c3", "c3", "c3"]
         raw["metric1"] = [1, 2, 3, 4, 5, 6, 7, 8, 9]
         raw["metric2"] = [10, 20, 30, 40, 50, 60, 70, 80, 90]
         raw["metric3"] = [100, 200, 300, 400, 500, 600, 700, 800, 900]
         df = pd.DataFrame(raw)
         test_viz = viz.PartitionViz(Mock(), {})
         groups = ["groupA", "groupB", "groupC"]
         metrics = ["metric1", "metric2", "metric3"]
         procs = {}
         for i in range(0, 4):
             df_drop = df.drop(groups[i:], 1)
             pivot = df_drop.pivot_table(
                 index=DTTM_ALIAS, columns=groups[:i], values=metrics
             )
             procs[i] = pivot
         nest = test_viz.nest_procs(procs)
         self.assertEqual(3, len(nest))
         for i in range(0, 3):
             self.assertEqual("metric" + str(i + 1), nest[i]["name"])
             self.assertEqual(None, nest[i].get("val"))
         self.assertEqual(3, len(nest[0]["children"]))
         self.assertEqual(3, len(nest[0]["children"][0]["children"]))
         self.assertEqual(1, len(nest[0]["children"][0]["children"][0]["children"]))
         self.assertEqual(
             1, len(nest[0]["children"][0]["children"][0]["children"][0]["children"])
         )

     def test_get_data_calls_correct_method(self):
         raw = {}
         raw[DTTM_ALIAS] = [100, 200, 300, 100, 200, 300, 100, 200, 300]
         raw["groupA"] = ["a1", "a1", "a1", "b1", "b1", "b1", "c1", "c1", "c1"]
         raw["groupB"] = ["a2", "a2", "a2", "b2", "b2", "b2", "c2", "c2", "c2"]
         raw["groupC"] = ["a3", "a3", "a3", "b3", "b3", "b3", "c3", "c3", "c3"]
         raw["metric1"] = [1, 2, 3, 4, 5, 6, 7, 8, 9]
         raw["metric2"] = [10, 20, 30, 40, 50, 60, 70, 80, 90]
         raw["metric3"] = [100, 200, 300, 400, 500, 600, 700, 800, 900]
         df = pd.DataFrame(raw)
         test_viz = viz.PartitionViz(Mock(), {})
         with self.assertRaises(ValueError):
             test_viz.get_data(df)
         test_viz.levels_for = Mock(return_value=1)
         test_viz.nest_values = Mock(return_value=1)
         test_viz.form_data["groupby"] = ["groups"]
         test_viz.form_data["time_series_option"] = "not_time"
         test_viz.get_data(df)
         self.assertEqual("agg_sum", test_viz.levels_for.mock_calls[0][1][0])
         test_viz.form_data["time_series_option"] = "agg_sum"
         test_viz.get_data(df)
         self.assertEqual("agg_sum", test_viz.levels_for.mock_calls[1][1][0])
         test_viz.form_data["time_series_option"] = "agg_mean"
         test_viz.get_data(df)
         self.assertEqual("agg_mean", test_viz.levels_for.mock_calls[2][1][0])
         test_viz.form_data["time_series_option"] = "point_diff"
         test_viz.levels_for_diff = Mock(return_value=1)
         test_viz.get_data(df)
         self.assertEqual("point_diff", test_viz.levels_for_diff.mock_calls[0][1][0])
         test_viz.form_data["time_series_option"] = "point_percent"
         test_viz.get_data(df)
         self.assertEqual("point_percent", test_viz.levels_for_diff.mock_calls[1][1][0])
         test_viz.form_data["time_series_option"] = "point_factor"
         test_viz.get_data(df)
         self.assertEqual("point_factor", test_viz.levels_for_diff.mock_calls[2][1][0])
         test_viz.levels_for_time = Mock(return_value=1)
         test_viz.nest_procs = Mock(return_value=1)
         test_viz.form_data["time_series_option"] = "adv_anal"
         test_viz.get_data(df)
         self.assertEqual(1, len(test_viz.levels_for_time.mock_calls))
         self.assertEqual(1, len(test_viz.nest_procs.mock_calls))
         test_viz.form_data["time_series_option"] = "time_series"
         test_viz.get_data(df)
         self.assertEqual("agg_sum", test_viz.levels_for.mock_calls[3][1][0])
         self.assertEqual(7, len(test_viz.nest_values.mock_calls))


 class TestRoseVis(SupersetTestCase):
     def test_rose_vis_get_data(self):
         raw = {}
         t1 = pd.Timestamp("2000")
         t2 = pd.Timestamp("2002")
         t3 = pd.Timestamp("2004")
         raw[DTTM_ALIAS] = [t1, t2, t3, t1, t2, t3, t1, t2, t3]
         raw["groupA"] = ["a1", "a1", "a1", "b1", "b1", "b1", "c1", "c1", "c1"]
         raw["groupB"] = ["a2", "a2", "a2", "b2", "b2", "b2", "c2", "c2", "c2"]
         raw["groupC"] = ["a3", "a3", "a3", "b3", "b3", "b3", "c3", "c3", "c3"]
         raw["metric1"] = [1, 2, 3, 4, 5, 6, 7, 8, 9]
         df = pd.DataFrame(raw)
         fd = {"metrics": ["metric1"], "groupby": ["groupA"]}
         test_viz = viz.RoseViz(Mock(), fd)
         test_viz.metrics = fd["metrics"]
         res = test_viz.get_data(df)
         expected = {
             946684800000000000: [
                 {"time": t1, "value": 1, "key": ("a1",), "name": ("a1",)},
                 {"time": t1, "value": 4, "key": ("b1",), "name": ("b1",)},
                 {"time": t1, "value": 7, "key": ("c1",), "name": ("c1",)},
             ],
             1009843200000000000: [
                 {"time": t2, "value": 2, "key": ("a1",), "name": ("a1",)},
                 {"time": t2, "value": 5, "key": ("b1",), "name": ("b1",)},
                 {"time": t2, "value": 8, "key": ("c1",), "name": ("c1",)},
             ],
             1072915200000000000: [
                 {"time": t3, "value": 3, "key": ("a1",), "name": ("a1",)},
                 {"time": t3, "value": 6, "key": ("b1",), "name": ("b1",)},
                 {"time": t3, "value": 9, "key": ("c1",), "name": ("c1",)},
             ],
         }
         self.assertEqual(expected, res)


 class TestTimeSeriesTableViz(SupersetTestCase):
     def test_get_data_metrics(self):
         form_data = {"metrics": ["sum__A", "count"], "groupby": []}
         datasource = self.get_datasource_mock()
         raw = {}
         t1 = pd.Timestamp("2000")
         t2 = pd.Timestamp("2002")
         raw[DTTM_ALIAS] = [t1, t2]
         raw["sum__A"] = [15, 20]
         raw["count"] = [6, 7]
         df = pd.DataFrame(raw)
         test_viz = viz.TimeTableViz(datasource, form_data)
         data = test_viz.get_data(df)
         # Check method correctly transforms data
         self.assertEqual(set(["count", "sum__A"]), set(data["columns"]))
         time_format = "%Y-%m-%d %H:%M:%S"
         expected = {
             t1.strftime(time_format): {"sum__A": 15, "count": 6},
             t2.strftime(time_format): {"sum__A": 20, "count": 7},
         }
         self.assertEqual(expected, data["records"])

     def test_get_data_group_by(self):
         form_data = {"metrics": ["sum__A"], "groupby": ["groupby1"]}
         datasource = self.get_datasource_mock()
         raw = {}
         t1 = pd.Timestamp("2000")
         t2 = pd.Timestamp("2002")
         raw[DTTM_ALIAS] = [t1, t1, t1, t2, t2, t2]
         raw["sum__A"] = [15, 20, 25, 30, 35, 40]
         raw["groupby1"] = ["a1", "a2", "a3", "a1", "a2", "a3"]
         df = pd.DataFrame(raw)
         test_viz = viz.TimeTableViz(datasource, form_data)
         data = test_viz.get_data(df)
         # Check method correctly transforms data
         self.assertEqual(set(["a1", "a2", "a3"]), set(data["columns"]))
         time_format = "%Y-%m-%d %H:%M:%S"
         expected = {
             t1.strftime(time_format): {"a1": 15, "a2": 20, "a3": 25},
             t2.strftime(time_format): {"a1": 30, "a2": 35, "a3": 40},
         }
         self.assertEqual(expected, data["records"])

     @patch("superset.viz.BaseViz.query_obj")
     def test_query_obj_throws_metrics_and_groupby(self, super_query_obj):
         datasource = self.get_datasource_mock()
         form_data = {"groupby": ["a"]}
         super_query_obj.return_value = {}
         test_viz = viz.TimeTableViz(datasource, form_data)
         with self.assertRaises(Exception):
             test_viz.query_obj()
         form_data["metrics"] = ["x", "y"]
         test_viz = viz.TimeTableViz(datasource, form_data)
         with self.assertRaises(Exception):
             test_viz.query_obj()


 class TestBaseDeckGLViz(SupersetTestCase):
     def test_get_metrics(self):
         form_data = load_fixture("deck_path_form_data.json")
         datasource = self.get_datasource_mock()
         test_viz_deckgl = viz.BaseDeckGLViz(datasource, form_data)
         result = test_viz_deckgl.get_metrics()
         assert result == [form_data.get("size")]

         form_data = {}
         test_viz_deckgl = viz.BaseDeckGLViz(datasource, form_data)
         result = test_viz_deckgl.get_metrics()
         assert result == []

     def test_scatterviz_get_metrics(self):
         form_data = load_fixture("deck_path_form_data.json")
         datasource = self.get_datasource_mock()

         form_data = {}
         test_viz_deckgl = viz.DeckScatterViz(datasource, form_data)
         test_viz_deckgl.point_radius_fixed = {"type": "metric", "value": "int"}
         result = test_viz_deckgl.get_metrics()
         assert result == ["int"]

         form_data = {}
         test_viz_deckgl = viz.DeckScatterViz(datasource, form_data)
         test_viz_deckgl.point_radius_fixed = {}
         result = test_viz_deckgl.get_metrics()
         assert result == []

     def test_get_js_columns(self):
         form_data = load_fixture("deck_path_form_data.json")
         datasource = self.get_datasource_mock()
         mock_d = {"a": "dummy1", "b": "dummy2", "c": "dummy3"}
         test_viz_deckgl = viz.BaseDeckGLViz(datasource, form_data)
         result = test_viz_deckgl.get_js_columns(mock_d)

         assert result == {"color": None}

     def test_get_properties(self):
         mock_d = {}
         form_data = load_fixture("deck_path_form_data.json")
         datasource = self.get_datasource_mock()
         test_viz_deckgl = viz.BaseDeckGLViz(datasource, form_data)

         with self.assertRaises(NotImplementedError) as context:
             test_viz_deckgl.get_properties(mock_d)

         self.assertTrue("" in str(context.exception))

     def test_process_spatial_query_obj(self):
         form_data = load_fixture("deck_path_form_data.json")
         datasource = self.get_datasource_mock()
         mock_key = "spatial_key"
         mock_gb = []
         test_viz_deckgl = viz.BaseDeckGLViz(datasource, form_data)

         with self.assertRaises(ValueError) as context:
             test_viz_deckgl.process_spatial_query_obj(mock_key, mock_gb)

         self.assertTrue("Bad spatial key" in str(context.exception))

         test_form_data = {
             "latlong_key": {"type": "latlong", "lonCol": "lon", "latCol": "lat"},
             "delimited_key": {"type": "delimited", "lonlatCol": "lonlat"},
             "geohash_key": {"type": "geohash", "geohashCol": "geo"},
         }

         datasource = self.get_datasource_mock()
         expected_results = {
             "latlong_key": ["lon", "lat"],
             "delimited_key": ["lonlat"],
             "geohash_key": ["geo"],
         }
         for mock_key in ["latlong_key", "delimited_key", "geohash_key"]:
             mock_gb = []
             test_viz_deckgl = viz.BaseDeckGLViz(datasource, test_form_data)
             test_viz_deckgl.process_spatial_query_obj(mock_key, mock_gb)
             assert expected_results.get(mock_key) == mock_gb

     def test_geojson_query_obj(self):
         form_data = load_fixture("deck_geojson_form_data.json")
         datasource = self.get_datasource_mock()
         test_viz_deckgl = viz.DeckGeoJson(datasource, form_data)
         results = test_viz_deckgl.query_obj()

         assert results["metrics"] == []
         assert results["groupby"] == []
         assert results["columns"] == ["test_col"]

     def test_parse_coordinates(self):
         form_data = load_fixture("deck_path_form_data.json")
         datasource = self.get_datasource_mock()
         viz_instance = viz.BaseDeckGLViz(datasource, form_data)

         coord = viz_instance.parse_coordinates("1.23, 3.21")
         self.assertEqual(coord, (1.23, 3.21))

         coord = viz_instance.parse_coordinates("1.23 3.21")
         self.assertEqual(coord, (1.23, 3.21))

         self.assertEqual(viz_instance.parse_coordinates(None), None)

         self.assertEqual(viz_instance.parse_coordinates(""), None)

     def test_parse_coordinates_raises(self):
         form_data = load_fixture("deck_path_form_data.json")
         datasource = self.get_datasource_mock()
         test_viz_deckgl = viz.BaseDeckGLViz(datasource, form_data)

         with self.assertRaises(SpatialException):
             test_viz_deckgl.parse_coordinates("NULL")

         with self.assertRaises(SpatialException):
             test_viz_deckgl.parse_coordinates("fldkjsalkj,fdlaskjfjadlksj")

     def test_filter_nulls(self):
         test_form_data = {
             "latlong_key": {"type": "latlong", "lonCol": "lon", "latCol": "lat"},
             "delimited_key": {"type": "delimited", "lonlatCol": "lonlat"},
             "geohash_key": {"type": "geohash", "geohashCol": "geo"},
         }

         datasource = self.get_datasource_mock()
         expected_results = {
             "latlong_key": [
                 {
                     "clause": "WHERE",
                     "expressionType": "SIMPLE",
                     "filterOptionName": "c7f171cf3204bcbf456acfeac5cd9afd",
                     "comparator": "",
                     "operator": "IS NOT NULL",
                     "subject": "lat",
                 },
                 {
                     "clause": "WHERE",
                     "expressionType": "SIMPLE",
                     "filterOptionName": "52634073fbb8ae0a3aa59ad48abac55e",
                     "comparator": "",
                     "operator": "IS NOT NULL",
                     "subject": "lon",
                 },
             ],
             "delimited_key": [
                 {
                     "clause": "WHERE",
                     "expressionType": "SIMPLE",
                     "filterOptionName": "cae5c925c140593743da08499e6fb207",
                     "comparator": "",
                     "operator": "IS NOT NULL",
                     "subject": "lonlat",
                 }
             ],
             "geohash_key": [
                 {
                     "clause": "WHERE",
                     "expressionType": "SIMPLE",
                     "filterOptionName": "d84f55222d8e414e888fa5f990b341d2",
                     "comparator": "",
                     "operator": "IS NOT NULL",
                     "subject": "geo",
                 }
             ],
         }
         for mock_key in ["latlong_key", "delimited_key", "geohash_key"]:
             test_viz_deckgl = viz.BaseDeckGLViz(datasource, test_form_data.copy())
             test_viz_deckgl.spatial_control_keys = [mock_key]
             test_viz_deckgl.add_null_filters()
             adhoc_filters = test_viz_deckgl.form_data["adhoc_filters"]
             assert expected_results.get(mock_key) == adhoc_filters


 class TestTimeSeriesViz(SupersetTestCase):
     def test_timeseries_unicode_data(self):
         datasource = self.get_datasource_mock()
         form_data = {"groupby": ["name"], "metrics": ["sum__payout"]}
         raw = {}
         raw["name"] = [
             "Real Madrid C.F.🇺🇸🇬🇧",
             "Real Madrid C.F.🇺🇸🇬🇧",
             "Real Madrid Basket",
             "Real Madrid Basket",
         ]
         raw["__timestamp"] = [
             "2018-02-20T00:00:00",
             "2018-03-09T00:00:00",
             "2018-02-20T00:00:00",
             "2018-03-09T00:00:00",
         ]
         raw["sum__payout"] = [2, 2, 4, 4]
         df = pd.DataFrame(raw)

         test_viz = viz.NVD3TimeSeriesViz(datasource, form_data)
         viz_data = {}
         viz_data = test_viz.get_data(df)
         expected = [
             {
                 "values": [
                     {"y": 4, "x": "2018-02-20T00:00:00"},
                     {"y": 4, "x": "2018-03-09T00:00:00"},
                 ],
                 "key": ("Real Madrid Basket",),
             },
             {
                 "values": [
                     {"y": 2, "x": "2018-02-20T00:00:00"},
                     {"y": 2, "x": "2018-03-09T00:00:00"},
                 ],
                 "key": ("Real Madrid C.F.\U0001f1fa\U0001f1f8\U0001f1ec\U0001f1e7",),
             },
         ]
         self.assertEqual(expected, viz_data)

     def test_process_data_resample(self):
         datasource = self.get_datasource_mock()

         df = pd.DataFrame(
             {
                 "__timestamp": pd.to_datetime(
                     ["2019-01-01", "2019-01-02", "2019-01-05", "2019-01-07"]
                 ),
                 "y": [1.0, 2.0, 5.0, 7.0],
             }
         )

         self.assertEqual(
             viz.NVD3TimeSeriesViz(
                 datasource,
                 {"metrics": ["y"], "resample_method": "sum", "resample_rule": "1D"},
             )
             .process_data(df)["y"]
             .tolist(),
             [1.0, 2.0, 0.0, 0.0, 5.0, 0.0, 7.0],
         )

         np.testing.assert_equal(
             viz.NVD3TimeSeriesViz(
                 datasource,
                 {"metrics": ["y"], "resample_method": "asfreq", "resample_rule": "1D"},
             )
             .process_data(df)["y"]
             .tolist(),
             [1.0, 2.0, np.nan, np.nan, 5.0, np.nan, 7.0],
         )

     def test_apply_rolling(self):
         datasource = self.get_datasource_mock()
         df = pd.DataFrame(
             index=pd.to_datetime(
                 ["2019-01-01", "2019-01-02", "2019-01-05", "2019-01-07"]
             ),
             data={"y": [1.0, 2.0, 3.0, 4.0]},
         )
         self.assertEqual(
             viz.BigNumberViz(
                 datasource,
                 {
                     "metrics": ["y"],
                     "rolling_type": "cumsum",
                     "rolling_periods": 0,
                     "min_periods": 0,
                 },
             )
             .apply_rolling(df)["y"]
             .tolist(),
             [1.0, 3.0, 6.0, 10.0],
         )
         self.assertEqual(
             viz.BigNumberViz(
                 datasource,
                 {
                     "metrics": ["y"],
                     "rolling_type": "sum",
                     "rolling_periods": 2,
                     "min_periods": 0,
                 },
             )
             .apply_rolling(df)["y"]
             .tolist(),
             [1.0, 3.0, 5.0, 7.0],
         )
         self.assertEqual(
             viz.BigNumberViz(
                 datasource,
                 {
                     "metrics": ["y"],
                     "rolling_type": "mean",
                     "rolling_periods": 10,
                     "min_periods": 0,
                 },
             )
             .apply_rolling(df)["y"]
             .tolist(),
             [1.0, 1.5, 2.0, 2.5],
         )

     def test_apply_rolling_without_data(self):
         datasource = self.get_datasource_mock()
         df = pd.DataFrame(
             index=pd.to_datetime(
                 ["2019-01-01", "2019-01-02", "2019-01-05", "2019-01-07"]
             ),
             data={"y": [1.0, 2.0, 3.0, 4.0]},
         )
         test_viz = viz.BigNumberViz(
             datasource,
             {
                 "metrics": ["y"],
                 "rolling_type": "cumsum",
                 "rolling_periods": 4,
                 "min_periods": 4,
             },
         )
         with pytest.raises(QueryObjectValidationError):
             test_viz.apply_rolling(df)


 class TestBigNumberViz(SupersetTestCase):
     def test_get_data(self):
         datasource = self.get_datasource_mock()
         df = pd.DataFrame(
             data={
                 DTTM_ALIAS: pd.to_datetime(
                     ["2019-01-01", "2019-01-02", "2019-01-05", "2019-01-07"]
                 ),
                 "y": [1.0, 2.0, 3.0, 4.0],
             }
         )
         data = viz.BigNumberViz(datasource, {"metrics": ["y"]}).get_data(df)
         self.assertEqual(data[2], {DTTM_ALIAS: pd.Timestamp("2019-01-05"), "y": 3})

     def test_get_data_with_none(self):
         datasource = self.get_datasource_mock()
         df = pd.DataFrame(
             data={
                 DTTM_ALIAS: pd.to_datetime(
                     ["2019-01-01", "2019-01-02", "2019-01-05", "2019-01-07"]
                 ),
                 "y": [1.0, 2.0, None, 4.0],
             }
         )
         data = viz.BigNumberViz(datasource, {"metrics": ["y"]}).get_data(df)
         assert np.isnan(data[2]["y"])


 class TestPivotTableViz(SupersetTestCase):
     df = pd.DataFrame(
         data={
             "intcol": [1, 2, 3, None],
             "floatcol": [0.1, 0.2, 0.3, None],
             "strcol": ["a", "b", "c", None],
         }
     )

     def test_get_aggfunc_numeric(self):
         # is a sum function
         func = viz.PivotTableViz.get_aggfunc("intcol", self.df, {})
         assert hasattr(func, "__call__")
         assert func(self.df["intcol"]) == 6

         assert (
             viz.PivotTableViz.get_aggfunc("intcol", self.df, {"pandas_aggfunc": "min"})
             == "min"
         )
         assert (
             viz.PivotTableViz.get_aggfunc(
                 "floatcol", self.df, {"pandas_aggfunc": "max"}
             )
             == "max"
         )

     def test_get_aggfunc_non_numeric(self):
         assert viz.PivotTableViz.get_aggfunc("strcol", self.df, {}) == "max"
         assert (
             viz.PivotTableViz.get_aggfunc("strcol", self.df, {"pandas_aggfunc": "sum"})
             == "max"
         )
         assert (
             viz.PivotTableViz.get_aggfunc("strcol", self.df, {"pandas_aggfunc": "min"})
             == "min"
         )

     def test_format_datetime_from_pd_timestamp(self):
         tstamp = pd.Timestamp(datetime(2020, 9, 3, tzinfo=timezone.utc))
         assert (
             viz.PivotTableViz._format_datetime(tstamp) == "__timestamp:1599091200000.0"
         )

     def test_format_datetime_from_datetime(self):
         tstamp = datetime(2020, 9, 3, tzinfo=timezone.utc)
         assert (
             viz.PivotTableViz._format_datetime(tstamp) == "__timestamp:1599091200000.0"
         )

     def test_format_datetime_from_date(self):
         tstamp = date(2020, 9, 3)
         assert (
             viz.PivotTableViz._format_datetime(tstamp) == "__timestamp:1599091200000.0"
         )

     def test_format_datetime_from_string(self):
         tstamp = "2020-09-03T00:00:00"
         assert (
             viz.PivotTableViz._format_datetime(tstamp) == "__timestamp:1599091200000.0"
         )

     def test_format_datetime_from_invalid_string(self):
         tstamp = "abracadabra"
         assert viz.PivotTableViz._format_datetime(tstamp) == tstamp

     def test_format_datetime_from_int(self):
         assert viz.PivotTableViz._format_datetime(123) == 123
         assert viz.PivotTableViz._format_datetime(123.0) == 123.0


 class TestFilterBoxViz(SupersetTestCase):
     def test_get_data(self):
         form_data = {
             "filter_configs": [
                 {"column": "value1", "metric": "metric1"},
                 {"column": "value2", "metric": "metric2", "asc": True},
                 {"column": "value3"},
                 {"column": "value4", "asc": True},
                 {"column": "value5"},
                 {"column": "value6"},
             ],
         }
         datasource = self.get_datasource_mock()
         test_viz = viz.FilterBoxViz(datasource, form_data)
         test_viz.dataframes = {
             "value1": pd.DataFrame(
                 data=[{"value1": "v1", "metric1": 1}, {"value1": "v2", "metric1": 2},]
             ),
             "value2": pd.DataFrame(
                 data=[{"value2": "v3", "metric2": 3}, {"value2": "v4", "metric2": 4},]
             ),
             "value3": pd.DataFrame(data=[{"value3": "v5"}, {"value3": "v6"},]),
             "value4": pd.DataFrame(data=[{"value4": "v7"}, {"value4": "v8"},]),
             "value5": pd.DataFrame(),
         }

         df = pd.DataFrame()
         data = test_viz.get_data(df)
         expected = {
             "value1": [
                 {"id": "v2", "text": "v2", "metric": 2},
                 {"id": "v1", "text": "v1", "metric": 1},
             ],
             "value2": [
                 {"id": "v3", "text": "v3", "metric": 3},
                 {"id": "v4", "text": "v4", "metric": 4},
             ],
             "value3": [{"id": "v6", "text": "v6"}, {"id": "v5", "text": "v5"},],
             "value4": [{"id": "v7", "text": "v7"}, {"id": "v8", "text": "v8"},],
             "value5": [],
             "value6": [],
         }
         self.assertEqual(expected, data)