tests/query_context_tests.py - superset - Git at Google

 # Licensed to the Apache Software Foundation (ASF) under one
 # or more contributor license agreements.  See the NOTICE file
 # distributed with this work for additional information
 # regarding copyright ownership.  The ASF licenses this file
 # to you under the Apache License, Version 2.0 (the
 # "License"); you may not use this file except in compliance
 # with the License.  You may obtain a copy of the License at
 #
 #   http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing,
 # software distributed under the License is distributed on an
 # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 # KIND, either express or implied.  See the License for the
 # specific language governing permissions and limitations
 # under the License.
 import re
 from typing import Any, Dict

 import pytest

 from superset import db
 from superset.charts.schemas import ChartDataQueryContextSchema
 from superset.common.query_context import QueryContext
 from superset.common.query_object import QueryObject
 from superset.connectors.connector_registry import ConnectorRegistry
 from superset.extensions import cache_manager
 from superset.utils.core import (
     AdhocMetricExpressionType,
     backend,
     ChartDataResultFormat,
     ChartDataResultType,
     TimeRangeEndpoint,
 )
 from tests.base_tests import SupersetTestCase
 from tests.fixtures.birth_names_dashboard import load_birth_names_dashboard_with_slices
 from tests.fixtures.query_context import get_query_context


 def get_sql_text(payload: Dict[str, Any]) -> str:
     payload["result_type"] = ChartDataResultType.QUERY.value
     query_context = ChartDataQueryContextSchema().load(payload)
     responses = query_context.get_payload()
     assert len(responses) == 1
     response = responses["queries"][0]
     assert len(response) == 2
     assert response["language"] == "sql"
     return response["query"]


 class TestQueryContext(SupersetTestCase):
     def test_schema_deserialization(self):
         """
         Ensure that the deserialized QueryContext contains all required fields.
         """

         payload = get_query_context("birth_names", add_postprocessing_operations=True)
         query_context = ChartDataQueryContextSchema().load(payload)
         self.assertEqual(len(query_context.queries), len(payload["queries"]))

         for query_idx, query in enumerate(query_context.queries):
             payload_query = payload["queries"][query_idx]

             # check basic properies
             self.assertEqual(query.extras, payload_query["extras"])
             self.assertEqual(query.filter, payload_query["filters"])
             self.assertEqual(query.groupby, payload_query["groupby"])

             # metrics are mutated during creation
             for metric_idx, metric in enumerate(query.metrics):
                 payload_metric = payload_query["metrics"][metric_idx]
                 payload_metric = (
                     payload_metric
                     if "expressionType" in payload_metric
                     else payload_metric["label"]
                 )
                 self.assertEqual(metric, payload_metric)

             self.assertEqual(query.orderby, payload_query["orderby"])
             self.assertEqual(query.time_range, payload_query["time_range"])

             # check post processing operation properties
             for post_proc_idx, post_proc in enumerate(query.post_processing):
                 payload_post_proc = payload_query["post_processing"][post_proc_idx]
                 self.assertEqual(post_proc["operation"], payload_post_proc["operation"])
                 self.assertEqual(post_proc["options"], payload_post_proc["options"])

     def test_cache(self):
         table_name = "birth_names"
         table = self.get_table_by_name(table_name)
         payload = get_query_context(table.name, table.id)
         payload["force"] = True

         query_context = ChartDataQueryContextSchema().load(payload)
         query_object = query_context.queries[0]
         query_cache_key = query_context.query_cache_key(query_object)

         response = query_context.get_payload(cache_query_context=True)
         cache_key = response["cache_key"]
         assert cache_key is not None

         cached = cache_manager.cache.get(cache_key)
         assert cached is not None

         rehydrated_qc = ChartDataQueryContextSchema().load(cached["data"])
         rehydrated_qo = rehydrated_qc.queries[0]
         rehydrated_query_cache_key = rehydrated_qc.query_cache_key(rehydrated_qo)

         self.assertEqual(rehydrated_qc.datasource, query_context.datasource)
         self.assertEqual(len(rehydrated_qc.queries), 1)
         self.assertEqual(query_cache_key, rehydrated_query_cache_key)
         self.assertEqual(rehydrated_qc.result_type, query_context.result_type)
         self.assertEqual(rehydrated_qc.result_format, query_context.result_format)
         self.assertFalse(rehydrated_qc.force)

     def test_query_cache_key_changes_when_datasource_is_updated(self):
         self.login(username="admin")
         payload = get_query_context("birth_names")

         # construct baseline query_cache_key
         query_context = ChartDataQueryContextSchema().load(payload)
         query_object = query_context.queries[0]
         cache_key_original = query_context.query_cache_key(query_object)

         # make temporary change and revert it to refresh the changed_on property
         datasource = ConnectorRegistry.get_datasource(
             datasource_type=payload["datasource"]["type"],
             datasource_id=payload["datasource"]["id"],
             session=db.session,
         )
         description_original = datasource.description
         datasource.description = "temporary description"
         db.session.commit()
         datasource.description = description_original
         db.session.commit()

         # create new QueryContext with unchanged attributes, extract new query_cache_key
         query_context = ChartDataQueryContextSchema().load(payload)
         query_object = query_context.queries[0]
         cache_key_new = query_context.query_cache_key(query_object)

         # the new cache_key should be different due to updated datasource
         self.assertNotEqual(cache_key_original, cache_key_new)

     def test_query_cache_key_does_not_change_for_non_existent_or_null(self):
         self.login(username="admin")
         payload = get_query_context("birth_names", add_postprocessing_operations=True)
         del payload["queries"][0]["granularity"]

         # construct baseline query_cache_key from query_context with post processing operation
         query_context: QueryContext = ChartDataQueryContextSchema().load(payload)
         query_object: QueryObject = query_context.queries[0]
         cache_key_original = query_context.query_cache_key(query_object)

         payload["queries"][0]["granularity"] = None
         query_context = ChartDataQueryContextSchema().load(payload)
         query_object = query_context.queries[0]

         assert query_context.query_cache_key(query_object) == cache_key_original

     def test_query_cache_key_changes_when_post_processing_is_updated(self):
         self.login(username="admin")
         payload = get_query_context("birth_names", add_postprocessing_operations=True)

         # construct baseline query_cache_key from query_context with post processing operation
         query_context = ChartDataQueryContextSchema().load(payload)
         query_object = query_context.queries[0]
         cache_key_original = query_context.query_cache_key(query_object)

         # ensure added None post_processing operation doesn't change query_cache_key
         payload["queries"][0]["post_processing"].append(None)
         query_context = ChartDataQueryContextSchema().load(payload)
         query_object = query_context.queries[0]
         cache_key = query_context.query_cache_key(query_object)
         self.assertEqual(cache_key_original, cache_key)

         # ensure query without post processing operation is different
         payload["queries"][0].pop("post_processing")
         query_context = ChartDataQueryContextSchema().load(payload)
         query_object = query_context.queries[0]
         cache_key = query_context.query_cache_key(query_object)
         self.assertNotEqual(cache_key_original, cache_key)

     def test_query_context_time_range_endpoints(self):
         """
         Ensure that time_range_endpoints are populated automatically when missing
         from the payload.
         """
         self.login(username="admin")
         payload = get_query_context("birth_names")
         del payload["queries"][0]["extras"]["time_range_endpoints"]
         query_context = ChartDataQueryContextSchema().load(payload)
         query_object = query_context.queries[0]
         extras = query_object.to_dict()["extras"]
         assert "time_range_endpoints" in extras
         self.assertEqual(
             extras["time_range_endpoints"],
             (TimeRangeEndpoint.INCLUSIVE, TimeRangeEndpoint.EXCLUSIVE),
         )

     def test_handle_metrics_field(self):
         """
         Should support both predefined and adhoc metrics.
         """
         self.login(username="admin")
         adhoc_metric = {
             "expressionType": "SIMPLE",
             "column": {"column_name": "num_boys", "type": "BIGINT(20)"},
             "aggregate": "SUM",
             "label": "Boys",
             "optionName": "metric_11",
         }
         payload = get_query_context("birth_names")
         payload["queries"][0]["metrics"] = ["sum__num", {"label": "abc"}, adhoc_metric]
         query_context = ChartDataQueryContextSchema().load(payload)
         query_object = query_context.queries[0]
         self.assertEqual(query_object.metrics, ["sum__num", "abc", adhoc_metric])

     def test_convert_deprecated_fields(self):
         """
         Ensure that deprecated fields are converted correctly
         """
         self.login(username="admin")
         payload = get_query_context("birth_names")
         payload["queries"][0]["granularity_sqla"] = "timecol"
         payload["queries"][0]["having_filters"] = [{"col": "a", "op": "==", "val": "b"}]
         query_context = ChartDataQueryContextSchema().load(payload)
         self.assertEqual(len(query_context.queries), 1)
         query_object = query_context.queries[0]
         self.assertEqual(query_object.granularity, "timecol")
         self.assertIn("having_druid", query_object.extras)

     @pytest.mark.usefixtures("load_birth_names_dashboard_with_slices")
     def test_csv_response_format(self):
         """
         Ensure that CSV result format works
         """
         self.login(username="admin")
         payload = get_query_context("birth_names")
         payload["result_format"] = ChartDataResultFormat.CSV.value
         payload["queries"][0]["row_limit"] = 10
         query_context = ChartDataQueryContextSchema().load(payload)
         responses = query_context.get_payload()
         self.assertEqual(len(responses), 1)
         data = responses["queries"][0]["data"]
         self.assertIn("name,sum__num\n", data)
         self.assertEqual(len(data.split("\n")), 12)

     def test_sql_injection_via_groupby(self):
         """
         Ensure that calling invalid columns names in groupby are caught
         """
         self.login(username="admin")
         payload = get_query_context("birth_names")
         payload["queries"][0]["groupby"] = ["currentDatabase()"]
         query_context = ChartDataQueryContextSchema().load(payload)
         query_payload = query_context.get_payload()
         assert query_payload["queries"][0].get("error") is not None

     def test_sql_injection_via_columns(self):
         """
         Ensure that calling invalid column names in columns are caught
         """
         self.login(username="admin")
         payload = get_query_context("birth_names")
         payload["queries"][0]["groupby"] = []
         payload["queries"][0]["metrics"] = []
         payload["queries"][0]["columns"] = ["*, 'extra'"]
         query_context = ChartDataQueryContextSchema().load(payload)
         query_payload = query_context.get_payload()
         assert query_payload["queries"][0].get("error") is not None

     def test_sql_injection_via_metrics(self):
         """
         Ensure that calling invalid column names in filters are caught
         """
         self.login(username="admin")
         payload = get_query_context("birth_names")
         payload["queries"][0]["groupby"] = ["name"]
         payload["queries"][0]["metrics"] = [
             {
                 "expressionType": AdhocMetricExpressionType.SIMPLE.value,
                 "column": {"column_name": "invalid_col"},
                 "aggregate": "SUM",
                 "label": "My Simple Label",
             }
         ]
         query_context = ChartDataQueryContextSchema().load(payload)
         query_payload = query_context.get_payload()
         assert query_payload["queries"][0].get("error") is not None

     @pytest.mark.usefixtures("load_birth_names_dashboard_with_slices")
     def test_samples_response_type(self):
         """
         Ensure that samples result type works
         """
         self.login(username="admin")
         payload = get_query_context("birth_names")
         payload["result_type"] = ChartDataResultType.SAMPLES.value
         payload["queries"][0]["row_limit"] = 5
         query_context = ChartDataQueryContextSchema().load(payload)
         responses = query_context.get_payload()
         self.assertEqual(len(responses), 1)
         data = responses["queries"][0]["data"]
         self.assertIsInstance(data, list)
         self.assertEqual(len(data), 5)
         self.assertNotIn("sum__num", data[0])

     @pytest.mark.usefixtures("load_birth_names_dashboard_with_slices")
     def test_query_response_type(self):
         """
         Ensure that query result type works
         """
         self.login(username="admin")
         payload = get_query_context("birth_names")
         sql_text = get_sql_text(payload)
         assert "SELECT" in sql_text
         assert re.search(r'[`"\[]?num[`"\]]? IS NOT NULL', sql_text)
         assert re.search(
             r"""NOT \([`"\[]?name[`"\]]? IS NULL[\s\n]* """
             r"""OR [`"\[]?name[`"\]]? IN \('abc'\)\)""",
             sql_text,
         )

     @pytest.mark.usefixtures("load_birth_names_dashboard_with_slices")
     def test_handle_sort_by_metrics(self):
         """
         Should properly handle sort by metrics in various scenarios.
         """
         self.login(username="admin")

         sql_text = get_sql_text(get_query_context("birth_names"))
         if backend() == "hive":
             # should have no duplicate `SUM(num)`
             assert "SUM(num) AS `sum__num`," not in sql_text
             assert "SUM(num) AS `sum__num`" in sql_text
             # the alias should be in ORDER BY
             assert "ORDER BY `sum__num` DESC" in sql_text
         else:
             assert re.search(r'ORDER BY [`"\[]?sum__num[`"\]]? DESC', sql_text)

         sql_text = get_sql_text(
             get_query_context("birth_names:only_orderby_has_metric")
         )
         if backend() == "hive":
             assert "SUM(num) AS `sum__num`," not in sql_text
             assert "SUM(num) AS `sum__num`" in sql_text
             assert "ORDER BY `sum__num` DESC" in sql_text
         else:
             assert re.search(
                 r'ORDER BY SUM\([`"\[]?num[`"\]]?\) DESC', sql_text, re.IGNORECASE
             )

         sql_text = get_sql_text(get_query_context("birth_names:orderby_dup_alias"))

         # Check SELECT clauses
         if backend() == "presto":
             # presto cannot have ambiguous alias in order by, so selected column
             # alias is renamed.
             assert 'sum("num_boys") AS "num_boys__"' in sql_text
         else:
             assert re.search(
                 r'SUM\([`"\[]?num_boys[`"\]]?\) AS [`\"\[]?num_boys[`"\]]?',
                 sql_text,
                 re.IGNORECASE,
             )

         # Check ORDER BY clauses
         if backend() == "hive":
             # Hive must add additional SORT BY metrics to SELECT
             assert re.search(
                 r"MAX\(CASE.*END\) AS `MAX\(CASE WHEN...`",
                 sql_text,
                 re.IGNORECASE | re.DOTALL,
             )

             # The additional column with the same expression but a different label
             # as an existing metric should not be added
             assert "sum(`num_girls`) AS `SUM(num_girls)`" not in sql_text

             # Should reference all ORDER BY columns by aliases
             assert "ORDER BY `num_girls` DESC," in sql_text
             assert "`AVG(num_boys)` DESC," in sql_text
             assert "`MAX(CASE WHEN...` ASC" in sql_text
         else:
             if backend() == "presto":
                 # since the selected `num_boys` is renamed to `num_boys__`
                 # it must be references as expression
                 assert re.search(
                     r'ORDER BY SUM\([`"\[]?num_girls[`"\]]?\) DESC',
                     sql_text,
                     re.IGNORECASE,
                 )
             else:
                 # Should reference the adhoc metric by alias when possible
                 assert re.search(
                     r'ORDER BY [`"\[]?num_girls[`"\]]? DESC', sql_text, re.IGNORECASE,
                 )

             # ORDER BY only columns should always be expressions
             assert re.search(
                 r'AVG\([`"\[]?num_boys[`"\]]?\) DESC', sql_text, re.IGNORECASE,
             )
             assert re.search(
                 r"MAX\(CASE.*END\) ASC", sql_text, re.IGNORECASE | re.DOTALL
             )

     @pytest.mark.usefixtures("load_birth_names_dashboard_with_slices")
     def test_fetch_values_predicate(self):
         """
         Ensure that fetch values predicate is added to query if needed
         """
         self.login(username="admin")

         payload = get_query_context("birth_names")
         sql_text = get_sql_text(payload)
         assert "123 = 123" not in sql_text

         payload["queries"][0]["apply_fetch_values_predicate"] = True
         sql_text = get_sql_text(payload)
         assert "123 = 123" in sql_text

     def test_query_object_unknown_fields(self):
         """
         Ensure that query objects with unknown fields don't raise an Exception and
         have an identical cache key as one without the unknown field
         """
         self.login(username="admin")
         payload = get_query_context("birth_names")
         query_context = ChartDataQueryContextSchema().load(payload)
         responses = query_context.get_payload()
         orig_cache_key = responses["queries"][0]["cache_key"]
         payload["queries"][0]["foo"] = "bar"
         query_context = ChartDataQueryContextSchema().load(payload)
         responses = query_context.get_payload()
         new_cache_key = responses["queries"][0]["cache_key"]
         self.assertEqual(orig_cache_key, new_cache_key)
	# Licensed to the Apache Software Foundation (ASF) under one
	# or more contributor license agreements. See the NOTICE file
	# distributed with this work for additional information
	# regarding copyright ownership. The ASF licenses this file
	# to you under the Apache License, Version 2.0 (the
	# "License"); you may not use this file except in compliance
	# with the License. You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing,
	# software distributed under the License is distributed on an
	# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
	# KIND, either express or implied. See the License for the
	# specific language governing permissions and limitations
	# under the License.
	import re
	from typing import Any, Dict

	import pytest

	from superset import db
	from superset.charts.schemas import ChartDataQueryContextSchema
	from superset.common.query_context import QueryContext
	from superset.common.query_object import QueryObject
	from superset.connectors.connector_registry import ConnectorRegistry
	from superset.extensions import cache_manager
	from superset.utils.core import (
	AdhocMetricExpressionType,
	backend,
	ChartDataResultFormat,
	ChartDataResultType,
	TimeRangeEndpoint,
	)
	from tests.base_tests import SupersetTestCase
	from tests.fixtures.birth_names_dashboard import load_birth_names_dashboard_with_slices
	from tests.fixtures.query_context import get_query_context


	def get_sql_text(payload: Dict[str, Any]) -> str:
	payload["result_type"] = ChartDataResultType.QUERY.value
	query_context = ChartDataQueryContextSchema().load(payload)
	responses = query_context.get_payload()
	assert len(responses) == 1
	response = responses["queries"][0]
	assert len(response) == 2
	assert response["language"] == "sql"
	return response["query"]


	class TestQueryContext(SupersetTestCase):
	def test_schema_deserialization(self):
	"""
	Ensure that the deserialized QueryContext contains all required fields.
	"""

	payload = get_query_context("birth_names", add_postprocessing_operations=True)
	query_context = ChartDataQueryContextSchema().load(payload)
	self.assertEqual(len(query_context.queries), len(payload["queries"]))

	for query_idx, query in enumerate(query_context.queries):
	payload_query = payload["queries"][query_idx]

	# check basic properies
	self.assertEqual(query.extras, payload_query["extras"])
	self.assertEqual(query.filter, payload_query["filters"])
	self.assertEqual(query.groupby, payload_query["groupby"])

	# metrics are mutated during creation
	for metric_idx, metric in enumerate(query.metrics):
	payload_metric = payload_query["metrics"][metric_idx]
	payload_metric = (
	payload_metric
	if "expressionType" in payload_metric
	else payload_metric["label"]
	)
	self.assertEqual(metric, payload_metric)

	self.assertEqual(query.orderby, payload_query["orderby"])
	self.assertEqual(query.time_range, payload_query["time_range"])

	# check post processing operation properties
	for post_proc_idx, post_proc in enumerate(query.post_processing):
	payload_post_proc = payload_query["post_processing"][post_proc_idx]
	self.assertEqual(post_proc["operation"], payload_post_proc["operation"])
	self.assertEqual(post_proc["options"], payload_post_proc["options"])

	def test_cache(self):
	table_name = "birth_names"
	table = self.get_table_by_name(table_name)
	payload = get_query_context(table.name, table.id)
	payload["force"] = True

	query_context = ChartDataQueryContextSchema().load(payload)
	query_object = query_context.queries[0]
	query_cache_key = query_context.query_cache_key(query_object)

	response = query_context.get_payload(cache_query_context=True)
	cache_key = response["cache_key"]
	assert cache_key is not None

	cached = cache_manager.cache.get(cache_key)
	assert cached is not None

	rehydrated_qc = ChartDataQueryContextSchema().load(cached["data"])
	rehydrated_qo = rehydrated_qc.queries[0]
	rehydrated_query_cache_key = rehydrated_qc.query_cache_key(rehydrated_qo)

	self.assertEqual(rehydrated_qc.datasource, query_context.datasource)
	self.assertEqual(len(rehydrated_qc.queries), 1)
	self.assertEqual(query_cache_key, rehydrated_query_cache_key)
	self.assertEqual(rehydrated_qc.result_type, query_context.result_type)
	self.assertEqual(rehydrated_qc.result_format, query_context.result_format)
	self.assertFalse(rehydrated_qc.force)

	def test_query_cache_key_changes_when_datasource_is_updated(self):
	self.login(username="admin")
	payload = get_query_context("birth_names")

	# construct baseline query_cache_key
	query_context = ChartDataQueryContextSchema().load(payload)
	query_object = query_context.queries[0]
	cache_key_original = query_context.query_cache_key(query_object)

	# make temporary change and revert it to refresh the changed_on property
	datasource = ConnectorRegistry.get_datasource(
	datasource_type=payload["datasource"]["type"],
	datasource_id=payload["datasource"]["id"],
	session=db.session,
	)
	description_original = datasource.description
	datasource.description = "temporary description"
	db.session.commit()
	datasource.description = description_original
	db.session.commit()

	# create new QueryContext with unchanged attributes, extract new query_cache_key
	query_context = ChartDataQueryContextSchema().load(payload)
	query_object = query_context.queries[0]
	cache_key_new = query_context.query_cache_key(query_object)

	# the new cache_key should be different due to updated datasource
	self.assertNotEqual(cache_key_original, cache_key_new)

	def test_query_cache_key_does_not_change_for_non_existent_or_null(self):
	self.login(username="admin")
	payload = get_query_context("birth_names", add_postprocessing_operations=True)
	del payload["queries"][0]["granularity"]

	# construct baseline query_cache_key from query_context with post processing operation
	query_context: QueryContext = ChartDataQueryContextSchema().load(payload)
	query_object: QueryObject = query_context.queries[0]
	cache_key_original = query_context.query_cache_key(query_object)

	payload["queries"][0]["granularity"] = None
	query_context = ChartDataQueryContextSchema().load(payload)
	query_object = query_context.queries[0]

	assert query_context.query_cache_key(query_object) == cache_key_original

	def test_query_cache_key_changes_when_post_processing_is_updated(self):
	self.login(username="admin")
	payload = get_query_context("birth_names", add_postprocessing_operations=True)

	# construct baseline query_cache_key from query_context with post processing operation
	query_context = ChartDataQueryContextSchema().load(payload)
	query_object = query_context.queries[0]
	cache_key_original = query_context.query_cache_key(query_object)

	# ensure added None post_processing operation doesn't change query_cache_key
	payload["queries"][0]["post_processing"].append(None)
	query_context = ChartDataQueryContextSchema().load(payload)
	query_object = query_context.queries[0]
	cache_key = query_context.query_cache_key(query_object)
	self.assertEqual(cache_key_original, cache_key)

	# ensure query without post processing operation is different
	payload["queries"][0].pop("post_processing")
	query_context = ChartDataQueryContextSchema().load(payload)
	query_object = query_context.queries[0]
	cache_key = query_context.query_cache_key(query_object)
	self.assertNotEqual(cache_key_original, cache_key)

	def test_query_context_time_range_endpoints(self):
	"""
	Ensure that time_range_endpoints are populated automatically when missing
	from the payload.
	"""
	self.login(username="admin")
	payload = get_query_context("birth_names")
	del payload["queries"][0]["extras"]["time_range_endpoints"]
	query_context = ChartDataQueryContextSchema().load(payload)
	query_object = query_context.queries[0]
	extras = query_object.to_dict()["extras"]
	assert "time_range_endpoints" in extras
	self.assertEqual(
	extras["time_range_endpoints"],
	(TimeRangeEndpoint.INCLUSIVE, TimeRangeEndpoint.EXCLUSIVE),
	)

	def test_handle_metrics_field(self):
	"""
	Should support both predefined and adhoc metrics.
	"""
	self.login(username="admin")
	adhoc_metric = {
	"expressionType": "SIMPLE",
	"column": {"column_name": "num_boys", "type": "BIGINT(20)"},
	"aggregate": "SUM",
	"label": "Boys",
	"optionName": "metric_11",
	}
	payload = get_query_context("birth_names")
	payload["queries"][0]["metrics"] = ["sum__num", {"label": "abc"}, adhoc_metric]
	query_context = ChartDataQueryContextSchema().load(payload)
	query_object = query_context.queries[0]
	self.assertEqual(query_object.metrics, ["sum__num", "abc", adhoc_metric])

	def test_convert_deprecated_fields(self):
	"""
	Ensure that deprecated fields are converted correctly
	"""
	self.login(username="admin")
	payload = get_query_context("birth_names")
	payload["queries"][0]["granularity_sqla"] = "timecol"
	payload["queries"][0]["having_filters"] = [{"col": "a", "op": "==", "val": "b"}]
	query_context = ChartDataQueryContextSchema().load(payload)
	self.assertEqual(len(query_context.queries), 1)
	query_object = query_context.queries[0]
	self.assertEqual(query_object.granularity, "timecol")
	self.assertIn("having_druid", query_object.extras)

	@pytest.mark.usefixtures("load_birth_names_dashboard_with_slices")
	def test_csv_response_format(self):
	"""
	Ensure that CSV result format works
	"""
	self.login(username="admin")
	payload = get_query_context("birth_names")
	payload["result_format"] = ChartDataResultFormat.CSV.value
	payload["queries"][0]["row_limit"] = 10
	query_context = ChartDataQueryContextSchema().load(payload)
	responses = query_context.get_payload()
	self.assertEqual(len(responses), 1)
	data = responses["queries"][0]["data"]
	self.assertIn("name,sum__num\n", data)
	self.assertEqual(len(data.split("\n")), 12)

	def test_sql_injection_via_groupby(self):
	"""
	Ensure that calling invalid columns names in groupby are caught
	"""
	self.login(username="admin")
	payload = get_query_context("birth_names")
	payload["queries"][0]["groupby"] = ["currentDatabase()"]
	query_context = ChartDataQueryContextSchema().load(payload)
	query_payload = query_context.get_payload()
	assert query_payload["queries"][0].get("error") is not None

	def test_sql_injection_via_columns(self):
	"""
	Ensure that calling invalid column names in columns are caught
	"""
	self.login(username="admin")
	payload = get_query_context("birth_names")
	payload["queries"][0]["groupby"] = []
	payload["queries"][0]["metrics"] = []
	payload["queries"][0]["columns"] = ["*, 'extra'"]
	query_context = ChartDataQueryContextSchema().load(payload)
	query_payload = query_context.get_payload()
	assert query_payload["queries"][0].get("error") is not None

	def test_sql_injection_via_metrics(self):
	"""
	Ensure that calling invalid column names in filters are caught
	"""
	self.login(username="admin")
	payload = get_query_context("birth_names")
	payload["queries"][0]["groupby"] = ["name"]
	payload["queries"][0]["metrics"] = [
	{
	"expressionType": AdhocMetricExpressionType.SIMPLE.value,
	"column": {"column_name": "invalid_col"},
	"aggregate": "SUM",
	"label": "My Simple Label",
	}
	]
	query_context = ChartDataQueryContextSchema().load(payload)
	query_payload = query_context.get_payload()
	assert query_payload["queries"][0].get("error") is not None

	@pytest.mark.usefixtures("load_birth_names_dashboard_with_slices")
	def test_samples_response_type(self):
	"""
	Ensure that samples result type works
	"""
	self.login(username="admin")
	payload = get_query_context("birth_names")
	payload["result_type"] = ChartDataResultType.SAMPLES.value
	payload["queries"][0]["row_limit"] = 5
	query_context = ChartDataQueryContextSchema().load(payload)
	responses = query_context.get_payload()
	self.assertEqual(len(responses), 1)
	data = responses["queries"][0]["data"]
	self.assertIsInstance(data, list)
	self.assertEqual(len(data), 5)
	self.assertNotIn("sum__num", data[0])

	@pytest.mark.usefixtures("load_birth_names_dashboard_with_slices")
	def test_query_response_type(self):
	"""
	Ensure that query result type works
	"""
	self.login(username="admin")
	payload = get_query_context("birth_names")
	sql_text = get_sql_text(payload)
	assert "SELECT" in sql_text
	assert re.search(r'[`"\[]?num[`"\]]? IS NOT NULL', sql_text)
	assert re.search(
	r"""NOT \([`"\[]?name[`"\]]? IS NULL[\s\n]* """
	r"""OR [`"\[]?name[`"\]]? IN \('abc'\)\)""",
	sql_text,
	)

	@pytest.mark.usefixtures("load_birth_names_dashboard_with_slices")
	def test_handle_sort_by_metrics(self):
	"""
	Should properly handle sort by metrics in various scenarios.
	"""
	self.login(username="admin")

	sql_text = get_sql_text(get_query_context("birth_names"))
	if backend() == "hive":
	# should have no duplicate `SUM(num)`
	assert "SUM(num) AS `sum__num`," not in sql_text
	assert "SUM(num) AS `sum__num`" in sql_text
	# the alias should be in ORDER BY
	assert "ORDER BY `sum__num` DESC" in sql_text
	else:
	assert re.search(r'ORDER BY [`"\[]?sum__num[`"\]]? DESC', sql_text)

	sql_text = get_sql_text(
	get_query_context("birth_names:only_orderby_has_metric")
	)
	if backend() == "hive":
	assert "SUM(num) AS `sum__num`," not in sql_text
	assert "SUM(num) AS `sum__num`" in sql_text
	assert "ORDER BY `sum__num` DESC" in sql_text
	else:
	assert re.search(
	r'ORDER BY SUM\([`"\[]?num[`"\]]?\) DESC', sql_text, re.IGNORECASE
	)

	sql_text = get_sql_text(get_query_context("birth_names:orderby_dup_alias"))

	# Check SELECT clauses
	if backend() == "presto":
	# presto cannot have ambiguous alias in order by, so selected column
	# alias is renamed.
	assert 'sum("num_boys") AS "num_boys__"' in sql_text
	else:
	assert re.search(
	r'SUM\([`"\[]?num_boys[`"\]]?\) AS [`\"\[]?num_boys[`"\]]?',
	sql_text,
	re.IGNORECASE,
	)

	# Check ORDER BY clauses
	if backend() == "hive":
	# Hive must add additional SORT BY metrics to SELECT
	assert re.search(
	r"MAX\(CASE.*END\) AS `MAX\(CASE WHEN...`",
	sql_text,
	re.IGNORECASE \| re.DOTALL,
	)

	# The additional column with the same expression but a different label
	# as an existing metric should not be added
	assert "sum(`num_girls`) AS `SUM(num_girls)`" not in sql_text

	# Should reference all ORDER BY columns by aliases
	assert "ORDER BY `num_girls` DESC," in sql_text
	assert "`AVG(num_boys)` DESC," in sql_text
	assert "`MAX(CASE WHEN...` ASC" in sql_text
	else:
	if backend() == "presto":
	# since the selected `num_boys` is renamed to `num_boys__`
	# it must be references as expression
	assert re.search(
	r'ORDER BY SUM\([`"\[]?num_girls[`"\]]?\) DESC',
	sql_text,
	re.IGNORECASE,
	)
	else:
	# Should reference the adhoc metric by alias when possible
	assert re.search(
	r'ORDER BY [`"\[]?num_girls[`"\]]? DESC', sql_text, re.IGNORECASE,
	)

	# ORDER BY only columns should always be expressions
	assert re.search(
	r'AVG\([`"\[]?num_boys[`"\]]?\) DESC', sql_text, re.IGNORECASE,
	)
	assert re.search(
	r"MAX\(CASE.*END\) ASC", sql_text, re.IGNORECASE \| re.DOTALL
	)

	@pytest.mark.usefixtures("load_birth_names_dashboard_with_slices")
	def test_fetch_values_predicate(self):
	"""
	Ensure that fetch values predicate is added to query if needed
	"""
	self.login(username="admin")

	payload = get_query_context("birth_names")
	sql_text = get_sql_text(payload)
	assert "123 = 123" not in sql_text

	payload["queries"][0]["apply_fetch_values_predicate"] = True
	sql_text = get_sql_text(payload)
	assert "123 = 123" in sql_text

	def test_query_object_unknown_fields(self):
	"""
	Ensure that query objects with unknown fields don't raise an Exception and
	have an identical cache key as one without the unknown field
	"""
	self.login(username="admin")
	payload = get_query_context("birth_names")
	query_context = ChartDataQueryContextSchema().load(payload)
	responses = query_context.get_payload()
	orig_cache_key = responses["queries"][0]["cache_key"]
	payload["queries"][0]["foo"] = "bar"
	query_context = ChartDataQueryContextSchema().load(payload)
	responses = query_context.get_payload()
	new_cache_key = responses["queries"][0]["cache_key"]
	self.assertEqual(orig_cache_key, new_cache_key)