mirror of
https://github.com/apache/superset.git
synced 2024-09-19 20:19:37 -04:00
331 lines
10 KiB
Python
331 lines
10 KiB
Python
# Licensed to the Apache Software Foundation (ASF) under one
|
|
# or more contributor license agreements. See the NOTICE file
|
|
# distributed with this work for additional information
|
|
# regarding copyright ownership. The ASF licenses this file
|
|
# to you under the Apache License, Version 2.0 (the
|
|
# "License"); you may not use this file except in compliance
|
|
# with the License. You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing,
|
|
# software distributed under the License is distributed on an
|
|
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
# KIND, either express or implied. See the License for the
|
|
# specific language governing permissions and limitations
|
|
# under the License.
|
|
# pylint: disable=import-outside-toplevel, unused-argument, redefined-outer-name, invalid-name
|
|
|
|
from functools import partial
|
|
from typing import Any, Dict, TYPE_CHECKING
|
|
|
|
import pytest
|
|
from pytest_mock import MockerFixture
|
|
from sqlalchemy.orm.session import Session
|
|
|
|
if TYPE_CHECKING:
|
|
from superset.connectors.sqla.models import SqlaTable
|
|
|
|
# Example ``dttm_defaults`` payload that uses every key read by
# ``apply_dttm_defaults``: a main datetime column plus per-column
# ``python_date_format`` / ``expression`` defaults.
FULL_DTTM_DEFAULTS_EXAMPLE = {
    "main_dttm_col": "id",
    "dttm_columns": {
        "dttm": {
            "python_date_format": "epoch_s",
            "expression": "CAST(dttm as INTEGER)",
        },
        # Format-only entry: no expression default is supplied for ``id``.
        "id": {
            "python_date_format": "epoch_ms",
        },
        "month": {
            "python_date_format": "%Y-%m-%d",
            "expression": (
                "CASE WHEN length(month) = 7 THEN month || '-01' ELSE month END"
            ),
        },
    },
}
|
|
|
|
|
|
def apply_dttm_defaults(table: "SqlaTable", dttm_defaults: Dict[str, Any]) -> None:
    """
    Apply datetime-column defaults to ``table``, mutating it in place.

    Every column of ``table`` whose name is a key of
    ``dttm_defaults["dttm_columns"]`` is flagged with ``is_dttm = True`` and has
    its ``python_date_format`` and ``expression`` filled in from the matching
    entry, but only where the column's current value is falsy. Columns that
    are not listed are left untouched.

    ``table.main_dttm_col`` is assigned only when a column named
    ``dttm_defaults["main_dttm_col"]`` exists on the table *and* is listed in
    ``dttm_columns``; otherwise it keeps its current value.

    :param table: object exposing ``columns`` and ``main_dttm_col``; each column
        exposes ``column_name``, ``is_dttm``, ``python_date_format`` and
        ``expression``
    :param dttm_defaults: mapping with the optional keys ``main_dttm_col`` (a
        column name) and ``dttm_columns`` (column name -> mapping with the
        optional keys ``python_date_format`` and ``expression``)
    """
    # Both lookups are loop-invariant, so resolve them once. ``or {}`` also
    # tolerates an explicit ``"dttm_columns": None``.
    dttm_columns = dttm_defaults.get("dttm_columns") or {}
    main_dttm_col = dttm_defaults.get("main_dttm_col")

    for dbcol in table.columns:
        # Skip non dttm columns.
        if dbcol.column_name not in dttm_columns:
            continue

        # Set is_dttm because the column is listed in dttm_columns.
        dbcol.is_dttm = True

        # Set table main_dttm_col.
        if dbcol.column_name == main_dttm_col:
            table.main_dttm_col = dbcol.column_name

        # Apply defaults if empty; a ``None`` entry means "no defaults".
        column_defaults = dttm_columns[dbcol.column_name] or {}
        if not dbcol.python_date_format and "python_date_format" in column_defaults:
            dbcol.python_date_format = column_defaults["python_date_format"]
        if not dbcol.expression and "expression" in column_defaults:
            dbcol.expression = column_defaults["expression"]
|
|
|
|
|
|
@pytest.fixture
def test_table(session: Session) -> "SqlaTable":
    """
    Build the ``SqlaTable`` named ``test_table`` used by the tests below.

    The model tables are first created on the engine bound to ``session``. The
    returned dataset has two ``TIMESTAMP`` columns flagged as datetime (``ds``
    and ``event_time``), three ``INTEGER`` columns (``id``, ``dttm`` and
    ``duration_ms``), no metrics, no main datetime column, and a database whose
    URI is ``sqlite://``.
    """
    from superset.connectors.sqla.models import SqlaTable, TableColumn
    from superset.models.core import Database

    SqlaTable.metadata.create_all(session.get_bind())  # pylint: disable=no-member

    timestamp_columns = [
        TableColumn(column_name=name, is_dttm=1, type="TIMESTAMP")
        for name in ("ds", "event_time")
    ]
    integer_columns = [
        TableColumn(column_name=name, type="INTEGER")
        for name in ("id", "dttm", "duration_ms")
    ]
    database = Database(database_name="my_database", sqlalchemy_uri="sqlite://")

    return SqlaTable(
        table_name="test_table",
        columns=timestamp_columns + integer_columns,
        metrics=[],
        main_dttm_col=None,
        database=database,
    )
|
|
|
|
|
|
def test_main_dttm_col(mocker: MockerFixture, test_table: "SqlaTable") -> None:
    """
    Check that ``SQLA_TABLE_MUTATOR`` can pick the table's main datetime column.

    ``event_time`` is both listed under ``dttm_columns`` and named as
    ``main_dttm_col``, so it is expected to be the main datetime column once
    the metadata has been fetched.
    """
    mutator = partial(
        apply_dttm_defaults,
        dttm_defaults={
            "main_dttm_col": "event_time",
            "dttm_columns": {"ds": {}, "event_time": {}},
        },
    )
    physical_columns = [
        {"name": "ds", "type": "TIMESTAMP", "is_dttm": True},
        {"name": "event_time", "type": "TIMESTAMP", "is_dttm": True},
        {"name": "id", "type": "INTEGER", "is_dttm": False},
    ]

    # Swap the models module's ``config`` for a dict holding only the mutator.
    mocker.patch(
        "superset.connectors.sqla.models.config",
        new={"SQLA_TABLE_MUTATOR": mutator},
    )
    # Stub the physical column lookup with a fixed column list.
    mocker.patch(
        "superset.connectors.sqla.models.get_physical_table_metadata",
        return_value=physical_columns,
    )

    # The fixture starts out without a main datetime column.
    assert test_table.main_dttm_col is None
    test_table.fetch_metadata()
    assert test_table.main_dttm_col == "event_time"
|
|
|
|
|
|
def test_main_dttm_col_nonexistent(
    mocker: MockerFixture,
    test_table: "SqlaTable",
) -> None:
    """
    Check ``SQLA_TABLE_MUTATOR`` when the requested main datetime column is absent.

    The defaults name a ``main_dttm_col`` that matches none of the mocked
    columns and list no ``dttm_columns``, so the mutator cannot select it.
    """
    mutator = partial(
        apply_dttm_defaults,
        dttm_defaults={"main_dttm_col": "nonexistent"},
    )
    physical_columns = [
        {"name": "ds", "type": "TIMESTAMP", "is_dttm": True},
        {"name": "event_time", "type": "TIMESTAMP", "is_dttm": True},
        {"name": "id", "type": "INTEGER", "is_dttm": False},
    ]

    # Swap the models module's ``config`` for a dict holding only the mutator.
    mocker.patch(
        "superset.connectors.sqla.models.config",
        new={"SQLA_TABLE_MUTATOR": mutator},
    )
    # Stub the physical column lookup with a fixed column list.
    mocker.patch(
        "superset.connectors.sqla.models.get_physical_table_metadata",
        return_value=physical_columns,
    )

    # The fixture starts out without a main datetime column.
    assert test_table.main_dttm_col is None
    test_table.fetch_metadata()
    # fall back to ds
    assert test_table.main_dttm_col == "ds"
|
|
|
|
|
|
def test_main_dttm_col_nondttm(
    mocker: MockerFixture,
    test_table: "SqlaTable",
) -> None:
    """
    Check ``SQLA_TABLE_MUTATOR`` when the main datetime column is not a datetime.

    The defaults name ``id`` (reported as ``INTEGER`` with ``is_dttm`` false by
    the mocked metadata) as ``main_dttm_col`` without listing it under
    ``dttm_columns``, so the mutator does not select it.
    """
    mutator = partial(
        apply_dttm_defaults,
        dttm_defaults={"main_dttm_col": "id"},
    )
    physical_columns = [
        {"name": "ds", "type": "TIMESTAMP", "is_dttm": True},
        {"name": "event_time", "type": "TIMESTAMP", "is_dttm": True},
        {"name": "id", "type": "INTEGER", "is_dttm": False},
    ]

    # Swap the models module's ``config`` for a dict holding only the mutator.
    mocker.patch(
        "superset.connectors.sqla.models.config",
        new={"SQLA_TABLE_MUTATOR": mutator},
    )
    # Stub the physical column lookup with a fixed column list.
    mocker.patch(
        "superset.connectors.sqla.models.get_physical_table_metadata",
        return_value=physical_columns,
    )

    # The fixture starts out without a main datetime column.
    assert test_table.main_dttm_col is None
    test_table.fetch_metadata()
    # fall back to ds
    assert test_table.main_dttm_col == "ds"
|
|
|
|
|
|
def test_python_date_format_by_column_name(
    mocker: MockerFixture,
    test_table: "SqlaTable",
) -> None:
    """
    Check that ``SQLA_TABLE_MUTATOR`` can set ``python_date_format`` per column.

    Each column listed under ``dttm_columns`` is expected to end up flagged as
    datetime and carrying the configured format string; the value
    ``"invalid"`` is expected to be stored as given.
    """
    mutator = partial(
        apply_dttm_defaults,
        dttm_defaults={
            "dttm_columns": {
                "id": {"python_date_format": "epoch_ms"},
                "dttm": {"python_date_format": "epoch_s"},
                "duration_ms": {"python_date_format": "invalid"},
            },
        },
    )
    physical_columns = [
        {"name": "id", "type": "INTEGER", "is_dttm": False},
        {"name": "dttm", "type": "INTEGER", "is_dttm": False},
        {"name": "duration_ms", "type": "INTEGER", "is_dttm": False},
    ]

    # Swap the models module's ``config`` for a dict holding only the mutator.
    mocker.patch(
        "superset.connectors.sqla.models.config",
        new={"SQLA_TABLE_MUTATOR": mutator},
    )
    # Stub the physical column lookup with a fixed column list.
    mocker.patch(
        "superset.connectors.sqla.models.get_physical_table_metadata",
        return_value=physical_columns,
    )

    test_table.fetch_metadata()

    # Checked in the same order as the columns are configured above.
    expected_formats = (
        ("id", "epoch_ms"),
        ("dttm", "epoch_s"),
        ("duration_ms", "invalid"),
    )
    for column_name, date_format in expected_formats:
        matches = [
            col for col in test_table.columns if col.column_name == column_name
        ]
        column = matches[0]
        assert column.is_dttm
        assert column.python_date_format == date_format
|
|
|
|
|
|
def test_expression_by_column_name(
    mocker: MockerFixture,
    test_table: "SqlaTable",
) -> None:
    """
    Check that ``SQLA_TABLE_MUTATOR`` can set a column ``expression`` per column.

    Each column listed under ``dttm_columns`` is expected to end up flagged as
    datetime and carrying the configured SQL expression.
    """
    mutator = partial(
        apply_dttm_defaults,
        dttm_defaults={
            "dttm_columns": {
                "dttm": {"expression": "CAST(dttm as INTEGER)"},
                "duration_ms": {"expression": "CAST(duration_ms as DOUBLE)"},
            },
        },
    )
    physical_columns = [
        {"name": "dttm", "type": "INTEGER", "is_dttm": False},
        {"name": "duration_ms", "type": "INTEGER", "is_dttm": False},
    ]

    # Swap the models module's ``config`` for a dict holding only the mutator.
    mocker.patch(
        "superset.connectors.sqla.models.config",
        new={"SQLA_TABLE_MUTATOR": mutator},
    )
    # Stub the physical column lookup with a fixed column list.
    mocker.patch(
        "superset.connectors.sqla.models.get_physical_table_metadata",
        return_value=physical_columns,
    )

    test_table.fetch_metadata()

    # Checked in the same order as the columns are configured above.
    expected_expressions = (
        ("dttm", "CAST(dttm as INTEGER)"),
        ("duration_ms", "CAST(duration_ms as DOUBLE)"),
    )
    for column_name, expression in expected_expressions:
        matches = [
            col for col in test_table.columns if col.column_name == column_name
        ]
        column = matches[0]
        assert column.is_dttm
        assert column.expression == expression
|
|
|
|
|
|
def test_full_setting(
    mocker: MockerFixture,
    test_table: "SqlaTable",
) -> None:
    """
    Check ``SQLA_TABLE_MUTATOR`` driven by ``FULL_DTTM_DEFAULTS_EXAMPLE``.

    The mocked physical metadata reports ``id``, ``dttm`` and ``duration_ms``.
    Only ``id`` and ``dttm`` are verified: both must be flagged as datetime and
    carry the configured format, ``dttm`` must also carry the configured
    expression, and ``id`` (which has no expression default) must have an
    empty-string expression.
    """
    mutator = partial(
        apply_dttm_defaults,
        dttm_defaults=FULL_DTTM_DEFAULTS_EXAMPLE,
    )
    physical_columns = [
        {"name": "id", "type": "INTEGER", "is_dttm": False},
        {"name": "dttm", "type": "INTEGER", "is_dttm": False},
        {"name": "duration_ms", "type": "INTEGER", "is_dttm": False},
    ]

    # Swap the models module's ``config`` for a dict holding only the mutator.
    mocker.patch(
        "superset.connectors.sqla.models.config",
        new={"SQLA_TABLE_MUTATOR": mutator},
    )
    # Stub the physical column lookup with a fixed column list.
    mocker.patch(
        "superset.connectors.sqla.models.get_physical_table_metadata",
        return_value=physical_columns,
    )

    test_table.fetch_metadata()

    # (column name, expected python_date_format, expected expression)
    expectations = (
        ("id", "epoch_ms", ""),
        ("dttm", "epoch_s", "CAST(dttm as INTEGER)"),
    )
    for column_name, date_format, expression in expectations:
        matches = [
            col for col in test_table.columns if col.column_name == column_name
        ]
        column = matches[0]
        assert column.is_dttm
        assert column.python_date_format == date_format
        assert column.expression == expression
|