mirror of
https://github.com/apache/superset.git
synced 2026-04-17 07:05:04 +00:00
feat(database): SIP-195 Add MongoDB database engine support (#37368)
Co-authored-by: Peng Ren <ia250@cummins.com>
This commit is contained in:
BIN
docs/static/img/databases/mongodb.png
vendored
Normal file
BIN
docs/static/img/databases/mongodb.png
vendored
Normal file
Binary file not shown.
|
After Width: | Height: | Size: 22 KiB |
125
superset/db_engine_specs/mongodb.py
Normal file
125
superset/db_engine_specs/mongodb.py
Normal file
@@ -0,0 +1,125 @@
|
||||
# Licensed to the Apache Software Foundation (ASF) under one
|
||||
# or more contributor license agreements. See the NOTICE file
|
||||
# distributed with this work for additional information
|
||||
# regarding copyright ownership. The ASF licenses this file
|
||||
# to you under the Apache License, Version 2.0 (the
|
||||
# "License"); you may not use this file except in compliance
|
||||
# with the License. You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing,
|
||||
# software distributed under the License is distributed on an
|
||||
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
||||
# KIND, either express or implied. See the License for the
|
||||
# specific language governing permissions and limitations
|
||||
# under the License.
|
||||
"""MongoDB engine spec for Superset.
|
||||
|
||||
Uses PyMongoSQL (https://github.com/passren/PyMongoSQL) as the SQLAlchemy dialect
|
||||
to enable SQL queries on MongoDB collections.
|
||||
"""
|
||||
|
||||
from __future__ import annotations
|
||||
|
||||
from datetime import datetime
|
||||
from typing import Any, Optional
|
||||
|
||||
from sqlalchemy import types
|
||||
|
||||
from superset.constants import TimeGrain
|
||||
from superset.db_engine_specs.base import BaseEngineSpec, DatabaseCategory
|
||||
|
||||
|
||||
class MongoDBEngineSpec(BaseEngineSpec):
    """Superset engine spec for MongoDB, queried through the PyMongoSQL dialect.

    Declares the engine identity, the descriptive ``metadata`` shown for the
    database, the SQL templates used for time-grain bucketing, and the
    conversion of Python datetimes into SQL literals.
    """

    engine = "mongodb"
    engine_name = "MongoDB"
    force_column_alias_quotes = False

    # Descriptive information about the database: what it is, which package
    # provides the driver, and which connection-string shapes are supported.
    metadata = {
        "description": (
            "MongoDB is a document-oriented, operational NoSQL database."
        ),
        "logo": "mongodb.png",
        "homepage_url": "https://www.mongodb.com/",
        "categories": [
            DatabaseCategory.SEARCH_NOSQL,
            DatabaseCategory.PROPRIETARY,
        ],
        "pypi_packages": ["pymongosql"],
        "connection_string": (
            "mongodb://{username}:{password}@{host}:{port}/{database}"
            "?mode=superset"
        ),
        "parameters": {
            "username": "Username for MongoDB",
            "password": "Password for MongoDB",
            "host": "MongoDB host",
            "port": "MongoDB port",
            "database": "Database name",
        },
        "drivers": [
            {
                "name": "MongoDB Atlas Cloud",
                "pypi_package": "pymongosql",
                "connection_string": (
                    "mongodb+srv://{username}:{password}@{host}/{database}"
                    "?mode=superset"
                ),
                "notes": "For MongoDB Atlas cloud service.",
                "is_recommended": True,
            },
            {
                "name": "MongoDB Cluster",
                "pypi_package": "pymongosql",
                "connection_string": (
                    "mongodb://{username}:{password}@{host}:{port}/{database}"
                    "?mode=superset"
                ),
                "is_recommended": False,
                "notes": "For self-hosted MongoDB instances.",
            },
        ],
        "notes": "Uses PartiQL for SQL queries. Requires mode=superset parameter.",
        "docs_url": "https://github.com/passren/PyMongoSQL",
    }

    # SQL template per time grain; ``{col}`` is the placeholder for the
    # temporal column expression.
    # NOTE(review): the DATETIME/STRFTIME calls and modifier strings look like
    # SQLite-style date functions - presumably that is what PyMongoSQL's
    # ``mode=superset`` evaluates; confirm against the dialect.
    _time_grain_expressions = {
        None: "{col}",
        TimeGrain.SECOND: "DATETIME(STRFTIME('%Y-%m-%dT%H:%M:%S', {col}))",
        TimeGrain.MINUTE: "DATETIME(STRFTIME('%Y-%m-%dT%H:%M:00', {col}))",
        TimeGrain.HOUR: "DATETIME(STRFTIME('%Y-%m-%dT%H:00:00', {col}))",
        TimeGrain.DAY: "DATETIME({col}, 'start of day')",
        TimeGrain.WEEK: (
            "DATETIME({col}, 'start of day', "
            "-strftime('%w', {col}) || ' days')"
        ),
        TimeGrain.MONTH: "DATETIME({col}, 'start of month')",
        TimeGrain.QUARTER: (
            "DATETIME({col}, 'start of month', printf('-%d month', "
            "(strftime('%m', {col}) - 1) % 3))"
        ),
        TimeGrain.YEAR: "DATETIME({col}, 'start of year')",
        TimeGrain.WEEK_ENDING_SATURDAY: (
            "DATETIME({col}, 'start of day', 'weekday 6')"
        ),
        TimeGrain.WEEK_ENDING_SUNDAY: (
            "DATETIME({col}, 'start of day', 'weekday 0')"
        ),
        TimeGrain.WEEK_STARTING_SUNDAY: (
            "DATETIME({col}, 'start of day', 'weekday 0', '-7 days')"
        ),
        TimeGrain.WEEK_STARTING_MONDAY: (
            "DATETIME({col}, 'start of day', 'weekday 1', '-7 days')"
        ),
    }

    @classmethod
    def epoch_to_dttm(cls) -> str:
        """Return the SQL template that converts an epoch ``{col}`` to a datetime."""
        return "datetime({col}, 'unixepoch')"

    @classmethod
    def convert_dttm(
        cls,
        target_type: str,
        dttm: datetime,
        db_extra: Optional[dict[str, Any]] = None,
    ) -> Optional[str]:
        """Render ``dttm`` as a quoted SQL literal for ``target_type``.

        :param target_type: Column type name, resolved through
            ``get_sqla_column_type``.
        :param dttm: The datetime to render.
        :param db_extra: Accepted for interface compatibility; not used here.
        :returns: ``'YYYY-MM-DD HH:MM:SS'`` (quotes included, sub-second part
            dropped) when the resolved type is a string, datetime, date or
            timestamp type; ``None`` for any other or unresolved type.
        """
        resolved_type = cls.get_sqla_column_type(target_type)
        literal_types = (types.String, types.DateTime, types.Date, types.TIMESTAMP)

        if not isinstance(resolved_type, literal_types):
            return None

        # Space-separated date and time, truncated to whole seconds; repr()
        # supplies the surrounding quotes.
        return repr(dttm.isoformat(sep=" ", timespec="seconds"))
|
||||
125
tests/unit_tests/db_engine_specs/test_mongodb.py
Normal file
125
tests/unit_tests/db_engine_specs/test_mongodb.py
Normal file
@@ -0,0 +1,125 @@
|
||||
# Licensed to the Apache Software Foundation (ASF) under one
|
||||
# or more contributor license agreements. See the NOTICE file
|
||||
# distributed with this work for additional information
|
||||
# regarding copyright ownership. The ASF licenses this file
|
||||
# to you under the Apache License, Version 2.0 (the
|
||||
# "License"); you may not use this file except in compliance
|
||||
# with the License. You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing,
|
||||
# software distributed under the License is distributed on an
|
||||
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
||||
# KIND, either express or implied. See the License for the
|
||||
# specific language governing permissions and limitations
|
||||
# under the License.
|
||||
from datetime import datetime
|
||||
from typing import Optional
|
||||
|
||||
import pytest
|
||||
|
||||
from superset.constants import TimeGrain
|
||||
from tests.unit_tests.db_engine_specs.utils import assert_convert_dttm
|
||||
from tests.unit_tests.fixtures.common import dttm # noqa: F401
|
||||
|
||||
|
||||
@pytest.mark.parametrize(
    ("target_type", "expected_result"),
    [
        # Text-like and datetime-like type names, in several casings, are all
        # expected to produce the same quoted literal.
        *(
            (type_name, "'2019-01-02 03:04:05'")
            for type_name in (
                "text",
                "TEXT",
                "dateTime",
                "DateTime",
                "DATETIME",
                "string",
                "String",
                "STRING",
            )
        ),
        # Type names for which no literal is expected.
        *((type_name, None) for type_name in ("integer", "number", "unknowntype")),
    ],
)
def test_convert_dttm(
    target_type: str,
    expected_result: Optional[str],
    dttm: datetime,  # noqa: F811
) -> None:
    """Check the literal produced by ``convert_dttm`` for each column type name."""
    from superset.db_engine_specs.mongodb import MongoDBEngineSpec

    assert_convert_dttm(MongoDBEngineSpec, target_type, expected_result, dttm)
|
||||
|
||||
|
||||
def test_epoch_to_dttm() -> None:
    """Test the SQL template used for epoch to datetime conversion."""
    from superset.db_engine_specs.mongodb import (
        MongoDBEngineSpec as spec,  # noqa: N813
    )

    # The column is not passed through unchanged: the template wraps it in
    # datetime(..., 'unixepoch').
    assert spec.epoch_to_dttm() == "datetime({col}, 'unixepoch')"
|
||||
|
||||
|
||||
@pytest.mark.parametrize(
    ("grain", "expected_expression"),
    [
        (None, "{col}"),
        (TimeGrain.SECOND, "DATETIME(STRFTIME('%Y-%m-%dT%H:%M:%S', {col}))"),
        (TimeGrain.MINUTE, "DATETIME(STRFTIME('%Y-%m-%dT%H:%M:00', {col}))"),
        (TimeGrain.HOUR, "DATETIME(STRFTIME('%Y-%m-%dT%H:00:00', {col}))"),
        (TimeGrain.DAY, "DATETIME({col}, 'start of day')"),
        (
            TimeGrain.WEEK,
            "DATETIME({col}, 'start of day', "
            "-strftime('%w', {col}) || ' days')",
        ),
        (TimeGrain.MONTH, "DATETIME({col}, 'start of month')"),
        (
            TimeGrain.QUARTER,
            "DATETIME({col}, 'start of month', printf('-%d month', "
            "(strftime('%m', {col}) - 1) % 3))",
        ),
        (TimeGrain.YEAR, "DATETIME({col}, 'start of year')"),
        (
            TimeGrain.WEEK_ENDING_SATURDAY,
            "DATETIME({col}, 'start of day', 'weekday 6')",
        ),
        (
            TimeGrain.WEEK_ENDING_SUNDAY,
            "DATETIME({col}, 'start of day', 'weekday 0')",
        ),
        (
            TimeGrain.WEEK_STARTING_SUNDAY,
            "DATETIME({col}, 'start of day', 'weekday 0', '-7 days')",
        ),
        (
            TimeGrain.WEEK_STARTING_MONDAY,
            "DATETIME({col}, 'start of day', 'weekday 1', '-7 days')",
        ),
    ],
)
def test_time_grain_expressions(
    grain: Optional[TimeGrain],
    expected_expression: str,
) -> None:
    """Check the SQL template registered for each supported time grain."""
    from superset.db_engine_specs.mongodb import MongoDBEngineSpec

    # pylint: disable=protected-access
    assert MongoDBEngineSpec._time_grain_expressions.get(grain) == expected_expression
|
||||
|
||||
|
||||
def test_engine_metadata() -> None:
    """Check the identifying attributes declared on the MongoDB engine spec."""
    from superset.db_engine_specs.mongodb import MongoDBEngineSpec

    identity = (MongoDBEngineSpec.engine, MongoDBEngineSpec.engine_name)
    assert identity == ("mongodb", "MongoDB")
    assert MongoDBEngineSpec.force_column_alias_quotes is False
|
||||
Reference in New Issue
Block a user