Copilot commented on code in PR #37368: URL: https://github.com/apache/superset/pull/37368#discussion_r2728760515
########## superset/db_engine_specs/mongodb.py: ########## @@ -0,0 +1,125 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. +"""MongoDB engine spec for Superset. + +Uses PyMongoSQL (https://github.com/passren/PyMongoSQL) as the SQLAlchemy dialect +to enable SQL queries on MongoDB collections. 
+""" + +from __future__ import annotations + +from datetime import datetime +from typing import Any, Optional + +from sqlalchemy import types + +from superset.constants import TimeGrain +from superset.db_engine_specs.base import BaseEngineSpec, DatabaseCategory + + +class MongoDBEngineSpec(BaseEngineSpec): + """Engine spec for MongoDB using PyMongoSQL dialect.""" + + engine = "mongodb" + engine_name = "MongoDB" + force_column_alias_quotes = False + + metadata = { + "description": ("MongoDB is a document-oriented, operational NoSQL database."), + "logo": "mongodb.png", + "homepage_url": "https://www.mongodb.com/", + "categories": [ + DatabaseCategory.SEARCH_NOSQL, + DatabaseCategory.PROPRIETARY, + ], + "pypi_packages": ["pymongosql"], + "connection_string": ( + "mongodb://{username}:{password}@{host}:{port}/{database}?mode=superset" + ), + "parameters": { + "username": "Username for MongoDB", + "password": "Password for MongoDB", + "host": "MongoDB host", + "port": "MongoDB port", + "database": "Database name", + }, + "drivers": [ + { + "name": "MongoDB Atlas Cloud", + "pypi_package": "pymongosql", + "connection_string": "mongodb+srv://{username}:{password}@{host}/{database}?mode=superset", + "notes": "For MongoDB Atlas cloud service.", + "is_recommended": True, + }, + { + "name": "MongoDB Cluster", + "pypi_package": "pymongosql", + "connection_string": "mongodb://{username}:{password}@{host}:{port}/{database}?mode=superset", + "is_recommended": False, + "notes": ("For self-hosted MongoDB instances."), + }, + ], + "notes": "Uses PartiQL for SQL queries. 
Requires mode=superset parameter.", + "docs_url": "https://github.com/passren/PyMongoSQL", + } + + _time_grain_expressions = { + None: "{col}", + TimeGrain.SECOND: "DATETIME(STRFTIME('%Y-%m-%dT%H:%M:%S', {col}))", + TimeGrain.MINUTE: "DATETIME(STRFTIME('%Y-%m-%dT%H:%M:00', {col}))", + TimeGrain.HOUR: "DATETIME(STRFTIME('%Y-%m-%dT%H:00:00', {col}))", + TimeGrain.DAY: "DATETIME({col}, 'start of day')", + TimeGrain.WEEK: ( + "DATETIME({col}, 'start of day', -strftime('%w', {col}) || ' days')" + ), + TimeGrain.MONTH: "DATETIME({col}, 'start of month')", + TimeGrain.QUARTER: ( + "DATETIME({col}, 'start of month', " + "printf('-%d month', (strftime('%m', {col}) - 1) % 3))" + ), + TimeGrain.YEAR: "DATETIME({col}, 'start of year')", + TimeGrain.WEEK_ENDING_SATURDAY: "DATETIME({col}, 'start of day', 'weekday 6')", + TimeGrain.WEEK_ENDING_SUNDAY: "DATETIME({col}, 'start of day', 'weekday 0')", + TimeGrain.WEEK_STARTING_SUNDAY: ( + "DATETIME({col}, 'start of day', 'weekday 0', '-7 days')" + ), + TimeGrain.WEEK_STARTING_MONDAY: ( + "DATETIME({col}, 'start of day', 'weekday 1', '-7 days')" + ), + } + + @classmethod + def epoch_to_dttm(cls) -> str: + return "datetime({col}, 'unixepoch')" + + @classmethod + def convert_dttm( + cls, + target_type: str, + dttm: datetime, + db_extra: Optional[dict[str, Any]] = None, + ) -> Optional[str]: + """Convert Python datetime to MongoDB/SQL datetime string.""" + sqla_type = cls.get_sqla_column_type(target_type) + + if isinstance( + sqla_type, (types.String, types.DateTime, types.Date, types.TIMESTAMP) + ): + # Return ISO format datetime string for MongoDB compatibility + return f"""{dttm.isoformat(sep=" ", timespec="seconds")!r}""" Review Comment: The use of `!r` for string formatting is inconsistent with the established pattern in other engine specs. All other engine specs in the codebase explicitly wrap the ISO format string with quotes (e.g., `f"""'{dttm.isoformat(...)}'"""`) rather than using the repr approach. 
While functionally equivalent, the explicit quote approach is more consistent with patterns seen in DynamoDB (line 90), SQLite (line 135), CockroachDB (line 54), and others. Consider changing to match the established convention. ########## tests/unit_tests/db_engine_specs/test_mongodb.py: ########## @@ -0,0 +1,125 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+from datetime import datetime +from typing import Optional + +import pytest + +from superset.constants import TimeGrain +from tests.unit_tests.db_engine_specs.utils import assert_convert_dttm +from tests.unit_tests.fixtures.common import dttm # noqa: F401 + + +@pytest.mark.parametrize( + "target_type,expected_result", + [ + ("text", "'2019-01-02 03:04:05'"), + ("TEXT", "'2019-01-02 03:04:05'"), + ("dateTime", "'2019-01-02 03:04:05'"), + ("DateTime", "'2019-01-02 03:04:05'"), + ("DATETIME", "'2019-01-02 03:04:05'"), + ("string", "'2019-01-02 03:04:05'"), + ("String", "'2019-01-02 03:04:05'"), + ("STRING", "'2019-01-02 03:04:05'"), + ("integer", None), + ("number", None), + ("unknowntype", None), + ], Review Comment: The test_convert_dttm function doesn't include test cases for "date" and "timestamp" target types, even though the convert_dttm implementation explicitly handles types.Date and types.TIMESTAMP (line 120 in mongodb.py). Consider adding test cases like ("date", "'2019-01-02 03:04:05'") and ("timestamp", "'2019-01-02 03:04:05'") to ensure these type conversions are properly validated. ########## superset/db_engine_specs/mongodb.py: ########## @@ -0,0 +1,125 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. 
+"""MongoDB engine spec for Superset. + +Uses PyMongoSQL (https://github.com/passren/PyMongoSQL) as the SQLAlchemy dialect +to enable SQL queries on MongoDB collections. +""" + +from __future__ import annotations + +from datetime import datetime +from typing import Any, Optional + +from sqlalchemy import types + +from superset.constants import TimeGrain +from superset.db_engine_specs.base import BaseEngineSpec, DatabaseCategory + + +class MongoDBEngineSpec(BaseEngineSpec): + """Engine spec for MongoDB using PyMongoSQL dialect.""" + + engine = "mongodb" + engine_name = "MongoDB" + force_column_alias_quotes = False + + metadata = { + "description": ("MongoDB is a document-oriented, operational NoSQL database."), + "logo": "mongodb.png", + "homepage_url": "https://www.mongodb.com/", + "categories": [ + DatabaseCategory.SEARCH_NOSQL, + DatabaseCategory.PROPRIETARY, + ], + "pypi_packages": ["pymongosql"], + "connection_string": ( + "mongodb://{username}:{password}@{host}:{port}/{database}?mode=superset" + ), + "parameters": { + "username": "Username for MongoDB", + "password": "Password for MongoDB", + "host": "MongoDB host", + "port": "MongoDB port", + "database": "Database name", + }, + "drivers": [ + { + "name": "MongoDB Atlas Cloud", + "pypi_package": "pymongosql", + "connection_string": "mongodb+srv://{username}:{password}@{host}/{database}?mode=superset", + "notes": "For MongoDB Atlas cloud service.", + "is_recommended": True, + }, + { + "name": "MongoDB Cluster", + "pypi_package": "pymongosql", + "connection_string": "mongodb://{username}:{password}@{host}:{port}/{database}?mode=superset", + "is_recommended": False, + "notes": ("For self-hosted MongoDB instances."), + }, + ], + "notes": "Uses PartiQL for SQL queries. Requires mode=superset parameter.", Review Comment: The metadata notes incorrectly reference "PartiQL" which is specific to DynamoDB/AWS, not MongoDB. MongoDB uses its own SQL-like query language through PyMongoSQL. 
This should be corrected to accurately describe the SQL dialect or querying mechanism used by PyMongoSQL for MongoDB. ```suggestion "notes": "Uses PyMongoSQL to enable SQL-like queries on MongoDB collections. Requires mode=superset parameter.", ``` -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: [email protected] For queries about this service, please contact Infrastructure at: [email protected] --------------------------------------------------------------------- To unsubscribe, e-mail: [email protected] For additional commands, e-mail: [email protected]
