diff --git a/README.md b/README.md
index 0cadd1ead..8c13452d1 100644
--- a/README.md
+++ b/README.md
@@ -122,6 +122,7 @@ Here are some of the major database solutions that are supported:
+
**A more comprehensive list of supported databases** along with the configuration instructions can be found [here](https://superset.apache.org/docs/databases/installing-database-drivers).
diff --git a/docs/docs/databases/installing-database-drivers.mdx b/docs/docs/databases/installing-database-drivers.mdx
index ee1b38533..86b1ecd19 100644
--- a/docs/docs/databases/installing-database-drivers.mdx
+++ b/docs/docs/databases/installing-database-drivers.mdx
@@ -52,6 +52,7 @@ A list of some of the recommended packages.
| [Trino](/docs/databases/trino) | `pip install trino` | `trino://{username}:{password}@{hostname}:{port}/{catalog}` |
| [Presto](/docs/databases/presto) | `pip install pyhive` | `presto://` |
| [SAP Hana](/docs/databases/hana) | `pip install hdbcli sqlalchemy-hana or pip install apache-superset[hana]` | `hana://{username}:{password}@{host}:{port}` |
+| [StarRocks](/docs/databases/starrocks) | `pip install starrocks` | `starrocks://:@:/.` |
| [Snowflake](/docs/databases/snowflake) | `pip install snowflake-sqlalchemy` | `snowflake://{user}:{password}@{account}.{region}/{database}?role={role}&warehouse={warehouse}` |
| SQLite | No additional library needed | `sqlite://` |
| [SQL Server](/docs/databases/sql-server) | `pip install pymssql` | `mssql+pymssql://` |
diff --git a/docs/docs/databases/starrocks.mdx b/docs/docs/databases/starrocks.mdx
new file mode 100644
index 000000000..9572437f4
--- /dev/null
+++ b/docs/docs/databases/starrocks.mdx
@@ -0,0 +1,26 @@
+---
+title: StarRocks
+hide_title: true
+sidebar_position: 5
+version: 1
+---
+
+## StarRocks
+
+The [sqlalchemy-starrocks](https://pypi.org/project/starrocks/) library is the recommended
+way to connect to StarRocks through SQLAlchemy.
+
+You'll need to the following setting values to form the connection string:
+
+- **User**: User Name
+- **Password**: DBPassword
+- **Host**: StarRocks FE Host
+- **Catalog**: Catalog Name
+- **Database**: Database Name
+- **Port**: StarRocks FE port
+
+Here's what the connection string looks like:
+
+```
+starrocks://:@:/.
+```
diff --git a/docs/src/resources/data.js b/docs/src/resources/data.js
index 49bc554a4..79b12017d 100644
--- a/docs/src/resources/data.js
+++ b/docs/src/resources/data.js
@@ -152,5 +152,10 @@ export const Databases = [
title: 'YugabyteDB',
href: "www.yugabyte.com",
imgName: 'yugabyte.png'
+ },
+ {
+ title: 'StarRocks',
+ href: "www.starrocks.io",
+ imgName: 'starrocks.png'
}
];
diff --git a/docs/static/img/databases/starrocks.png b/docs/static/img/databases/starrocks.png
new file mode 100644
index 000000000..6868371d7
Binary files /dev/null and b/docs/static/img/databases/starrocks.png differ
diff --git a/setup.py b/setup.py
index 6bad485f2..41f7e11e3 100644
--- a/setup.py
+++ b/setup.py
@@ -189,6 +189,7 @@ setup(
"thumbnails": ["Pillow>=9.5.0, <10.0.0"],
"vertica": ["sqlalchemy-vertica-python>=0.5.9, < 0.6"],
"netezza": ["nzalchemy>=11.0.2"],
+ "starrocks": ["starrocks>=1.0.0"],
},
python_requires="~=3.9",
author="Apache Software Foundation",
diff --git a/superset-frontend/src/assets/images/starrocks.png b/superset-frontend/src/assets/images/starrocks.png
new file mode 100644
index 000000000..6868371d7
Binary files /dev/null and b/superset-frontend/src/assets/images/starrocks.png differ
diff --git a/superset/db_engine_specs/starrocks.py b/superset/db_engine_specs/starrocks.py
new file mode 100644
index 000000000..f687fdbdb
--- /dev/null
+++ b/superset/db_engine_specs/starrocks.py
@@ -0,0 +1,222 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+import logging
+import re
+from typing import Any, Dict, List, Optional, Pattern, Tuple, Type
+from urllib import parse
+
+from flask_babel import gettext as __
+from sqlalchemy import Integer, Numeric, types
+from sqlalchemy.engine import Inspector
+from sqlalchemy.engine.result import Row as ResultRow
+from sqlalchemy.engine.url import URL
+from sqlalchemy.sql.type_api import TypeEngine
+
+from superset.db_engine_specs.mysql import MySQLEngineSpec
+from superset.errors import SupersetErrorType
+from superset.utils.core import GenericDataType
+
+# Regular expressions to catch custom errors
+CONNECTION_ACCESS_DENIED_REGEX = re.compile(
+ "Access denied for user '(?P.*?)'"
+)
+CONNECTION_UNKNOWN_DATABASE_REGEX = re.compile("Unknown database '(?P.*?)'")
+
+logger = logging.getLogger(__name__)
+
+
+class TINYINT(Integer): # pylint: disable=no-init
+ __visit_name__ = "TINYINT"
+
+
+class DOUBLE(Numeric): # pylint: disable=no-init
+ __visit_name__ = "DOUBLE"
+
+
+class ARRAY(TypeEngine): # pylint: disable=no-init
+ __visit_name__ = "ARRAY"
+
+ @property
+ def python_type(self) -> Optional[Type[List[Any]]]:
+ return list
+
+
+class MAP(TypeEngine): # pylint: disable=no-init
+ __visit_name__ = "MAP"
+
+ @property
+ def python_type(self) -> Optional[Type[Dict[Any, Any]]]:
+ return dict
+
+
+class STRUCT(TypeEngine): # pylint: disable=no-init
+ __visit_name__ = "STRUCT"
+
+ @property
+ def python_type(self) -> Optional[Type[Any]]:
+ return None
+
+
+class StarRocksEngineSpec(MySQLEngineSpec):
+ engine = "starrocks"
+ engine_name = "StarRocks"
+
+ default_driver = "starrocks"
+ sqlalchemy_uri_placeholder = (
+ "starrocks://user:password@host:port/catalog.db[?key=value&key=value...]"
+ )
+
+ column_type_mappings = ( # type: ignore
+ (
+ re.compile(r"^tinyint", re.IGNORECASE),
+ TINYINT(),
+ GenericDataType.NUMERIC,
+ ),
+ (
+ re.compile(r"^decimal.*", re.IGNORECASE),
+ types.DECIMAL(),
+ GenericDataType.NUMERIC,
+ ),
+ (
+ re.compile(r"^double", re.IGNORECASE),
+ DOUBLE(),
+ GenericDataType.NUMERIC,
+ ),
+ (
+ re.compile(r"^varchar(\((\d+)\))*$", re.IGNORECASE),
+ types.VARCHAR(),
+ GenericDataType.STRING,
+ ),
+ (
+ re.compile(r"^char(\((\d+)\))*$", re.IGNORECASE),
+ types.CHAR(),
+ GenericDataType.STRING,
+ ),
+ (
+ re.compile(r"^binary.*", re.IGNORECASE),
+ types.String(),
+ GenericDataType.STRING,
+ ),
+ (re.compile(r"^array.*", re.IGNORECASE), ARRAY(), GenericDataType.STRING),
+ (re.compile(r"^map.*", re.IGNORECASE), MAP(), GenericDataType.STRING),
+ (re.compile(r"^struct.*", re.IGNORECASE), STRUCT(), GenericDataType.STRING),
+ )
+
+ custom_errors: Dict[Pattern[str], Tuple[str, SupersetErrorType, Dict[str, Any]]] = {
+ CONNECTION_ACCESS_DENIED_REGEX: (
+ __('Either the username "%(username)s" or the password is incorrect.'),
+ SupersetErrorType.CONNECTION_ACCESS_DENIED_ERROR,
+ {"invalid": ["username", "password"]},
+ ),
+ CONNECTION_UNKNOWN_DATABASE_REGEX: (
+ __('Unable to connect to database "%(database)s".'),
+ SupersetErrorType.CONNECTION_UNKNOWN_DATABASE_ERROR,
+ {"invalid": ["database"]},
+ ),
+ }
+
+ @classmethod
+ def adjust_engine_params(
+ cls,
+ uri: URL,
+ connect_args: Dict[str, Any],
+ catalog: Optional[str] = None,
+ schema: Optional[str] = None,
+ ) -> Tuple[URL, Dict[str, Any]]:
+ database = uri.database
+ if schema and database:
+ schema = parse.quote(schema, safe="")
+ if "." in database:
+ database = database.split(".")[0] + "." + schema
+ else:
+ database += "." + schema
+ uri = uri.set(database=database)
+
+ return uri, connect_args
+
+ @classmethod
+ def get_columns(
+ cls, inspector: Inspector, table_name: str, schema: Optional[str]
+ ) -> List[Dict[str, Any]]:
+ columns = cls._show_columns(inspector, table_name, schema)
+ result: List[Dict[str, Any]] = []
+ for column in columns:
+ column_spec = cls.get_column_spec(column.Type)
+ column_type = column_spec.sqla_type if column_spec else None
+ if column_type is None:
+ column_type = types.String()
+ logger.info(
+ "Did not recognize starrocks type %s of column %s",
+ str(column.Type),
+ str(column.Field),
+ )
+ column_info = cls._create_column_info(column.Field, column_type)
+ column_info["nullable"] = getattr(column, "Null", True)
+ column_info["default"] = None
+ result.append(column_info)
+ return result
+
+ @classmethod
+ def _show_columns(
+ cls, inspector: Inspector, table_name: str, schema: Optional[str]
+ ) -> List[ResultRow]:
+ """
+ Show starrocks column names
+ :param inspector: object that performs database schema inspection
+ :param table_name: table name
+ :param schema: schema name
+ :return: list of column objects
+ """
+ quote = inspector.engine.dialect.identifier_preparer.quote_identifier
+ full_table = quote(table_name)
+ if schema:
+ full_table = "{}.{}".format(quote(schema), full_table)
+ return inspector.bind.execute(f"SHOW COLUMNS FROM {full_table}").fetchall()
+
+ @classmethod
+ def _create_column_info(
+ cls, name: str, data_type: types.TypeEngine
+ ) -> Dict[str, Any]:
+ """
+ Create column info object
+ :param name: column name
+ :param data_type: column data type
+ :return: column info object
+ """
+ return {"name": name, "type": f"{data_type}"}
+
+ @classmethod
+ def get_schema_from_engine_params(
+ cls,
+ sqlalchemy_uri: URL,
+ connect_args: Dict[str, Any],
+ ) -> Optional[str]:
+ """
+ Return the configured schema.
+
+ For StarRocks the SQLAlchemy URI looks like this:
+
+ starrocks://localhost:9030/catalog.schema
+
+ """
+ database = sqlalchemy_uri.database.strip("/")
+
+ if "." not in database:
+ return None
+
+ return parse.unquote(database.split(".")[1])
diff --git a/tests/unit_tests/db_engine_specs/test_starrocks.py b/tests/unit_tests/db_engine_specs/test_starrocks.py
new file mode 100644
index 000000000..7812a1683
--- /dev/null
+++ b/tests/unit_tests/db_engine_specs/test_starrocks.py
@@ -0,0 +1,111 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+from typing import Any, Dict, Optional, Type
+
+import pytest
+from sqlalchemy import types
+from sqlalchemy.engine.url import make_url
+
+from superset.db_engine_specs.starrocks import ARRAY, DOUBLE, MAP, STRUCT, TINYINT
+from superset.utils.core import GenericDataType
+from tests.unit_tests.db_engine_specs.utils import assert_column_spec
+
+
+@pytest.mark.parametrize(
+ "native_type,sqla_type,attrs,generic_type,is_dttm",
+ [
+ # Numeric
+ ("TINYINT", TINYINT, None, GenericDataType.NUMERIC, False),
+ ("DECIMAL", types.DECIMAL, None, GenericDataType.NUMERIC, False),
+ ("DOUBLE", DOUBLE, None, GenericDataType.NUMERIC, False),
+ # String
+ ("CHAR", types.CHAR, None, GenericDataType.STRING, False),
+ ("VARCHAR", types.VARCHAR, None, GenericDataType.STRING, False),
+ ("BINARY", types.String, None, GenericDataType.STRING, False),
+ # Complex type
+ ("ARRAY", ARRAY, None, GenericDataType.STRING, False),
+ ("MAP", MAP, None, GenericDataType.STRING, False),
+ ("STRUCT", STRUCT, None, GenericDataType.STRING, False),
+ ],
+)
+def test_get_column_spec(
+ native_type: str,
+ sqla_type: Type[types.TypeEngine],
+ attrs: Optional[Dict[str, Any]],
+ generic_type: GenericDataType,
+ is_dttm: bool,
+) -> None:
+ from superset.db_engine_specs.starrocks import StarRocksEngineSpec as spec
+
+ assert_column_spec(spec, native_type, sqla_type, attrs, generic_type, is_dttm)
+
+
+@pytest.mark.parametrize(
+ "sqlalchemy_uri,connect_args,return_schema,return_connect_args",
+ [
+ (
+ "starrocks://user:password@host/db1",
+ {"param1": "some_value"},
+ "db1",
+ {"param1": "some_value"},
+ ),
+ (
+ "starrocks://user:password@host/catalog1.db1",
+ {"param1": "some_value"},
+ "catalog1.db1",
+ {"param1": "some_value"},
+ ),
+ ],
+)
+def test_adjust_engine_params(
+ sqlalchemy_uri: str,
+ connect_args: Dict[str, Any],
+ return_schema: str,
+ return_connect_args: Dict[str, Any],
+) -> None:
+ from superset.db_engine_specs.starrocks import StarRocksEngineSpec
+
+ url = make_url(sqlalchemy_uri)
+ returned_url, returned_connect_args = StarRocksEngineSpec.adjust_engine_params(
+ url, connect_args
+ )
+ assert returned_url.database == return_schema
+ assert returned_connect_args == return_connect_args
+
+
+def test_get_schema_from_engine_params() -> None:
+ """
+ Test the ``get_schema_from_engine_params`` method.
+ """
+ from superset.db_engine_specs.starrocks import StarRocksEngineSpec
+
+ assert (
+ StarRocksEngineSpec.get_schema_from_engine_params(
+ make_url("starrocks://localhost:9030/hive.default"),
+ {},
+ )
+ == "default"
+ )
+
+ assert (
+ StarRocksEngineSpec.get_schema_from_engine_params(
+ make_url("starrocks://localhost:9030/hive"),
+ {},
+ )
+ is None
+ )