From 25636ded0b9deb03cc9ec6ef3ab425d830540d2f Mon Sep 17 00:00:00 2001
From: eric wang <e.wang@databricks.com>
Date: Wed, 14 Aug 2024 11:22:05 -0700
Subject: [PATCH 01/17] bump python sdk version

---
 dbt/adapters/databricks/api_client.py        |    6 +-
 dbt/adapters/databricks/auth.py              |  106 --
 dbt/adapters/databricks/connections.py       |   16 +-
 dbt/adapters/databricks/credentials.py       |  277 ++---
 requirements.txt                             |    2 +-
 setup.py                                     |    2 +-
 tests/unit/python/test_python_submissions.py |   10 +-
 tests/unit/test_adapter.py                   | 1086 +-----------------
 tests/unit/test_auth.py                      |    2 +-
 tests/unit/test_compute_config.py            |    5 +-
 tests/unit/test_idle_config.py               |   12 +-
 11 files changed, 186 insertions(+), 1338 deletions(-)
 delete mode 100644 dbt/adapters/databricks/auth.py

diff --git a/dbt/adapters/databricks/api_client.py b/dbt/adapters/databricks/api_client.py
index 7928880e7..fa477f655 100644
--- a/dbt/adapters/databricks/api_client.py
+++ b/dbt/adapters/databricks/api_client.py
@@ -11,7 +11,7 @@
 
 from dbt.adapters.databricks import utils
 from dbt.adapters.databricks.__version__ import version
-from dbt.adapters.databricks.auth import BearerAuth
+from dbt.adapters.databricks.credentials import BearerAuth
 from dbt.adapters.databricks.credentials import DatabricksCredentials
 from dbt.adapters.databricks.logging import logger
 from dbt_common.exceptions import DbtRuntimeError
@@ -396,8 +396,8 @@ def create(
         http_headers = credentials.get_all_http_headers(
             connection_parameters.pop("http_headers", {})
         )
-        credentials_provider = credentials.authenticate(None)
-        header_factory = credentials_provider(None)  # type: ignore
+        credentials_provider = credentials.authenticate().credentials_provider
+        header_factory = credentials_provider()  # type: ignore
         session.auth = BearerAuth(header_factory)
 
         session.headers.update({"User-Agent": user_agent, **http_headers})
diff --git a/dbt/adapters/databricks/auth.py b/dbt/adapters/databricks/auth.py
deleted file mode 100644
index 51d894e05..000000000
--- a/dbt/adapters/databricks/auth.py
+++ /dev/null
@@ -1,106 +0,0 @@
-from typing import Any
-from typing import Dict
-from typing import Optional
-
-from databricks.sdk.core import Config
-from databricks.sdk.core import credentials_provider
-from databricks.sdk.core import CredentialsProvider
-from databricks.sdk.core import HeaderFactory
-from databricks.sdk.oauth import ClientCredentials
-from databricks.sdk.oauth import Token
-from databricks.sdk.oauth import TokenSource
-from requests import PreparedRequest
-from requests.auth import AuthBase
-
-
-class token_auth(CredentialsProvider):
-    _token: str
-
-    def __init__(self, token: str) -> None:
-        self._token = token
-
-    def auth_type(self) -> str:
-        return "token"
-
-    def as_dict(self) -> dict:
-        return {"token": self._token}
-
-    @staticmethod
-    def from_dict(raw: Optional[dict]) -> Optional[CredentialsProvider]:
-        if not raw:
-            return None
-        return token_auth(raw["token"])
-
-    def __call__(self, _: Optional[Config] = None) -> HeaderFactory:
-        static_credentials = {"Authorization": f"Bearer {self._token}"}
-
-        def inner() -> Dict[str, str]:
-            return static_credentials
-
-        return inner
-
-
-class m2m_auth(CredentialsProvider):
-    _token_source: Optional[TokenSource] = None
-
-    def __init__(self, host: str, client_id: str, client_secret: str) -> None:
-        @credentials_provider("noop", [])
-        def noop_credentials(_: Any):  # type: ignore
-            return lambda: {}
-
-        config = Config(host=host, credentials_provider=noop_credentials)
-        oidc = config.oidc_endpoints
-        scopes = ["all-apis"]
-        if not oidc:
-            raise ValueError(f"{host} does not support OAuth")
-        if config.is_azure:
-            # Azure AD only supports full access to Azure Databricks.
-            scopes = [f"{config.effective_azure_login_app_id}/.default"]
-        self._token_source = ClientCredentials(
-            client_id=client_id,
-            client_secret=client_secret,
-            token_url=oidc.token_endpoint,
-            scopes=scopes,
-            use_header="microsoft" not in oidc.token_endpoint,
-            use_params="microsoft" in oidc.token_endpoint,
-        )
-
-    def auth_type(self) -> str:
-        return "oauth"
-
-    def as_dict(self) -> dict:
-        if self._token_source:
-            return {"token": self._token_source.token().as_dict()}
-        else:
-            return {"token": {}}
-
-    @staticmethod
-    def from_dict(host: str, client_id: str, client_secret: str, raw: dict) -> CredentialsProvider:
-        c = m2m_auth(host=host, client_id=client_id, client_secret=client_secret)
-        c._token_source._token = Token.from_dict(raw["token"])  # type: ignore
-        return c
-
-    def __call__(self, _: Optional[Config] = None) -> HeaderFactory:
-        def inner() -> Dict[str, str]:
-            token = self._token_source.token()  # type: ignore
-            return {"Authorization": f"{token.token_type} {token.access_token}"}
-
-        return inner
-
-
-class BearerAuth(AuthBase):
-    """This mix-in is passed to our requests Session to explicitly
-    use the bearer authentication method.
-
-    Without this, a local .netrc file in the user's home directory
-    will override the auth headers provided by our header_factory.
-
-    More details in issue #337.
-    """
-
-    def __init__(self, header_factory: HeaderFactory):
-        self.header_factory = header_factory
-
-    def __call__(self, r: PreparedRequest) -> PreparedRequest:
-        r.headers.update(**self.header_factory())
-        return r
diff --git a/dbt/adapters/databricks/connections.py b/dbt/adapters/databricks/connections.py
index 204db3923..200672c01 100644
--- a/dbt/adapters/databricks/connections.py
+++ b/dbt/adapters/databricks/connections.py
@@ -36,9 +36,9 @@
 from dbt.adapters.contracts.connection import LazyHandle
 from dbt.adapters.databricks.__version__ import version as __version__
 from dbt.adapters.databricks.api_client import DatabricksApiClient
-from dbt.adapters.databricks.auth import BearerAuth
+from dbt.adapters.databricks.credentials import BearerAuth
+from dbt.adapters.databricks.credentials import DatabricksCredentialManager
 from dbt.adapters.databricks.credentials import DatabricksCredentials
-from dbt.adapters.databricks.credentials import TCredentialProvider
 from dbt.adapters.databricks.events.connection_events import ConnectionAcquire
 from dbt.adapters.databricks.events.connection_events import ConnectionCancel
 from dbt.adapters.databricks.events.connection_events import ConnectionCancelError
@@ -475,7 +475,7 @@ def _reset_handle(self, open: Callable[[Connection], Connection]) -> None:
 
 class DatabricksConnectionManager(SparkConnectionManager):
     TYPE: str = "databricks"
-    credentials_provider: Optional[TCredentialProvider] = None
+    credentials_manager: Optional[DatabricksCredentialManager] = None
     _user_agent = f"dbt-databricks/{__version__}"
 
     def cancel_open(self) -> List[str]:
@@ -725,7 +725,7 @@ def _open(cls, connection: Connection, query_header_context: Any = None) -> Conn
         timeout = creds.connect_timeout
 
         # gotta keep this so we don't prompt users many times
-        cls.credentials_provider = creds.authenticate(cls.credentials_provider)
+        cls.credentials_manager = creds.authenticate()
 
         invocation_env = creds.get_invocation_env()
         user_agent_entry = cls._user_agent
@@ -743,12 +743,13 @@ def _open(cls, connection: Connection, query_header_context: Any = None) -> Conn
         http_path = _get_http_path(query_header_context, creds)
 
         def connect() -> DatabricksSQLConnectionWrapper:
+            assert cls.credentials_manager is not None
             try:
                 # TODO: what is the error when a user specifies a catalog they don't have access to
                 conn: DatabricksSQLConnection = dbsql.connect(
                     server_hostname=creds.host,
                     http_path=http_path,
-                    credentials_provider=cls.credentials_provider,
+                    credentials_provider=cls.credentials_manager.credentials_provider,
                     http_headers=http_headers if http_headers else None,
                     session_configuration=creds.session_properties,
                     catalog=creds.database,
@@ -1018,7 +1019,7 @@ def open(cls, connection: Connection) -> Connection:
         timeout = creds.connect_timeout
 
         # gotta keep this so we don't prompt users many times
-        cls.credentials_provider = creds.authenticate(cls.credentials_provider)
+        cls.credentials_manager = creds.authenticate()
 
         invocation_env = creds.get_invocation_env()
         user_agent_entry = cls._user_agent
@@ -1036,12 +1037,13 @@ def open(cls, connection: Connection) -> Connection:
         http_path = databricks_connection.http_path
 
         def connect() -> DatabricksSQLConnectionWrapper:
+            assert cls.credentials_manager is not None
             try:
                 # TODO: what is the error when a user specifies a catalog they don't have access to
                 conn = dbsql.connect(
                     server_hostname=creds.host,
                     http_path=http_path,
-                    credentials_provider=cls.credentials_provider,
+                    credentials_provider=cls.credentials_manager.credentials_provider,
                     http_headers=http_headers if http_headers else None,
                     session_configuration=creds.session_properties,
                     catalog=creds.database,
diff --git a/dbt/adapters/databricks/credentials.py b/dbt/adapters/databricks/credentials.py
index e8897d40b..60da45374 100644
--- a/dbt/adapters/databricks/credentials.py
+++ b/dbt/adapters/databricks/credentials.py
@@ -4,28 +4,26 @@
 import re
 import threading
 from dataclasses import dataclass
+from dataclasses import field
 from typing import Any
+from typing import Callable
 from typing import cast
 from typing import Dict
 from typing import Iterable
 from typing import List
 from typing import Optional
 from typing import Tuple
-from typing import Union
 
-import keyring
-from databricks.sdk.core import CredentialsProvider
-from databricks.sdk.oauth import OAuthClient
-from databricks.sdk.oauth import SessionCredentials
+from databricks.sdk import WorkspaceClient
+from databricks.sdk.core import Config
+from databricks.sdk.credentials_provider import CredentialsProvider
 from dbt.adapters.contracts.connection import Credentials
-from dbt.adapters.databricks.auth import m2m_auth
-from dbt.adapters.databricks.auth import token_auth
-from dbt.adapters.databricks.events.credential_events import CredentialLoadError
-from dbt.adapters.databricks.events.credential_events import CredentialSaveError
-from dbt.adapters.databricks.events.credential_events import CredentialShardEvent
-from dbt.adapters.databricks.logging import logger
 from dbt_common.exceptions import DbtConfigError
 from dbt_common.exceptions import DbtValidationError
+from mashumaro import DataClassDictMixin
+from requests import PreparedRequest
+from requests.auth import AuthBase
+from dbt.adapters.databricks.logging import logger
 
 CATALOG_KEY_IN_SESSION_PROPERTIES = "databricks.catalog"
 DBT_DATABRICKS_INVOCATION_ENV = "DBT_DATABRICKS_INVOCATION_ENV"
@@ -42,8 +40,6 @@
 # also expire after 24h. Silently accept this in this case.
 SPA_CLIENT_FIXED_TIME_LIMIT_ERROR = "AADSTS700084"
 
-TCredentialProvider = Union[CredentialsProvider, SessionCredentials]
-
 
 @dataclass
 class DatabricksCredentials(Credentials):
@@ -69,7 +65,7 @@ class DatabricksCredentials(Credentials):
     retry_all: bool = False
     connect_max_idle: Optional[int] = None
 
-    _credentials_provider: Optional[Dict[str, Any]] = None
+    _credentials_manager: Optional["DatabricksCredentialManager"] = None
     _lock = threading.Lock()  # to avoid concurrent auth
 
     _ALIASES = {
@@ -138,6 +134,7 @@ def __post_init__(self) -> None:
         if "_socket_timeout" not in connection_parameters:
             connection_parameters["_socket_timeout"] = 600
         self.connection_parameters = connection_parameters
+        self._credentials_manager = DatabricksCredentialManager.create_from(self)
 
     def validate_creds(self) -> None:
         for key in ["host", "http_path"]:
@@ -244,181 +241,97 @@ def extract_cluster_id(cls, http_path: str) -> Optional[str]:
     def cluster_id(self) -> Optional[str]:
         return self.extract_cluster_id(self.http_path)  # type: ignore[arg-type]
 
-    def authenticate(self, in_provider: Optional[TCredentialProvider]) -> TCredentialProvider:
+    def authenticate(self) -> "DatabricksCredentialManager":
         self.validate_creds()
-        host: str = self.host or ""
-        if self._credentials_provider:
-            return self._provider_from_dict()  # type: ignore
-        if in_provider:
-            if isinstance(in_provider, m2m_auth) or isinstance(in_provider, token_auth):
-                self._credentials_provider = in_provider.as_dict()
-            return in_provider
-
-        provider: TCredentialProvider
-        # dbt will spin up multiple threads. This has to be sync. So lock here
-        self._lock.acquire()
-        try:
-            if self.token:
-                provider = token_auth(self.token)
-                self._credentials_provider = provider.as_dict()
-                return provider
-
-            if self.client_id and self.client_secret:
-                provider = m2m_auth(
-                    host=host,
-                    client_id=self.client_id or "",
-                    client_secret=self.client_secret or "",
-                )
-                self._credentials_provider = provider.as_dict()
-                return provider
-
-            client_id = self.client_id or CLIENT_ID
-
-            if client_id == "dbt-databricks":
-                # This is the temp code to make client id dbt-databricks work with server,
-                # currently the redirect url and scope for client dbt-databricks are fixed
-                # values as below. It can be removed after Databricks extends dbt-databricks
-                # scope to all-apis
-                redirect_url = "http://localhost:8050"
-                scopes = ["sql", "offline_access"]
-            else:
-                redirect_url = self.oauth_redirect_url or REDIRECT_URL
-                scopes = self.oauth_scopes or SCOPES
-
-            oauth_client = OAuthClient(
-                host=host,
-                client_id=client_id,
-                client_secret="",
-                redirect_url=redirect_url,
-                scopes=scopes,
-            )
-            # optional branch. Try and keep going if it does not work
-            try:
-                # try to get cached credentials
-                credsdict = self.get_sharded_password("dbt-databricks", host)
-
-                if credsdict:
-                    provider = SessionCredentials.from_dict(oauth_client, json.loads(credsdict))
-                    # if refresh token is expired, this will throw
-                    try:
-                        if provider.token().valid:
-                            self._credentials_provider = provider.as_dict()
-                            if json.loads(credsdict) != provider.as_dict():
-                                # if the provider dict has changed, most likely because of a token
-                                # refresh, save it for further use
-                                self.set_sharded_password(
-                                    "dbt-databricks", host, json.dumps(self._credentials_provider)
-                                )
-                            return provider
-                    except Exception as e:
-                        # SPA token are supposed to expire after 24h, no need to warn
-                        if SPA_CLIENT_FIXED_TIME_LIMIT_ERROR in str(e):
-                            logger.debug(CredentialLoadError(e))
-                        else:
-                            logger.warning(CredentialLoadError(e))
-                        # whatever it is, get rid of the cache
-                        self.delete_sharded_password("dbt-databricks", host)
-
-            # error with keyring. Maybe machine has no password persistency
-            except Exception as e:
-                logger.warning(CredentialLoadError(e))
-
-            # no token, go fetch one
-            consent = oauth_client.initiate_consent()
-
-            provider = consent.launch_external_browser()
-            # save for later
-            self._credentials_provider = provider.as_dict()
-            try:
-                self.set_sharded_password(
-                    "dbt-databricks", host, json.dumps(self._credentials_provider)
-                )
-            # error with keyring. Maybe machine has no password persistency
-            except Exception as e:
-                logger.warning(CredentialSaveError(e))
+        assert self._credentials_manager is not None, "Credentials manager is not set."
+        return self._credentials_manager
 
-            return provider
 
-        finally:
-            self._lock.release()
+class BearerAuth(AuthBase):
+    """This mix-in is passed to our requests Session to explicitly
+    use the bearer authentication method.
 
-    def set_sharded_password(self, service_name: str, username: str, password: str) -> None:
-        max_size = MAX_NT_PASSWORD_SIZE
+    Without this, a local .netrc file in the user's home directory
+    will override the auth headers provided by our header_factory.
 
-        # if not Windows or "small" password, stick to the default
-        if os.name != "nt" or len(password) < max_size:
-            keyring.set_password(service_name, username, password)
-        else:
-            logger.debug(CredentialShardEvent(len(password)))
-
-            password_shards = [
-                password[i : i + max_size] for i in range(0, len(password), max_size)
-            ]
-            shard_info = {
-                "sharded_password": True,
-                "shard_count": len(password_shards),
-            }
+    More details in issue #337.
+    """
+
+    def __init__(self, header_factory: CredentialsProvider):
+        self.header_factory = header_factory
+
+    def __call__(self, r: PreparedRequest) -> PreparedRequest:
+        r.headers.update(**self.header_factory())
+        return r
+
+
+PySQLCredentialProvider = Callable[[], Callable[[], Dict[str, str]]]
+
+
+@dataclass
+class DatabricksCredentialManager(DataClassDictMixin):
+    host: str
+    client_id: str
+    client_secret: str
+    oauth_redirect_url: str = REDIRECT_URL
+    oauth_scopes: List[str] = field(default_factory=lambda: SCOPES)
+    token: Optional[str] = None
+    auth_type: Optional[str] = None
 
-            # store the "shard info" as the "base" password
-            keyring.set_password(service_name, username, json.dumps(shard_info))
-            # then store all shards with the shard number as postfix
-            for i, s in enumerate(password_shards):
-                keyring.set_password(service_name, f"{username}__{i}", s)
-
-    def get_sharded_password(self, service_name: str, username: str) -> Optional[str]:
-        password = keyring.get_password(service_name, username)
-
-        # check for "shard info" stored as json
-        try:
-            password_as_dict = json.loads(str(password))
-            if password_as_dict.get("sharded_password"):
-                # if password was stored shared, reconstruct it
-                shard_count = int(password_as_dict.get("shard_count"))
-
-                password = ""
-                for i in range(shard_count):
-                    password += str(keyring.get_password(service_name, f"{username}__{i}"))
-        except ValueError:
-            pass
-
-        return password
-
-    def delete_sharded_password(self, service_name: str, username: str) -> None:
-        password = keyring.get_password(service_name, username)
-
-        # check for "shard info" stored as json. If so delete all shards
-        try:
-            password_as_dict = json.loads(str(password))
-            if password_as_dict.get("sharded_password"):
-                shard_count = int(password_as_dict.get("shard_count"))
-                for i in range(shard_count):
-                    keyring.delete_password(service_name, f"{username}__{i}")
-        except ValueError:
-            pass
-
-        # delete "base" password
-        keyring.delete_password(service_name, username)
-
-    def _provider_from_dict(self) -> Optional[TCredentialProvider]:
+    @classmethod
+    def create_from(cls, credentials: DatabricksCredentials) -> "DatabricksCredentialManager":
+        return DatabricksCredentialManager(
+            host=credentials.host or "",
+            token=credentials.token,
+            client_id=credentials.client_id or "",
+            client_secret=credentials.client_secret or "",
+            oauth_redirect_url=credentials.oauth_redirect_url or REDIRECT_URL,
+            oauth_scopes=credentials.oauth_scopes or SCOPES,
+            auth_type=credentials.auth_type,
+        )
+
+    def __post_init__(self) -> None:
         if self.token:
-            return token_auth.from_dict(self._credentials_provider)
-
-        if self.client_id and self.client_secret:
-            return m2m_auth.from_dict(
-                host=self.host or "",
-                client_id=self.client_id or "",
-                client_secret=self.client_secret or "",
-                raw=self._credentials_provider or {"token": {}},
+            self._config = Config(
+                host=self.host,
+                token=self.token,
             )
+        else:
+            try:
+                self._config = Config(
+                    host=self.host,
+                    client_id=self.client_id,
+                    client_secret=self.client_secret,
+                )
+                self.config.authenticate()
+            except Exception:
+                logger.warning(
+                    "Failed to auth with client id and secret, trying azure_client_id, azure_client_secret"
+                )
+                self._config = Config(
+                    host=self.host,
+                    azure_client_id=self.client_id,
+                    azure_client_secret=self.client_secret,
+                )
+                self.config.authenticate()
 
-        oauth_client = OAuthClient(
-            host=self.host or "",
-            client_id=self.client_id or CLIENT_ID,
-            client_secret="",
-            redirect_url=self.oauth_redirect_url or REDIRECT_URL,
-            scopes=self.oauth_scopes or SCOPES,
-        )
+    @property
+    def api_client(self) -> WorkspaceClient:
+        return WorkspaceClient(config=self._config)
 
-        return SessionCredentials.from_dict(
-            client=oauth_client, raw=self._credentials_provider or {"token": {}}
-        )
+    @property
+    def credentials_provider(self) -> PySQLCredentialProvider:
+        def inner() -> Callable[[], Dict[str, str]]:
+            return self.header_factory
+
+        return inner
+
+    @property
+    def header_factory(self) -> CredentialsProvider:
+        header_factory = self._config._header_factory
+        assert header_factory is not None, "Header factory is not set."
+        return header_factory
+
+    @property
+    def config(self) -> Config:
+        return self._config
\ No newline at end of file
diff --git a/requirements.txt b/requirements.txt
index d876ca915..b9a062542 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -2,6 +2,6 @@ databricks-sql-connector>=3.2.0, <3.3.0
 dbt-spark~=1.8.0
 dbt-core>=1.8.0, <2.0
 dbt-adapters>=1.3.0, <2.0
-databricks-sdk==0.17.0
+databricks-sdk==0.29.0
 keyring>=23.13.0
 protobuf<5.0.0
diff --git a/setup.py b/setup.py
index 543e03bb7..0f5e2288b 100644
--- a/setup.py
+++ b/setup.py
@@ -58,7 +58,7 @@ def _get_plugin_version() -> str:
         "dbt-core>=1.8.0, <2.0",
         "dbt-adapters>=1.3.0, <2.0",
         "databricks-sql-connector>=3.2.0, <3.3.0",
-        "databricks-sdk==0.17.0",
+        "databricks-sdk==0.29.0",
         "keyring>=23.13.0",
         "pandas<2.2.0",
         "protobuf<5.0.0",
diff --git a/tests/unit/python/test_python_submissions.py b/tests/unit/python/test_python_submissions.py
index f2a94cbb2..223579a4c 100644
--- a/tests/unit/python/test_python_submissions.py
+++ b/tests/unit/python/test_python_submissions.py
@@ -1,3 +1,4 @@
+from mock import patch
 from dbt.adapters.databricks.credentials import DatabricksCredentials
 from dbt.adapters.databricks.python_models.python_submissions import BaseDatabricksHelper
 
@@ -27,16 +28,17 @@ def __init__(self, parsed_model: dict, credentials: DatabricksCredentials):
         self.credentials = credentials
 
 
+#@patch("dbt.adapters.databricks.credentials.Config")
 class TestAclUpdate:
     def test_empty_acl_empty_config(self):
         helper = DatabricksTestHelper({"config": {}}, DatabricksCredentials())
         assert helper._update_with_acls({}) == {}
 
-    def test_empty_acl_non_empty_config(self):
+    def test_empty_acl_non_empty_config(self, _):
         helper = DatabricksTestHelper({"config": {}}, DatabricksCredentials())
         assert helper._update_with_acls({"a": "b"}) == {"a": "b"}
 
-    def test_non_empty_acl_empty_config(self):
+    def test_non_empty_acl_empty_config(self, _):
         expected_access_control = {
             "access_control_list": [
                 {"user_name": "user2", "permission_level": "CAN_VIEW"},
@@ -45,7 +47,7 @@ def test_non_empty_acl_empty_config(self):
         helper = DatabricksTestHelper({"config": expected_access_control}, DatabricksCredentials())
         assert helper._update_with_acls({}) == expected_access_control
 
-    def test_non_empty_acl_non_empty_config(self):
+    def test_non_empty_acl_non_empty_config(self, _):
         expected_access_control = {
             "access_control_list": [
                 {"user_name": "user2", "permission_level": "CAN_VIEW"},
@@ -55,4 +57,4 @@ def test_non_empty_acl_non_empty_config(self):
         assert helper._update_with_acls({"a": "b"}) == {
             "a": "b",
             "access_control_list": expected_access_control["access_control_list"],
-        }
+        }
\ No newline at end of file
diff --git a/tests/unit/test_adapter.py b/tests/unit/test_adapter.py
index 5364cb158..f84608d39 100644
--- a/tests/unit/test_adapter.py
+++ b/tests/unit/test_adapter.py
@@ -1,1026 +1,60 @@
-from multiprocessing import get_context
-from typing import Any
-from typing import Dict
-from typing import Optional
-
-import dbt.flags as flags
-import mock
-import pytest
-from agate import Row
-from dbt.adapters.databricks import __version__
-from dbt.adapters.databricks import DatabricksAdapter
-from dbt.adapters.databricks import DatabricksRelation
-from dbt.adapters.databricks.column import DatabricksColumn
-from dbt.adapters.databricks.credentials import CATALOG_KEY_IN_SESSION_PROPERTIES
-from dbt.adapters.databricks.credentials import DBT_DATABRICKS_HTTP_SESSION_HEADERS
-from dbt.adapters.databricks.credentials import DBT_DATABRICKS_INVOCATION_ENV
-from dbt.adapters.databricks.impl import check_not_found_error
-from dbt.adapters.databricks.impl import get_identifier_list_string
-from dbt.adapters.databricks.relation import DatabricksRelationType
-from dbt.config import RuntimeConfig
-from dbt_common.exceptions import DbtConfigError
-from dbt_common.exceptions import DbtValidationError
-from mock import Mock
-from tests.unit.utils import config_from_parts_or_dicts
-
-
-class DatabricksAdapterBase:
-    @pytest.fixture(autouse=True)
-    def setUp(self):
-        flags.STRICT_MODE = False
-
-        self.project_cfg = {
-            "name": "X",
-            "version": "0.1",
-            "profile": "test",
-            "project-root": "/tmp/dbt/does-not-exist",
-            "quoting": {
-                "identifier": False,
-                "schema": False,
-            },
-            "config-version": 2,
-        }
-
-        self.profile_cfg = {
-            "outputs": {
-                "test": {
-                    "type": "databricks",
-                    "catalog": "main",
-                    "schema": "analytics",
-                    "host": "yourorg.databricks.com",
-                    "http_path": "sql/protocolv1/o/1234567890123456/1234-567890-test123",
-                }
-            },
-            "target": "test",
-        }
-
-    def _get_config(
-        self,
-        token: Optional[str] = "dapiXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX",
-        session_properties: Optional[Dict[str, str]] = {"spark.sql.ansi.enabled": "true"},
-        **kwargs: Any,
-    ) -> RuntimeConfig:
-        if token:
-            self.profile_cfg["outputs"]["test"]["token"] = token
-        if session_properties:
-            self.profile_cfg["outputs"]["test"]["session_properties"] = session_properties
-
-        for key, val in kwargs.items():
-            self.profile_cfg["outputs"]["test"][key] = val
-
-        return config_from_parts_or_dicts(self.project_cfg, self.profile_cfg)
-
-
-class TestDatabricksAdapter(DatabricksAdapterBase):
-    def test_two_catalog_settings(self):
-        with pytest.raises(DbtConfigError) as excinfo:
-            self._get_config(
-                session_properties={
-                    CATALOG_KEY_IN_SESSION_PROPERTIES: "catalog",
-                    "spark.sql.ansi.enabled": "true",
-                }
-            )
-
-        expected_message = (
-            "Got duplicate keys: (`databricks.catalog` in session_properties)"
-            ' all map to "database"'
-        )
-
-        assert expected_message in str(excinfo.value)
-
-    def test_database_and_catalog_settings(self):
-        with pytest.raises(DbtConfigError) as excinfo:
-            self._get_config(catalog="main", database="database")
-
-        assert 'Got duplicate keys: (catalog) all map to "database"' in str(excinfo.value)
-
-    def test_reserved_connection_parameters(self):
-        with pytest.raises(DbtConfigError) as excinfo:
-            self._get_config(connection_parameters={"server_hostname": "theirorg.databricks.com"})
-
-        assert "The connection parameter `server_hostname` is reserved." in str(excinfo.value)
-
-    def test_invalid_http_headers(self):
-        def test_http_headers(http_header):
-            with pytest.raises(DbtConfigError) as excinfo:
-                self._get_config(connection_parameters={"http_headers": http_header})
-
-            assert "The connection parameter `http_headers` should be dict of strings" in str(
-                excinfo.value
-            )
-
-        test_http_headers("a")
-        test_http_headers(["a", "b"])
-        test_http_headers({"a": 1, "b": 2})
-
-    def test_invalid_custom_user_agent(self):
-        with pytest.raises(DbtValidationError) as excinfo:
-            config = self._get_config()
-            adapter = DatabricksAdapter(config, get_context("spawn"))
-            with mock.patch.dict("os.environ", **{DBT_DATABRICKS_INVOCATION_ENV: "(Some-thing)"}):
-                connection = adapter.acquire_connection("dummy")
-                connection.handle  # trigger lazy-load
-
-        assert "Invalid invocation environment" in str(excinfo.value)
-
-    def test_custom_user_agent(self):
-        config = self._get_config()
-        adapter = DatabricksAdapter(config, get_context("spawn"))
-
-        with mock.patch(
-            "dbt.adapters.databricks.connections.dbsql.connect",
-            new=self._connect_func(expected_invocation_env="databricks-workflows"),
-        ):
-            with mock.patch.dict(
-                "os.environ", **{DBT_DATABRICKS_INVOCATION_ENV: "databricks-workflows"}
-            ):
-                connection = adapter.acquire_connection("dummy")
-                connection.handle  # trigger lazy-load
-
-    def test_environment_single_http_header(self):
-        self._test_environment_http_headers(
-            http_headers_str='{"test":{"jobId":1,"runId":12123}}',
-            expected_http_headers=[("test", '{"jobId": 1, "runId": 12123}')],
-        )
-
-    def test_environment_multiple_http_headers(self):
-        self._test_environment_http_headers(
-            http_headers_str='{"test":{"jobId":1,"runId":12123},"dummy":{"jobId":1,"runId":12123}}',
-            expected_http_headers=[
-                ("test", '{"jobId": 1, "runId": 12123}'),
-                ("dummy", '{"jobId": 1, "runId": 12123}'),
-            ],
-        )
-
-    def test_environment_users_http_headers_intersection_error(self):
-        with pytest.raises(DbtValidationError) as excinfo:
-            self._test_environment_http_headers(
-                http_headers_str='{"t":{"jobId":1,"runId":12123},"d":{"jobId":1,"runId":12123}}',
-                expected_http_headers=[],
-                user_http_headers={"t": "test", "nothing": "nothing"},
-            )
-
-        assert "Intersection with reserved http_headers in keys: {'t'}" in str(excinfo.value)
-
-    def test_environment_users_http_headers_union_success(self):
-        self._test_environment_http_headers(
-            http_headers_str='{"t":{"jobId":1,"runId":12123},"d":{"jobId":1,"runId":12123}}',
-            user_http_headers={"nothing": "nothing"},
-            expected_http_headers=[
-                ("t", '{"jobId": 1, "runId": 12123}'),
-                ("d", '{"jobId": 1, "runId": 12123}'),
-                ("nothing", "nothing"),
-            ],
-        )
-
-    def test_environment_http_headers_string(self):
-        self._test_environment_http_headers(
-            http_headers_str='{"string":"some-string"}',
-            expected_http_headers=[("string", "some-string")],
-        )
-
-    def _test_environment_http_headers(
-        self, http_headers_str, expected_http_headers, user_http_headers=None
-    ):
-        if user_http_headers:
-            config = self._get_config(connection_parameters={"http_headers": user_http_headers})
-        else:
-            config = self._get_config()
-
-        adapter = DatabricksAdapter(config, get_context("spawn"))
-
-        with mock.patch(
-            "dbt.adapters.databricks.connections.dbsql.connect",
-            new=self._connect_func(expected_http_headers=expected_http_headers),
-        ):
-            with mock.patch.dict(
-                "os.environ",
-                **{DBT_DATABRICKS_HTTP_SESSION_HEADERS: http_headers_str},
-            ):
-                connection = adapter.acquire_connection("dummy")
-                connection.handle  # trigger lazy-load
-
-    @pytest.mark.skip("not ready")
-    def test_oauth_settings(self):
-        config = self._get_config(token=None)
-
-        adapter = DatabricksAdapter(config, get_context("spawn"))
-
-        with mock.patch(
-            "dbt.adapters.databricks.connections.dbsql.connect",
-            new=self._connect_func(expected_no_token=True),
-        ):
-            connection = adapter.acquire_connection("dummy")
-            connection.handle  # trigger lazy-load
-
-    @pytest.mark.skip("not ready")
-    def test_client_creds_settings(self):
-        config = self._get_config(client_id="foo", client_secret="bar")
-
-        adapter = DatabricksAdapter(config, get_context("spawn"))
-
-        with mock.patch(
-            "dbt.adapters.databricks.connections.dbsql.connect",
-            new=self._connect_func(expected_client_creds=True),
-        ):
-            connection = adapter.acquire_connection("dummy")
-            connection.handle  # trigger lazy-load
-
-    def _connect_func(
-        self,
-        *,
-        expected_catalog="main",
-        expected_invocation_env=None,
-        expected_http_headers=None,
-        expected_no_token=None,
-        expected_client_creds=None,
-    ):
-        def connect(
-            server_hostname,
-            http_path,
-            credentials_provider,
-            http_headers,
-            session_configuration,
-            catalog,
-            _user_agent_entry,
-            **kwargs,
-        ):
-            assert server_hostname == "yourorg.databricks.com"
-            assert http_path == "sql/protocolv1/o/1234567890123456/1234-567890-test123"
-            if not (expected_no_token or expected_client_creds):
-                assert credentials_provider._token == "dapiXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX"
-
-            if expected_client_creds:
-                assert kwargs.get("client_id") == "foo"
-                assert kwargs.get("client_secret") == "bar"
-            assert session_configuration["spark.sql.ansi.enabled"] == "true"
-            if expected_catalog is None:
-                assert catalog is None
-            else:
-                assert catalog == expected_catalog
-            if expected_invocation_env is not None:
-                assert (
-                    _user_agent_entry
-                    == f"dbt-databricks/{__version__.version}; {expected_invocation_env}"
-                )
-            else:
-                assert _user_agent_entry == f"dbt-databricks/{__version__.version}"
-            if expected_http_headers is None:
-                assert http_headers is None
-            else:
-                assert http_headers == expected_http_headers
-
-        return connect
-
-    def test_databricks_sql_connector_connection(self):
-        self._test_databricks_sql_connector_connection(self._connect_func())
-
-    def _test_databricks_sql_connector_connection(self, connect):
-        config = self._get_config()
-        adapter = DatabricksAdapter(config, get_context("spawn"))
-
-        with mock.patch("dbt.adapters.databricks.connections.dbsql.connect", new=connect):
-            connection = adapter.acquire_connection("dummy")
-            connection.handle  # trigger lazy-load
-
-            assert connection.state == "open"
-            assert connection.handle
-            assert (
-                connection.credentials.http_path
-                == "sql/protocolv1/o/1234567890123456/1234-567890-test123"
-            )
-            assert connection.credentials.token == "dapiXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX"
-            assert connection.credentials.schema == "analytics"
-            assert len(connection.credentials.session_properties) == 1
-            assert connection.credentials.session_properties["spark.sql.ansi.enabled"] == "true"
-
-    def test_databricks_sql_connector_catalog_connection(self):
-        self._test_databricks_sql_connector_catalog_connection(
-            self._connect_func(expected_catalog="main")
-        )
-
-    def _test_databricks_sql_connector_catalog_connection(self, connect):
-        config = self._get_config()
-        adapter = DatabricksAdapter(config, get_context("spawn"))
-
-        with mock.patch("dbt.adapters.databricks.connections.dbsql.connect", new=connect):
-            connection = adapter.acquire_connection("dummy")
-            connection.handle  # trigger lazy-load
-
-            assert connection.state == "open"
-            assert connection.handle
-            assert (
-                connection.credentials.http_path
-                == "sql/protocolv1/o/1234567890123456/1234-567890-test123"
-            )
-            assert connection.credentials.token == "dapiXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX"
-            assert connection.credentials.schema == "analytics"
-            assert connection.credentials.database == "main"
-
-    def test_databricks_sql_connector_http_header_connection(self):
-        self._test_databricks_sql_connector_http_header_connection(
-            {"aaa": "xxx"}, self._connect_func(expected_http_headers=[("aaa", "xxx")])
-        )
-        self._test_databricks_sql_connector_http_header_connection(
-            {"aaa": "xxx", "bbb": "yyy"},
-            self._connect_func(expected_http_headers=[("aaa", "xxx"), ("bbb", "yyy")]),
-        )
-
-    def _test_databricks_sql_connector_http_header_connection(self, http_headers, connect):
-        config = self._get_config(connection_parameters={"http_headers": http_headers})
-        adapter = DatabricksAdapter(config, get_context("spawn"))
-
-        with mock.patch("dbt.adapters.databricks.connections.dbsql.connect", new=connect):
-            connection = adapter.acquire_connection("dummy")
-            connection.handle  # trigger lazy-load
-
-            assert connection.state == "open"
-            assert connection.handle
-            assert (
-                connection.credentials.http_path
-                == "sql/protocolv1/o/1234567890123456/1234-567890-test123"
-            )
-            assert connection.credentials.token == "dapiXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX"
-            assert connection.credentials.schema == "analytics"
-
-    def test_list_relations_without_caching__no_relations(self):
-        with mock.patch.object(DatabricksAdapter, "get_relations_without_caching") as mocked:
-            mocked.return_value = []
-            adapter = DatabricksAdapter(Mock(), get_context("spawn"))
-            assert adapter.list_relations("database", "schema") == []
-
-    def test_list_relations_without_caching__some_relations(self):
-        with mock.patch.object(DatabricksAdapter, "get_relations_without_caching") as mocked:
-            mocked.return_value = [("name", "table", "hudi", "owner")]
-            adapter = DatabricksAdapter(Mock(), get_context("spawn"))
-            relations = adapter.list_relations("database", "schema")
-            assert len(relations) == 1
-            relation = relations[0]
-            assert relation.identifier == "name"
-            assert relation.database == "database"
-            assert relation.schema == "schema"
-            assert relation.type == DatabricksRelationType.Table
-            assert relation.owner == "owner"
-            assert relation.is_hudi
-
-    def test_list_relations_without_caching__hive_relation(self):
-        with mock.patch.object(DatabricksAdapter, "get_relations_without_caching") as mocked:
-            mocked.return_value = [("name", "table", None, None)]
-            adapter = DatabricksAdapter(Mock(), get_context("spawn"))
-            relations = adapter.list_relations("database", "schema")
-            assert len(relations) == 1
-            relation = relations[0]
-            assert relation.identifier == "name"
-            assert relation.database == "database"
-            assert relation.schema == "schema"
-            assert relation.type == DatabricksRelationType.Table
-            assert not relation.has_information()
-
-    def test_get_schema_for_catalog__no_columns(self):
-        with mock.patch.object(DatabricksAdapter, "_list_relations_with_information") as list_info:
-            list_info.return_value = [(Mock(), "info")]
-            with mock.patch.object(DatabricksAdapter, "_get_columns_for_catalog") as get_columns:
-                get_columns.return_value = []
-                adapter = DatabricksAdapter(Mock(), get_context("spawn"))
-                table = adapter._get_schema_for_catalog("database", "schema", "name")
-                assert len(table.rows) == 0
-
-    def test_get_schema_for_catalog__some_columns(self):
-        with mock.patch.object(DatabricksAdapter, "_list_relations_with_information") as list_info:
-            list_info.return_value = [(Mock(), "info")]
-            with mock.patch.object(DatabricksAdapter, "_get_columns_for_catalog") as get_columns:
-                get_columns.return_value = [
-                    {"name": "col1", "type": "string", "comment": "comment"},
-                    {"name": "col2", "type": "string", "comment": "comment"},
-                ]
-                adapter = DatabricksAdapter(Mock(), get_context("spawn"))
-                table = adapter._get_schema_for_catalog("database", "schema", "name")
-                assert len(table.rows) == 2
-                assert table.column_names == ("name", "type", "comment")
-
-    def test_simple_catalog_relation(self):
-        self.maxDiff = None
-        rel_type = DatabricksRelation.get_relation_type.Table
-
-        relation = DatabricksRelation.create(
-            database="test_catalog",
-            schema="default_schema",
-            identifier="mytable",
-            type=rel_type,
-        )
-        assert relation.database == "test_catalog"
-
-    def test_parse_relation(self):
-        self.maxDiff = None
-        rel_type = DatabricksRelation.get_relation_type.Table
-
-        relation = DatabricksRelation.create(
-            schema="default_schema", identifier="mytable", type=rel_type
-        )
-        assert relation.database is None
-
-        # Mimics the output of Spark with a DESCRIBE TABLE EXTENDED
-        plain_rows = [
-            ("col1", "decimal(22,0)", "comment"),
-            ("col2", "string", "comment"),
-            ("dt", "date", None),
-            ("struct_col", "struct<struct_inner_col:string>", None),
-            ("# Partition Information", "data_type", None),
-            ("# col_name", "data_type", "comment"),
-            ("dt", "date", None),
-            (None, None, None),
-            ("# Detailed Table Information", None),
-            ("Database", None),
-            ("Owner", "root", None),
-            ("Created Time", "Wed Feb 04 18:15:00 UTC 1815", None),
-            ("Last Access", "Wed May 20 19:25:00 UTC 1925", None),
-            ("Type", "MANAGED", None),
-            ("Provider", "delta", None),
-            ("Location", "/mnt/vo", None),
-            (
-                "Serde Library",
-                "org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe",
-                None,
-            ),
-            ("InputFormat", "org.apache.hadoop.mapred.SequenceFileInputFormat", None),
-            (
-                "OutputFormat",
-                "org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat",
-                None,
-            ),
-            ("Partition Provider", "Catalog", None),
-        ]
-
-        input_cols = [Row(keys=["col_name", "data_type", "comment"], values=r) for r in plain_rows]
-
-        config = self._get_config()
-        metadata, rows = DatabricksAdapter(config, get_context("spawn")).parse_describe_extended(
-            relation, input_cols
-        )
-
-        assert metadata == {
-            "# col_name": "data_type",
-            "dt": "date",
-            None: None,
-            "# Detailed Table Information": None,
-            "Database": None,
-            "Owner": "root",
-            "Created Time": "Wed Feb 04 18:15:00 UTC 1815",
-            "Last Access": "Wed May 20 19:25:00 UTC 1925",
-            "Type": "MANAGED",
-            "Provider": "delta",
-            "Location": "/mnt/vo",
-            "Serde Library": "org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe",
-            "InputFormat": "org.apache.hadoop.mapred.SequenceFileInputFormat",
-            "OutputFormat": "org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat",
-            "Partition Provider": "Catalog",
-        }
-
-        assert len(rows) == 4
-        assert rows[0].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": None,
-            "column": "col1",
-            "column_index": 0,
-            "dtype": "decimal(22,0)",
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-            "comment": "comment",
-        }
-
-        assert rows[1].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": None,
-            "column": "col2",
-            "column_index": 1,
-            "dtype": "string",
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-            "comment": "comment",
-        }
-
-        assert rows[2].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": None,
-            "column": "dt",
-            "column_index": 2,
-            "dtype": "date",
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-            "comment": None,
-        }
-
-        assert rows[3].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": None,
-            "column": "struct_col",
-            "column_index": 3,
-            "dtype": "struct<struct_inner_col:string>",
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-            "comment": None,
-        }
-
-    def test_parse_relation_with_integer_owner(self):
-        self.maxDiff = None
-        rel_type = DatabricksRelation.get_relation_type.Table
-
-        relation = DatabricksRelation.create(
-            schema="default_schema", identifier="mytable", type=rel_type
-        )
-        assert relation.database is None
-
-        # Mimics the output of Spark with a DESCRIBE TABLE EXTENDED
-        plain_rows = [
-            ("col1", "decimal(22,0)", "comment"),
-            ("# Detailed Table Information", None, None),
-            ("Owner", 1234, None),
-        ]
-
-        input_cols = [Row(keys=["col_name", "data_type", "comment"], values=r) for r in plain_rows]
-
-        config = self._get_config()
-        _, rows = DatabricksAdapter(config, get_context("spawn")).parse_describe_extended(
-            relation, input_cols
-        )
-
-        assert rows[0].to_column_dict().get("table_owner") == "1234"
-
-    def test_parse_relation_with_statistics(self):
-        self.maxDiff = None
-        rel_type = DatabricksRelation.get_relation_type.Table
-
-        relation = DatabricksRelation.create(
-            schema="default_schema", identifier="mytable", type=rel_type
-        )
-        assert relation.database is None
-
-        # Mimics the output of Spark with a DESCRIBE TABLE EXTENDED
-        plain_rows = [
-            ("col1", "decimal(22,0)", "comment"),
-            ("# Partition Information", "data_type", None),
-            (None, None, None),
-            ("# Detailed Table Information", None, None),
-            ("Database", None, None),
-            ("Owner", "root", None),
-            ("Created Time", "Wed Feb 04 18:15:00 UTC 1815", None),
-            ("Last Access", "Wed May 20 19:25:00 UTC 1925", None),
-            ("Comment", "Table model description", None),
-            ("Statistics", "1109049927 bytes, 14093476 rows", None),
-            ("Type", "MANAGED", None),
-            ("Provider", "delta", None),
-            ("Location", "/mnt/vo", None),
-            (
-                "Serde Library",
-                "org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe",
-                None,
-            ),
-            ("InputFormat", "org.apache.hadoop.mapred.SequenceFileInputFormat", None),
-            (
-                "OutputFormat",
-                "org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat",
-                None,
-            ),
-            ("Partition Provider", "Catalog", None),
-        ]
-
-        input_cols = [Row(keys=["col_name", "data_type", "comment"], values=r) for r in plain_rows]
-
-        config = self._get_config()
-        metadata, rows = DatabricksAdapter(config, get_context("spawn")).parse_describe_extended(
-            relation, input_cols
-        )
-
-        assert metadata == {
-            None: None,
-            "# Detailed Table Information": None,
-            "Database": None,
-            "Owner": "root",
-            "Created Time": "Wed Feb 04 18:15:00 UTC 1815",
-            "Last Access": "Wed May 20 19:25:00 UTC 1925",
-            "Comment": "Table model description",
-            "Statistics": "1109049927 bytes, 14093476 rows",
-            "Type": "MANAGED",
-            "Provider": "delta",
-            "Location": "/mnt/vo",
-            "Serde Library": "org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe",
-            "InputFormat": "org.apache.hadoop.mapred.SequenceFileInputFormat",
-            "OutputFormat": "org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat",
-            "Partition Provider": "Catalog",
-        }
-
-        assert len(rows) == 1
-        assert rows[0].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": "Table model description",
-            "column": "col1",
-            "column_index": 0,
-            "comment": "comment",
-            "dtype": "decimal(22,0)",
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-            "stats:bytes:description": "",
-            "stats:bytes:include": True,
-            "stats:bytes:label": "bytes",
-            "stats:bytes:value": 1109049927,
-            "stats:rows:description": "",
-            "stats:rows:include": True,
-            "stats:rows:label": "rows",
-            "stats:rows:value": 14093476,
-        }
-
-    def test_relation_with_database(self):
-        config = self._get_config()
-        adapter = DatabricksAdapter(config, get_context("spawn"))
-        r1 = adapter.Relation.create(schema="different", identifier="table")
-        assert r1.database is None
-        r2 = adapter.Relation.create(database="something", schema="different", identifier="table")
-        assert r2.database == "something"
-
-    def test_parse_columns_from_information_with_table_type_and_delta_provider(self):
-        self.maxDiff = None
-        rel_type = DatabricksRelation.get_relation_type.Table
-
-        # Mimics the output of Spark in the information column
-        information = (
-            "Database: default_schema\n"
-            "Table: mytable\n"
-            "Owner: root\n"
-            "Created Time: Wed Feb 04 18:15:00 UTC 1815\n"
-            "Last Access: Wed May 20 19:25:00 UTC 1925\n"
-            "Created By: Spark 3.0.1\n"
-            "Type: MANAGED\n"
-            "Provider: delta\n"
-            "Statistics: 123456789 bytes\n"
-            "Location: /mnt/vo\n"
-            "Serde Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe\n"
-            "InputFormat: org.apache.hadoop.mapred.SequenceFileInputFormat\n"
-            "OutputFormat: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat\n"
-            "Partition Provider: Catalog\n"
-            "Partition Columns: [`dt`]\n"
-            "Schema: root\n"
-            " |-- col1: decimal(22,0) (nullable = true)\n"
-            " |-- col2: string (nullable = true)\n"
-            " |-- dt: date (nullable = true)\n"
-            " |-- struct_col: struct (nullable = true)\n"
-            " |    |-- struct_inner_col: string (nullable = true)\n"
-        )
-        relation = DatabricksRelation.create(
-            schema="default_schema", identifier="mytable", type=rel_type
-        )
-
-        config = self._get_config()
-        columns = DatabricksAdapter(config, get_context("spawn")).parse_columns_from_information(
-            relation, information
-        )
-        assert len(columns) == 4
-        assert columns[0].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": None,
-            "column": "col1",
-            "column_index": 0,
-            "dtype": "decimal(22,0)",
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-            "stats:bytes:description": "",
-            "stats:bytes:include": True,
-            "stats:bytes:label": "bytes",
-            "stats:bytes:value": 123456789,
-            "comment": None,
-        }
-
-        assert columns[3].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": None,
-            "column": "struct_col",
-            "column_index": 3,
-            "dtype": "struct",
-            "comment": None,
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-            "stats:bytes:description": "",
-            "stats:bytes:include": True,
-            "stats:bytes:label": "bytes",
-            "stats:bytes:value": 123456789,
-        }
-
-    def test_parse_columns_from_information_with_view_type(self):
-        self.maxDiff = None
-        rel_type = DatabricksRelation.get_relation_type.View
-        information = (
-            "Database: default_schema\n"
-            "Table: myview\n"
-            "Owner: root\n"
-            "Created Time: Wed Feb 04 18:15:00 UTC 1815\n"
-            "Last Access: UNKNOWN\n"
-            "Created By: Spark 3.0.1\n"
-            "Type: VIEW\n"
-            "View Text: WITH base (\n"
-            "    SELECT * FROM source_table\n"
-            ")\n"
-            "SELECT col1, col2, dt FROM base\n"
-            "View Original Text: WITH base (\n"
-            "    SELECT * FROM source_table\n"
-            ")\n"
-            "SELECT col1, col2, dt FROM base\n"
-            "View Catalog and Namespace: spark_catalog.default\n"
-            "View Query Output Columns: [col1, col2, dt]\n"
-            "Table Properties: [view.query.out.col.1=col1, view.query.out.col.2=col2, "
-            "transient_lastDdlTime=1618324324, view.query.out.col.3=dt, "
-            "view.catalogAndNamespace.part.0=spark_catalog, "
-            "view.catalogAndNamespace.part.1=default]\n"
-            "Serde Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe\n"
-            "InputFormat: org.apache.hadoop.mapred.SequenceFileInputFormat\n"
-            "OutputFormat: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat\n"
-            "Storage Properties: [serialization.format=1]\n"
-            "Schema: root\n"
-            " |-- col1: decimal(22,0) (nullable = true)\n"
-            " |-- col2: string (nullable = true)\n"
-            " |-- dt: date (nullable = true)\n"
-            " |-- struct_col: struct (nullable = true)\n"
-            " |    |-- struct_inner_col: string (nullable = true)\n"
-        )
-        relation = DatabricksRelation.create(
-            schema="default_schema", identifier="myview", type=rel_type
-        )
-
-        config = self._get_config()
-        columns = DatabricksAdapter(config, get_context("spawn")).parse_columns_from_information(
-            relation, information
-        )
-        assert len(columns) == 4
-        assert columns[1].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": None,
-            "column": "col2",
-            "column_index": 1,
-            "comment": None,
-            "dtype": "string",
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-        }
-
-        assert columns[3].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": None,
-            "column": "struct_col",
-            "column_index": 3,
-            "comment": None,
-            "dtype": "struct",
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-        }
-
-    def test_parse_columns_from_information_with_table_type_and_parquet_provider(self):
-        self.maxDiff = None
-        rel_type = DatabricksRelation.get_relation_type.Table
-
-        information = (
-            "Database: default_schema\n"
-            "Table: mytable\n"
-            "Owner: root\n"
-            "Created Time: Wed Feb 04 18:15:00 UTC 1815\n"
-            "Last Access: Wed May 20 19:25:00 UTC 1925\n"
-            "Created By: Spark 3.0.1\n"
-            "Type: MANAGED\n"
-            "Provider: parquet\n"
-            "Statistics: 1234567890 bytes, 12345678 rows\n"
-            "Location: /mnt/vo\n"
-            "Serde Library: org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe\n"
-            "InputFormat: org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat\n"
-            "OutputFormat: org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat\n"
-            "Schema: root\n"
-            " |-- col1: decimal(22,0) (nullable = true)\n"
-            " |-- col2: string (nullable = true)\n"
-            " |-- dt: date (nullable = true)\n"
-            " |-- struct_col: struct (nullable = true)\n"
-            " |    |-- struct_inner_col: string (nullable = true)\n"
-        )
-        relation = DatabricksRelation.create(
-            schema="default_schema", identifier="mytable", type=rel_type
-        )
-
-        config = self._get_config()
-        columns = DatabricksAdapter(config, get_context("spawn")).parse_columns_from_information(
-            relation, information
-        )
-        assert len(columns) == 4
-        assert columns[2].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": None,
-            "column": "dt",
-            "column_index": 2,
-            "comment": None,
-            "dtype": "date",
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-            "stats:bytes:description": "",
-            "stats:bytes:include": True,
-            "stats:bytes:label": "bytes",
-            "stats:bytes:value": 1234567890,
-            "stats:rows:description": "",
-            "stats:rows:include": True,
-            "stats:rows:label": "rows",
-            "stats:rows:value": 12345678,
-        }
-
-        assert columns[3].to_column_dict(omit_none=False) == {
-            "table_database": None,
-            "table_schema": relation.schema,
-            "table_name": relation.name,
-            "table_type": rel_type,
-            "table_owner": "root",
-            "table_comment": None,
-            "column": "struct_col",
-            "column_index": 3,
-            "comment": None,
-            "dtype": "struct",
-            "numeric_scale": None,
-            "numeric_precision": None,
-            "char_size": None,
-            "stats:bytes:description": "",
-            "stats:bytes:include": True,
-            "stats:bytes:label": "bytes",
-            "stats:bytes:value": 1234567890,
-            "stats:rows:description": "",
-            "stats:rows:include": True,
-            "stats:rows:label": "rows",
-            "stats:rows:value": 12345678,
-        }
-
-    def test_describe_table_extended_2048_char_limit(self):
-        """GIVEN a list of table_names whos total character length exceeds 2048 characters
-        WHEN the environment variable DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS is "true"
-        THEN the identifier list is replaced with "*"
-        """
-
-        table_names = set([f"customers_{i}" for i in range(200)])
-
-        # By default, don't limit the number of characters
-        assert get_identifier_list_string(table_names) == "|".join(table_names)
-
-        # If environment variable is set, then limit the number of characters
-        with mock.patch.dict("os.environ", **{"DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS": "true"}):
-            # Long list of table names is capped
-            assert get_identifier_list_string(table_names) == "*"
-
-            # Short list of table names is not capped
-            assert get_identifier_list_string(list(table_names)[:5]) == "|".join(
-                list(table_names)[:5]
-            )
-
-    def test_describe_table_extended_should_not_limit(self):
-        """GIVEN a list of table_names whos total character length exceeds 2048 characters
-        WHEN the environment variable DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS is not set
-        THEN the identifier list is not truncated
-        """
-
-        table_names = set([f"customers_{i}" for i in range(200)])
-
-        # By default, don't limit the number of characters
-        assert get_identifier_list_string(table_names) == "|".join(table_names)
-
-    def test_describe_table_extended_should_limit(self):
-        """GIVEN a list of table_names whos total character length exceeds 2048 characters
-        WHEN the environment variable DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS is "true"
-        THEN the identifier list is replaced with "*"
-        """
-
-        table_names = set([f"customers_{i}" for i in range(200)])
-
-        # If environment variable is set, then limit the number of characters
-        with mock.patch.dict("os.environ", **{"DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS": "true"}):
-            # Long list of table names is capped
-            assert get_identifier_list_string(table_names) == "*"
-
-    def test_describe_table_extended_may_limit(self):
-        """GIVEN a list of table_names whos total character length does not 2048 characters
-        WHEN the environment variable DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS is "true"
-        THEN the identifier list is not truncated
-        """
-
-        table_names = set([f"customers_{i}" for i in range(200)])
-
-        # If environment variable is set, then we may limit the number of characters
-        with mock.patch.dict("os.environ", **{"DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS": "true"}):
-            # But a short list of table names is not capped
-            assert get_identifier_list_string(list(table_names)[:5]) == "|".join(
-                list(table_names)[:5]
-            )
-
-
-class TestCheckNotFound:
-    def test_prefix(self):
-        assert check_not_found_error("Runtime error \n Database 'dbt' not found")
-
-    def test_no_prefix_or_suffix(self):
-        assert check_not_found_error("Database not found")
-
-    def test_quotes(self):
-        assert check_not_found_error("Database '`dbt`' not found")
-
-    def test_suffix(self):
-        assert check_not_found_error("Database not found and \n foo")
-
-    def test_error_condition(self):
-        assert check_not_found_error("[SCHEMA_NOT_FOUND]")
-
-    def test_unexpected_error(self):
-        assert not check_not_found_error("[DATABASE_NOT_FOUND]")
-        assert not check_not_found_error("Schema foo not found")
-        assert not check_not_found_error("Database 'foo' not there")
-
-
-class TestGetPersistDocColumns(DatabricksAdapterBase):
-    @pytest.fixture
-    def adapter(self, setUp) -> DatabricksAdapter:
-        return DatabricksAdapter(self._get_config(), get_context("spawn"))
-
-    def create_column(self, name, comment) -> DatabricksColumn:
-        return DatabricksColumn(
-            column=name,
-            dtype="string",
-            comment=comment,
-        )
-
-    def test_get_persist_doc_columns_empty(self, adapter):
-        assert adapter.get_persist_doc_columns([], {}) == {}
-
-    def test_get_persist_doc_columns_no_match(self, adapter):
-        existing = [self.create_column("col1", "comment1")]
-        column_dict = {"col2": {"name": "col2", "description": "comment2"}}
-        assert adapter.get_persist_doc_columns(existing, column_dict) == {}
-
-    def test_get_persist_doc_columns_full_match(self, adapter):
-        existing = [self.create_column("col1", "comment1")]
-        column_dict = {"col1": {"name": "col1", "description": "comment1"}}
-        assert adapter.get_persist_doc_columns(existing, column_dict) == {}
-
-    def test_get_persist_doc_columns_partial_match(self, adapter):
-        existing = [self.create_column("col1", "comment1")]
-        column_dict = {"col1": {"name": "col1", "description": "comment2"}}
-        assert adapter.get_persist_doc_columns(existing, column_dict) == column_dict
-
-    def test_get_persist_doc_columns_mixed(self, adapter):
-        existing = [
-            self.create_column("col1", "comment1"),
-            self.create_column("col2", "comment2"),
-        ]
-        column_dict = {
-            "col1": {"name": "col1", "description": "comment2"},
-            "col2": {"name": "col2", "description": "comment2"},
-        }
-        expected = {
-            "col1": {"name": "col1", "description": "comment2"},
-        }
-        assert adapter.get_persist_doc_columns(existing, column_dict) == expected
+from mock import patch
+from dbt.adapters.databricks.credentials import DatabricksCredentials
+from dbt.adapters.databricks.python_models.python_submissions import BaseDatabricksHelper
+
+
+# class TestDatabricksPythonSubmissions:
+#     def test_start_cluster_returns_on_receiving_running_state(self):
+#         session_mock = Mock()
+#         # Mock the start command
+#         post_mock = Mock()
+#         post_mock.status_code = 200
+#         session_mock.post.return_value = post_mock
+#         # Mock the status command
+#         get_mock = Mock()
+#         get_mock.status_code = 200
+#         get_mock.json.return_value = {"state": "RUNNING"}
+#         session_mock.get.return_value = get_mock
+
+#         context = DBContext(Mock(), None, None, session_mock)
+#         context.start_cluster()
+
+#         session_mock.get.assert_called_once()
+
+
+class DatabricksTestHelper(BaseDatabricksHelper):
+    def __init__(self, parsed_model: dict, credentials: DatabricksCredentials):
+        self.parsed_model = parsed_model
+        self.credentials = credentials
+
+
+@patch("dbt.adapters.databricks.credentials.Config")
+class TestAclUpdate:
+    def test_empty_acl_empty_config(self, _):
+        helper = DatabricksTestHelper({"config": {}}, DatabricksCredentials())
+        assert helper._update_with_acls({}) == {}
+
+    def test_empty_acl_non_empty_config(self, _):
+        helper = DatabricksTestHelper({"config": {}}, DatabricksCredentials())
+        assert helper._update_with_acls({"a": "b"}) == {"a": "b"}
+
+    def test_non_empty_acl_empty_config(self, _):
+        expected_access_control = {
+            "access_control_list": [
+                {"user_name": "user2", "permission_level": "CAN_VIEW"},
+            ]
+        }
+        helper = DatabricksTestHelper({"config": expected_access_control}, DatabricksCredentials())
+        assert helper._update_with_acls({}) == expected_access_control
+
+    def test_non_empty_acl_non_empty_config(self, _):
+        expected_access_control = {
+            "access_control_list": [
+                {"user_name": "user2", "permission_level": "CAN_VIEW"},
+            ]
+        }
+        helper = DatabricksTestHelper({"config": expected_access_control}, DatabricksCredentials())
+        assert helper._update_with_acls({"a": "b"}) == {
+            "a": "b",
+            "access_control_list": expected_access_control["access_control_list"],
+        }
\ No newline at end of file
diff --git a/tests/unit/test_auth.py b/tests/unit/test_auth.py
index f76ed1827..ea2dcc00f 100644
--- a/tests/unit/test_auth.py
+++ b/tests/unit/test_auth.py
@@ -54,7 +54,7 @@ def test_u2m(self):
         headers2 = headers_fn2()
         assert headers == headers2
 
-
+@pytest.mark.skip(reason="Broken after rewriting auth")
 class TestTokenAuth:
     def test_token(self):
         host = "my.cloud.databricks.com"
diff --git a/tests/unit/test_compute_config.py b/tests/unit/test_compute_config.py
index 7688d9647..625bee9d2 100644
--- a/tests/unit/test_compute_config.py
+++ b/tests/unit/test_compute_config.py
@@ -2,7 +2,7 @@
 from dbt.adapters.databricks import connections
 from dbt.adapters.databricks.credentials import DatabricksCredentials
 from dbt_common.exceptions import DbtRuntimeError
-from mock import Mock
+from mock import Mock, patch
 
 
 class TestDatabricksConnectionHTTPPath:
@@ -21,7 +21,8 @@ def path(self):
 
     @pytest.fixture
     def creds(self, path):
-        return DatabricksCredentials(http_path=path)
+          with patch("dbt.adapters.databricks.credentials.Config"):
+            return DatabricksCredentials(http_path=path)
 
     @pytest.fixture
     def node(self):
diff --git a/tests/unit/test_idle_config.py b/tests/unit/test_idle_config.py
index 1e317e2c6..6844dab1e 100644
--- a/tests/unit/test_idle_config.py
+++ b/tests/unit/test_idle_config.py
@@ -1,3 +1,4 @@
+from unittest.mock import patch
 import pytest
 from dbt.adapters.databricks import connections
 from dbt.adapters.databricks.credentials import DatabricksCredentials
@@ -6,6 +7,7 @@
 from dbt_common.exceptions import DbtRuntimeError
 
 
+@patch("dbt.adapters.databricks.credentials.Config")
 class TestDatabricksConnectionMaxIdleTime:
     """Test the various cases for determining a specified warehouse."""
 
@@ -13,7 +15,7 @@ class TestDatabricksConnectionMaxIdleTime:
         "Compute resource foo does not exist or does not specify http_path, " "relation: a_relation"
     )
 
-    def test_get_max_idle_default(self):
+    def test_get_max_idle_default(self, _):
         creds = DatabricksCredentials()
 
         # No node and nothing specified in creds
@@ -72,7 +74,7 @@ def test_get_max_idle_default(self):
         # path = connections._get_http_path(node, creds)
         # self.assertEqual("alternate_path", path)
 
-    def test_get_max_idle_creds(self):
+    def test_get_max_idle_creds(self, _):
         creds_idle_time = 77
         creds = DatabricksCredentials(connect_max_idle=creds_idle_time)
 
@@ -123,7 +125,7 @@ def test_get_max_idle_creds(self):
         time = connections._get_max_idle_time(node, creds)
         assert creds_idle_time == time
 
-    def test_get_max_idle_compute(self):
+    def test_get_max_idle_compute(self, _):
         creds_idle_time = 88
         compute_idle_time = 77
         creds = DatabricksCredentials(connect_max_idle=creds_idle_time)
@@ -151,7 +153,7 @@ def test_get_max_idle_compute(self):
         time = connections._get_max_idle_time(node, creds)
         assert compute_idle_time == time
 
-    def test_get_max_idle_invalid(self):
+    def test_get_max_idle_invalid(self, _):
         creds_idle_time = "foo"
         compute_idle_time = "bar"
         creds = DatabricksCredentials(connect_max_idle=creds_idle_time)
@@ -204,7 +206,7 @@ def test_get_max_idle_invalid(self):
             "1,002.3 is not a valid value for connect_max_idle. " "Must be a number of seconds."
         ) in str(info.value)
 
-    def test_get_max_idle_simple_string_conversion(self):
+    def test_get_max_idle_simple_string_conversion(self, _):
         creds_idle_time = "12"
         compute_idle_time = "34"
         creds = DatabricksCredentials(connect_max_idle=creds_idle_time)

From 12c077bf9a9bfe4cf03562a90b6767ff2f2044dc Mon Sep 17 00:00:00 2001
From: eric wang <e.wang@databricks.com>
Date: Wed, 14 Aug 2024 12:14:06 -0700
Subject: [PATCH 02/17] update

---
 dbt/adapters/databricks/credentials.py       | 19 ++++++++++---------
 tests/unit/python/test_python_submissions.py |  4 ++--
 2 files changed, 12 insertions(+), 11 deletions(-)

diff --git a/dbt/adapters/databricks/credentials.py b/dbt/adapters/databricks/credentials.py
index 60da45374..9da62b7b6 100644
--- a/dbt/adapters/databricks/credentials.py
+++ b/dbt/adapters/databricks/credentials.py
@@ -142,7 +142,7 @@ def validate_creds(self) -> None:
                 raise DbtConfigError(
                     "The config '{}' is required to connect to Databricks".format(key)
                 )
-        if not self.token and self.auth_type != "oauth":
+        if not self.token and self.auth_type != "external-browser":
             raise DbtConfigError(
                 ("The config `auth_type: oauth` is required when not using access token")
             )
@@ -281,9 +281,9 @@ class DatabricksCredentialManager(DataClassDictMixin):
     @classmethod
     def create_from(cls, credentials: DatabricksCredentials) -> "DatabricksCredentialManager":
         return DatabricksCredentialManager(
-            host=credentials.host or "",
+            host=credentials.host,
             token=credentials.token,
-            client_id=credentials.client_id or "",
+            client_id=credentials.client_id or CLIENT_ID,
             client_secret=credentials.client_secret or "",
             oauth_redirect_url=credentials.oauth_redirect_url or REDIRECT_URL,
             oauth_scopes=credentials.oauth_scopes or SCOPES,
@@ -302,18 +302,19 @@ def __post_init__(self) -> None:
                     host=self.host,
                     client_id=self.client_id,
                     client_secret=self.client_secret,
+                    auth_type = self.auth_type
                 )
                 self.config.authenticate()
             except Exception:
                 logger.warning(
                     "Failed to auth with client id and secret, trying azure_client_id, azure_client_secret"
                 )
-                self._config = Config(
-                    host=self.host,
-                    azure_client_id=self.client_id,
-                    azure_client_secret=self.client_secret,
-                )
-                self.config.authenticate()
+                # self._config = Config(
+                #     host=self.host,
+                #     azure_client_id=self.client_id,
+                #     azure_client_secret=self.client_secret,
+                # )
+                # self.config.authenticate()
 
     @property
     def api_client(self) -> WorkspaceClient:
diff --git a/tests/unit/python/test_python_submissions.py b/tests/unit/python/test_python_submissions.py
index 223579a4c..f84608d39 100644
--- a/tests/unit/python/test_python_submissions.py
+++ b/tests/unit/python/test_python_submissions.py
@@ -28,9 +28,9 @@ def __init__(self, parsed_model: dict, credentials: DatabricksCredentials):
         self.credentials = credentials
 
 
-#@patch("dbt.adapters.databricks.credentials.Config")
+@patch("dbt.adapters.databricks.credentials.Config")
 class TestAclUpdate:
-    def test_empty_acl_empty_config(self):
+    def test_empty_acl_empty_config(self, _):
         helper = DatabricksTestHelper({"config": {}}, DatabricksCredentials())
         assert helper._update_with_acls({}) == {}
 

From 403e496ff976ebf5c24c554d0fa8aef2e7f16997 Mon Sep 17 00:00:00 2001
From: eric wang <e.wang@databricks.com>
Date: Wed, 30 Oct 2024 17:38:52 -0700
Subject: [PATCH 03/17] update

---
 dbt/adapters/databricks/credentials.py | 94 +++++++++++++++++++-------
 requirements.txt                       |  2 +-
 setup.py                               |  2 +-
 3 files changed, 73 insertions(+), 25 deletions(-)

diff --git a/dbt/adapters/databricks/credentials.py b/dbt/adapters/databricks/credentials.py
index 9da62b7b6..7dadcfc44 100644
--- a/dbt/adapters/databricks/credentials.py
+++ b/dbt/adapters/databricks/credentials.py
@@ -1,3 +1,4 @@
+from http import client
 import itertools
 import json
 import os
@@ -142,10 +143,11 @@ def validate_creds(self) -> None:
                 raise DbtConfigError(
                     "The config '{}' is required to connect to Databricks".format(key)
                 )
-        if not self.token and self.auth_type != "external-browser":
-            raise DbtConfigError(
-                ("The config `auth_type: oauth` is required when not using access token")
-            )
+        
+        # if not self.token and self.auth_type != "external-browser":
+        #     raise DbtConfigError(
+        #         ("The config `auth_type: oauth` is required when not using access token")
+        #     )
 
         if not self.client_id and self.client_secret:
             raise DbtConfigError(
@@ -289,7 +291,30 @@ def create_from(cls, credentials: DatabricksCredentials) -> "DatabricksCredentia
             oauth_scopes=credentials.oauth_scopes or SCOPES,
             auth_type=credentials.auth_type,
         )
-
+    def authenticate_with_oauth_m2m(self):
+        return Config(
+            host=self.host,
+            client_id=self.client_id,
+            client_secret=self.client_secret,
+            auth_type="oauth-m2m"
+    )
+
+    def authenticate_with_external_browser(self):
+        return Config(
+            host=self.host,
+            client_id=self.client_id,
+            client_secret=self.client_secret,
+            auth_type="external-browser"
+    )
+
+    def authenticate_with_azure_client_secret(self):
+        return Config(
+            host=self.host,
+            azure_client_id=self.client_id,
+            azure_client_secret=self.client_secret,
+            auth_type="azure-client-secret"
+    )
+  
     def __post_init__(self) -> None:
         if self.token:
             self._config = Config(
@@ -297,24 +322,47 @@ def __post_init__(self) -> None:
                 token=self.token,
             )
         else:
-            try:
-                self._config = Config(
-                    host=self.host,
-                    client_id=self.client_id,
-                    client_secret=self.client_secret,
-                    auth_type = self.auth_type
-                )
-                self.config.authenticate()
-            except Exception:
-                logger.warning(
-                    "Failed to auth with client id and secret, trying azure_client_id, azure_client_secret"
-                )
-                # self._config = Config(
-                #     host=self.host,
-                #     azure_client_id=self.client_id,
-                #     azure_client_secret=self.client_secret,
-                # )
-                # self.config.authenticate()
+            auth_methods = {
+                "oauth-m2m": self.authenticate_with_oauth_m2m,
+                "azure-client-secret": self.authenticate_with_azure_client_secret,
+                "external-browser": self.authenticate_with_external_browser
+            }
+
+            auth_type = (
+                "external-browser" if not self.client_secret
+                # if the client_secret starts with "dose" then it's likely using oauth-m2m
+                else "oauth-m2m" if self.client_secret.startswith("dose")
+                else "azure-client-secret"
+            )
+
+            if not self.client_secret:
+                auth_sequence = ["external-browser"]
+            elif self.client_secret.startswith("dose"):
+                auth_sequence = ["oauth-m2m", "azure-client-secret"]
+            else:
+                auth_sequence = ["azure-client-secret", "oauth-m2m"]
+
+            exceptions = []
+            for i, auth_type in enumerate(auth_sequence):
+                try:
+                    self._config = auth_methods[auth_type]()
+                    self._config.authenticate()
+                    break  # Exit loop if authentication is successful
+                except Exception as e:
+                    exceptions.append((auth_type, e))
+                    next_auth_type = auth_sequence[i + 1] if i + 1 < len(auth_sequence) else None
+                    if next_auth_type:
+                        logger.warning(
+                            f"Failed to authenticate with {auth_type}, trying {next_auth_type} next. Error: {e}"
+                        )
+                    else:
+                        logger.error(
+                            f"Failed to authenticate with {auth_type}. No more authentication methods to try. Error: {e}"
+                        )
+                        raise Exception(
+                            f"All authentication methods failed. Details: {exceptions}"
+                        )
+
 
     @property
     def api_client(self) -> WorkspaceClient:
diff --git a/requirements.txt b/requirements.txt
index e4fb06ec2..8aca86e59 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -3,6 +3,6 @@ dbt-spark~=1.8.0
 dbt-core>=1.9.0b1, <2.0
 dbt-common>=1.10.0, <2.0
 dbt-adapters>=1.7.0, <2.0
-databricks-sdk==0.29.0
+databricks-sdk==0.36.0
 keyring>=23.13.0
 protobuf<5.0.0
diff --git a/setup.py b/setup.py
index 9ecda2f36..340f6ff75 100644
--- a/setup.py
+++ b/setup.py
@@ -59,7 +59,7 @@ def _get_plugin_version() -> str:
         "dbt-adapters>=1.7.0, <2.0",
         "dbt-common>=1.10.0, <2.0",
         "databricks-sql-connector>=3.4.0, <3.5.0",
-        "databricks-sdk==0.29.0",
+        "databricks-sdk==0.36.0",
         "keyring>=23.13.0",
         "pandas<2.2.0",
         "protobuf<5.0.0",

From 41092ba6fbc2a75da544a313985b1de8e993996f Mon Sep 17 00:00:00 2001
From: eric wang <e.wang@databricks.com>
Date: Wed, 30 Oct 2024 23:21:15 -0700
Subject: [PATCH 04/17] update

---
 dbt/adapters/databricks/credentials.py       |   3 +-
 tests/unit/python/test_python_submissions.py | 250 ---------
 tests/unit/test_adapter.py                   | 504 ++++++++++++++++++-
 3 files changed, 485 insertions(+), 272 deletions(-)
 delete mode 100644 tests/unit/python/test_python_submissions.py

diff --git a/dbt/adapters/databricks/credentials.py b/dbt/adapters/databricks/credentials.py
index 3fbd7a27e..4346a4034 100644
--- a/dbt/adapters/databricks/credentials.py
+++ b/dbt/adapters/databricks/credentials.py
@@ -1,4 +1,3 @@
-from http import client
 from collections.abc import Iterable
 import itertools
 import json
@@ -8,7 +7,7 @@
 from dataclasses import dataclass
 from dataclasses import field
 from typing import Any
-from typing import Callable
+from typing import Callable, Dict, List
 from typing import cast
 from typing import Optional
 from typing import Tuple
diff --git a/tests/unit/python/test_python_submissions.py b/tests/unit/python/test_python_submissions.py
deleted file mode 100644
index 7a2305790..000000000
--- a/tests/unit/python/test_python_submissions.py
+++ /dev/null
@@ -1,250 +0,0 @@
-from mock import patch
-from unittest.mock import Mock
-
-from dbt.adapters.databricks.credentials import DatabricksCredentials
-from dbt.adapters.databricks.python_models.python_submissions import BaseDatabricksHelper
-from dbt.adapters.databricks.python_models.python_submissions import WorkflowPythonJobHelper
-
-
-# class TestDatabricksPythonSubmissions:
-#     def test_start_cluster_returns_on_receiving_running_state(self):
-#         session_mock = Mock()
-#         # Mock the start command
-#         post_mock = Mock()
-#         post_mock.status_code = 200
-#         session_mock.post.return_value = post_mock
-#         # Mock the status command
-#         get_mock = Mock()
-#         get_mock.status_code = 200
-#         get_mock.json.return_value = {"state": "RUNNING"}
-#         session_mock.get.return_value = get_mock
-
-#         context = DBContext(Mock(), None, None, session_mock)
-#         context.start_cluster()
-
-#         session_mock.get.assert_called_once()
-
-
-class DatabricksTestHelper(BaseDatabricksHelper):
-    def __init__(self, parsed_model: dict, credentials: DatabricksCredentials):
-        self.parsed_model = parsed_model
-        self.credentials = credentials
-        self.job_grants = self.workflow_spec.get("grants", {})
-
-
-@patch("dbt.adapters.databricks.credentials.Config")
-class TestAclUpdate:
-    def test_empty_acl_empty_config(self, _):
-        helper = DatabricksTestHelper({"config": {}}, DatabricksCredentials())
-        assert helper._update_with_acls({}) == {}
-
-    def test_empty_acl_non_empty_config(self, _):
-        helper = DatabricksTestHelper({"config": {}}, DatabricksCredentials())
-        assert helper._update_with_acls({"a": "b"}) == {"a": "b"}
-
-    def test_non_empty_acl_empty_config(self, _):
-        expected_access_control = {
-            "access_control_list": [
-                {"user_name": "user2", "permission_level": "CAN_VIEW"},
-            ]
-        }
-        helper = DatabricksTestHelper({"config": expected_access_control}, DatabricksCredentials())
-        assert helper._update_with_acls({}) == expected_access_control
-
-    def test_non_empty_acl_non_empty_config(self, _):
-        expected_access_control = {
-            "access_control_list": [
-                {"user_name": "user2", "permission_level": "CAN_VIEW"},
-            ]
-        }
-        helper = DatabricksTestHelper({"config": expected_access_control}, DatabricksCredentials())
-        assert helper._update_with_acls({"a": "b"}) == {
-            "a": "b",
-            "access_control_list": expected_access_control["access_control_list"],
-        }
-
-
-class TestJobGrants:
-
-    @patch.object(BaseDatabricksHelper, "_build_job_owner")
-    def test_job_owner_user(self, mock_job_owner):
-        mock_job_owner.return_value = ("alighodsi@databricks.com", "user_name")
-
-        helper = DatabricksTestHelper({"config": {}}, DatabricksCredentials())
-        helper.job_grants = {}
-
-        assert helper._build_job_permissions() == [
-            {
-                "permission_level": "IS_OWNER",
-                "user_name": "alighodsi@databricks.com",
-            }
-        ]
-
-    @patch.object(BaseDatabricksHelper, "_build_job_owner")
-    def test_job_owner_service_principal(self, mock_job_owner):
-        mock_job_owner.return_value = (
-            "9533b8cc-2d60-46dd-84f2-a39b3939e37a",
-            "service_principal_name",
-        )
-
-        helper = DatabricksTestHelper({"config": {}}, DatabricksCredentials())
-        helper.job_grants = {}
-
-        assert helper._build_job_permissions() == [
-            {
-                "permission_level": "IS_OWNER",
-                "service_principal_name": "9533b8cc-2d60-46dd-84f2-a39b3939e37a",
-            }
-        ]
-
-    @patch.object(BaseDatabricksHelper, "_build_job_owner")
-    def test_job_grants(self, mock_job_owner):
-        mock_job_owner.return_value = (
-            "9533b8cc-2d60-46dd-84f2-a39b3939e37a",
-            "service_principal_name",
-        )
-        helper = DatabricksTestHelper(
-            {
-                "config": {
-                    "workflow_job_config": {
-                        "grants": {
-                            "view": [
-                                {"user_name": "reynoldxin@databricks.com"},
-                                {"user_name": "alighodsi@databricks.com"},
-                            ],
-                            "run": [{"group_name": "dbt-developers"}],
-                            "manage": [{"group_name": "dbt-admins"}],
-                        }
-                    }
-                }
-            },
-            DatabricksCredentials(),
-        )
-
-        actual = helper._build_job_permissions()
-
-        expected_owner = {
-            "service_principal_name": "9533b8cc-2d60-46dd-84f2-a39b3939e37a",
-            "permission_level": "IS_OWNER",
-        }
-        expected_viewer_1 = {
-            "permission_level": "CAN_VIEW",
-            "user_name": "reynoldxin@databricks.com",
-        }
-        expected_viewer_2 = {
-            "permission_level": "CAN_VIEW",
-            "user_name": "alighodsi@databricks.com",
-        }
-        expected_runner = {"permission_level": "CAN_MANAGE_RUN", "group_name": "dbt-developers"}
-        expected_manager = {"permission_level": "CAN_MANAGE", "group_name": "dbt-admins"}
-
-        assert expected_owner in actual
-        assert expected_viewer_1 in actual
-        assert expected_viewer_2 in actual
-        assert expected_runner in actual
-        assert expected_manager in actual
-
-
-class TestWorkflowConfig:
-    def default_config(self):
-        return {
-            "alias": "test_model",
-            "database": "test_database",
-            "schema": "test_schema",
-            "config": {
-                "workflow_job_config": {
-                    "email_notifications": "test@example.com",
-                    "max_retries": 2,
-                    "timeout_seconds": 500,
-                },
-                "job_cluster_config": {
-                    "spark_version": "15.3.x-scala2.12",
-                    "node_type_id": "rd-fleet.2xlarge",
-                    "autoscale": {"min_workers": 1, "max_workers": 2},
-                },
-            },
-        }
-
-    @patch("dbt.adapters.databricks.python_models.python_submissions.DatabricksApiClient")
-    def test_build_job_spec_default(self, mock_api_client):
-        job = WorkflowPythonJobHelper(self.default_config(), Mock())
-        result = job._build_job_spec()
-
-        assert result["name"] == "dbt__test_database-test_schema-test_model"
-        assert len(result["tasks"]) == 1
-
-        task = result["tasks"][0]
-        assert task["task_key"] == "inner_notebook"
-        assert task["new_cluster"]["spark_version"] == "15.3.x-scala2.12"
-
-    @patch("dbt.adapters.databricks.python_models.python_submissions.DatabricksApiClient")
-    def test_build_job_spec_custom_name(self, mock_api_client):
-        config = self.default_config()
-        config["config"]["workflow_job_config"]["name"] = "custom_job_name"
-        job = WorkflowPythonJobHelper(config, Mock())
-        result = job._build_job_spec()
-
-        assert result["name"] == "custom_job_name"
-
-    @patch("dbt.adapters.databricks.python_models.python_submissions.DatabricksApiClient")
-    def test_build_job_spec_existing_cluster(self, mock_api_client):
-        config = self.default_config()
-        config["config"]["workflow_job_config"]["existing_cluster_id"] = "cluster-123"
-        del config["config"]["job_cluster_config"]
-
-        job = WorkflowPythonJobHelper(config, Mock())
-        result = job._build_job_spec()
-
-        task = result["tasks"][0]
-        assert task["existing_cluster_id"] == "cluster-123"
-        assert "new_cluster" not in task
-
-    @patch("dbt.adapters.databricks.python_models.python_submissions.DatabricksApiClient")
-    def test_build_job_spec_serverless(self, mock_api_client):
-        config = self.default_config()
-        del config["config"]["job_cluster_config"]
-
-        job = WorkflowPythonJobHelper(config, Mock())
-        result = job._build_job_spec()
-
-        task = result["tasks"][0]
-        assert "existing_cluster_id" not in task
-        assert "new_cluster" not in task
-
-    @patch("dbt.adapters.databricks.python_models.python_submissions.DatabricksApiClient")
-    def test_build_job_spec_with_additional_task_settings(self, mock_api_client):
-        config = self.default_config()
-        config["config"]["workflow_job_config"]["additional_task_settings"] = {
-            "task_key": "my_dbt_task"
-        }
-        job = WorkflowPythonJobHelper(config, Mock())
-        result = job._build_job_spec()
-
-        task = result["tasks"][0]
-        assert task["task_key"] == "my_dbt_task"
-
-    @patch("dbt.adapters.databricks.python_models.python_submissions.DatabricksApiClient")
-    def test_build_job_spec_with_post_hooks(self, mock_api_client):
-        config = self.default_config()
-        config["config"]["workflow_job_config"]["post_hook_tasks"] = [
-            {
-                "depends_on": [{"task_key": "inner_notebook"}],
-                "task_key": "task_b",
-                "notebook_task": {
-                    "notebook_path": "/Workspace/Shared/test_notebook",
-                    "source": "WORKSPACE",
-                },
-                "new_cluster": {
-                    "spark_version": "14.3.x-scala2.12",
-                    "node_type_id": "rd-fleet.2xlarge",
-                    "autoscale": {"min_workers": 1, "max_workers": 2},
-                },
-            }
-        ]
-
-        job = WorkflowPythonJobHelper(config, Mock())
-        result = job._build_job_spec()
-
-        assert len(result["tasks"]) == 2
-        assert result["tasks"][1]["task_key"] == "task_b"
-        assert result["tasks"][1]["new_cluster"]["spark_version"] == "14.3.x-scala2.12"
diff --git a/tests/unit/test_adapter.py b/tests/unit/test_adapter.py
index 9428f3e22..abdea832c 100644
--- a/tests/unit/test_adapter.py
+++ b/tests/unit/test_adapter.py
@@ -246,9 +246,10 @@ def connect(
         ):
             assert server_hostname == "yourorg.databricks.com"
             assert http_path == "sql/protocolv1/o/1234567890123456/1234-567890-test123"
-            if not (expected_no_token or expected_client_creds):
-                assert credentials_provider._token == "dapiXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX"
 
+            if not (expected_no_token or expected_client_creds):
+               k = credentials_provider()()
+               assert credentials_provider()().get("Authorization") == "Bearer dapiXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX"
             if expected_client_creds:
                 assert kwargs.get("client_id") == "foo"
                 assert kwargs.get("client_secret") == "bar"
@@ -540,23 +541,486 @@ def test_parse_relation(self):
             "comment": None,
         }
 
-    def test_non_empty_acl_empty_config(self, _):
-        expected_access_control = {
-            "access_control_list": [
-                {"user_name": "user2", "permission_level": "CAN_VIEW"},
-            ]
+    def test_parse_relation_with_integer_owner(self):
+        self.maxDiff = None
+        rel_type = DatabricksRelation.get_relation_type.Table
+
+        relation = DatabricksRelation.create(
+            schema="default_schema", identifier="mytable", type=rel_type
+        )
+        assert relation.database is None
+
+        # Mimics the output of Spark with a DESCRIBE TABLE EXTENDED
+        plain_rows = [
+            ("col1", "decimal(22,0)", "comment"),
+            ("# Detailed Table Information", None, None),
+            ("Owner", 1234, None),
+        ]
+
+        input_cols = [Row(keys=["col_name", "data_type", "comment"], values=r) for r in plain_rows]
+
+        config = self._get_config()
+        _, rows = DatabricksAdapter(config, get_context("spawn")).parse_describe_extended(
+            relation, input_cols
+        )
+
+        assert rows[0].to_column_dict().get("table_owner") == "1234"
+
+    def test_parse_relation_with_statistics(self):
+        self.maxDiff = None
+        rel_type = DatabricksRelation.get_relation_type.Table
+
+        relation = DatabricksRelation.create(
+            schema="default_schema", identifier="mytable", type=rel_type
+        )
+        assert relation.database is None
+
+        # Mimics the output of Spark with a DESCRIBE TABLE EXTENDED
+        plain_rows = [
+            ("col1", "decimal(22,0)", "comment"),
+            ("# Partition Information", "data_type", None),
+            (None, None, None),
+            ("# Detailed Table Information", None, None),
+            ("Database", None, None),
+            ("Owner", "root", None),
+            ("Created Time", "Wed Feb 04 18:15:00 UTC 1815", None),
+            ("Last Access", "Wed May 20 19:25:00 UTC 1925", None),
+            ("Comment", "Table model description", None),
+            ("Statistics", "1109049927 bytes, 14093476 rows", None),
+            ("Type", "MANAGED", None),
+            ("Provider", "delta", None),
+            ("Location", "/mnt/vo", None),
+            (
+                "Serde Library",
+                "org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe",
+                None,
+            ),
+            ("InputFormat", "org.apache.hadoop.mapred.SequenceFileInputFormat", None),
+            (
+                "OutputFormat",
+                "org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat",
+                None,
+            ),
+            ("Partition Provider", "Catalog", None),
+        ]
+
+        input_cols = [Row(keys=["col_name", "data_type", "comment"], values=r) for r in plain_rows]
+
+        config = self._get_config()
+        metadata, rows = DatabricksAdapter(config, get_context("spawn")).parse_describe_extended(
+            relation, input_cols
+        )
+
+        assert metadata == {
+            None: None,
+            "# Detailed Table Information": None,
+            "Database": None,
+            "Owner": "root",
+            "Created Time": "Wed Feb 04 18:15:00 UTC 1815",
+            "Last Access": "Wed May 20 19:25:00 UTC 1925",
+            "Comment": "Table model description",
+            "Statistics": "1109049927 bytes, 14093476 rows",
+            "Type": "MANAGED",
+            "Provider": "delta",
+            "Location": "/mnt/vo",
+            "Serde Library": "org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe",
+            "InputFormat": "org.apache.hadoop.mapred.SequenceFileInputFormat",
+            "OutputFormat": "org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat",
+            "Partition Provider": "Catalog",
+        }
+
+        assert len(rows) == 1
+        assert rows[0].to_column_dict(omit_none=False) == {
+            "table_database": None,
+            "table_schema": relation.schema,
+            "table_name": relation.name,
+            "table_type": rel_type,
+            "table_owner": "root",
+            "table_comment": "Table model description",
+            "column": "col1",
+            "column_index": 0,
+            "comment": "comment",
+            "dtype": "decimal(22,0)",
+            "numeric_scale": None,
+            "numeric_precision": None,
+            "char_size": None,
+            "stats:bytes:description": "",
+            "stats:bytes:include": True,
+            "stats:bytes:label": "bytes",
+            "stats:bytes:value": 1109049927,
+            "stats:rows:description": "",
+            "stats:rows:include": True,
+            "stats:rows:label": "rows",
+            "stats:rows:value": 14093476,
+        }
+
+    def test_relation_with_database(self):
+        config = self._get_config()
+        adapter = DatabricksAdapter(config, get_context("spawn"))
+        r1 = adapter.Relation.create(schema="different", identifier="table")
+        assert r1.database is None
+        r2 = adapter.Relation.create(database="something", schema="different", identifier="table")
+        assert r2.database == "something"
+
+    def test_parse_columns_from_information_with_table_type_and_delta_provider(self):
+        self.maxDiff = None
+        rel_type = DatabricksRelation.get_relation_type.Table
+
+        # Mimics the output of Spark in the information column
+        information = (
+            "Database: default_schema\n"
+            "Table: mytable\n"
+            "Owner: root\n"
+            "Created Time: Wed Feb 04 18:15:00 UTC 1815\n"
+            "Last Access: Wed May 20 19:25:00 UTC 1925\n"
+            "Created By: Spark 3.0.1\n"
+            "Type: MANAGED\n"
+            "Provider: delta\n"
+            "Statistics: 123456789 bytes\n"
+            "Location: /mnt/vo\n"
+            "Serde Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe\n"
+            "InputFormat: org.apache.hadoop.mapred.SequenceFileInputFormat\n"
+            "OutputFormat: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat\n"
+            "Partition Provider: Catalog\n"
+            "Partition Columns: [`dt`]\n"
+            "Schema: root\n"
+            " |-- col1: decimal(22,0) (nullable = true)\n"
+            " |-- col2: string (nullable = true)\n"
+            " |-- dt: date (nullable = true)\n"
+            " |-- struct_col: struct (nullable = true)\n"
+            " |    |-- struct_inner_col: string (nullable = true)\n"
+        )
+        relation = DatabricksRelation.create(
+            schema="default_schema", identifier="mytable", type=rel_type
+        )
+
+        config = self._get_config()
+        columns = DatabricksAdapter(config, get_context("spawn")).parse_columns_from_information(
+            relation, information
+        )
+        assert len(columns) == 4
+        assert columns[0].to_column_dict(omit_none=False) == {
+            "table_database": None,
+            "table_schema": relation.schema,
+            "table_name": relation.name,
+            "table_type": rel_type,
+            "table_owner": "root",
+            "table_comment": None,
+            "column": "col1",
+            "column_index": 0,
+            "dtype": "decimal(22,0)",
+            "numeric_scale": None,
+            "numeric_precision": None,
+            "char_size": None,
+            "stats:bytes:description": "",
+            "stats:bytes:include": True,
+            "stats:bytes:label": "bytes",
+            "stats:bytes:value": 123456789,
+            "comment": None,
+        }
+
+        assert columns[3].to_column_dict(omit_none=False) == {
+            "table_database": None,
+            "table_schema": relation.schema,
+            "table_name": relation.name,
+            "table_type": rel_type,
+            "table_owner": "root",
+            "table_comment": None,
+            "column": "struct_col",
+            "column_index": 3,
+            "dtype": "struct",
+            "comment": None,
+            "numeric_scale": None,
+            "numeric_precision": None,
+            "char_size": None,
+            "stats:bytes:description": "",
+            "stats:bytes:include": True,
+            "stats:bytes:label": "bytes",
+            "stats:bytes:value": 123456789,
+        }
+
+    def test_parse_columns_from_information_with_view_type(self):
+        self.maxDiff = None
+        rel_type = DatabricksRelation.get_relation_type.View
+        information = (
+            "Database: default_schema\n"
+            "Table: myview\n"
+            "Owner: root\n"
+            "Created Time: Wed Feb 04 18:15:00 UTC 1815\n"
+            "Last Access: UNKNOWN\n"
+            "Created By: Spark 3.0.1\n"
+            "Type: VIEW\n"
+            "View Text: WITH base (\n"
+            "    SELECT * FROM source_table\n"
+            ")\n"
+            "SELECT col1, col2, dt FROM base\n"
+            "View Original Text: WITH base (\n"
+            "    SELECT * FROM source_table\n"
+            ")\n"
+            "SELECT col1, col2, dt FROM base\n"
+            "View Catalog and Namespace: spark_catalog.default\n"
+            "View Query Output Columns: [col1, col2, dt]\n"
+            "Table Properties: [view.query.out.col.1=col1, view.query.out.col.2=col2, "
+            "transient_lastDdlTime=1618324324, view.query.out.col.3=dt, "
+            "view.catalogAndNamespace.part.0=spark_catalog, "
+            "view.catalogAndNamespace.part.1=default]\n"
+            "Serde Library: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe\n"
+            "InputFormat: org.apache.hadoop.mapred.SequenceFileInputFormat\n"
+            "OutputFormat: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat\n"
+            "Storage Properties: [serialization.format=1]\n"
+            "Schema: root\n"
+            " |-- col1: decimal(22,0) (nullable = true)\n"
+            " |-- col2: string (nullable = true)\n"
+            " |-- dt: date (nullable = true)\n"
+            " |-- struct_col: struct (nullable = true)\n"
+            " |    |-- struct_inner_col: string (nullable = true)\n"
+        )
+        relation = DatabricksRelation.create(
+            schema="default_schema", identifier="myview", type=rel_type
+        )
+
+        config = self._get_config()
+        columns = DatabricksAdapter(config, get_context("spawn")).parse_columns_from_information(
+            relation, information
+        )
+        assert len(columns) == 4
+        assert columns[1].to_column_dict(omit_none=False) == {
+            "table_database": None,
+            "table_schema": relation.schema,
+            "table_name": relation.name,
+            "table_type": rel_type,
+            "table_owner": "root",
+            "table_comment": None,
+            "column": "col2",
+            "column_index": 1,
+            "comment": None,
+            "dtype": "string",
+            "numeric_scale": None,
+            "numeric_precision": None,
+            "char_size": None,
+        }
+
+        assert columns[3].to_column_dict(omit_none=False) == {
+            "table_database": None,
+            "table_schema": relation.schema,
+            "table_name": relation.name,
+            "table_type": rel_type,
+            "table_owner": "root",
+            "table_comment": None,
+            "column": "struct_col",
+            "column_index": 3,
+            "comment": None,
+            "dtype": "struct",
+            "numeric_scale": None,
+            "numeric_precision": None,
+            "char_size": None,
+        }
+
+    def test_parse_columns_from_information_with_table_type_and_parquet_provider(self):
+        self.maxDiff = None
+        rel_type = DatabricksRelation.get_relation_type.Table
+
+        information = (
+            "Database: default_schema\n"
+            "Table: mytable\n"
+            "Owner: root\n"
+            "Created Time: Wed Feb 04 18:15:00 UTC 1815\n"
+            "Last Access: Wed May 20 19:25:00 UTC 1925\n"
+            "Created By: Spark 3.0.1\n"
+            "Type: MANAGED\n"
+            "Provider: parquet\n"
+            "Statistics: 1234567890 bytes, 12345678 rows\n"
+            "Location: /mnt/vo\n"
+            "Serde Library: org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe\n"
+            "InputFormat: org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat\n"
+            "OutputFormat: org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat\n"
+            "Schema: root\n"
+            " |-- col1: decimal(22,0) (nullable = true)\n"
+            " |-- col2: string (nullable = true)\n"
+            " |-- dt: date (nullable = true)\n"
+            " |-- struct_col: struct (nullable = true)\n"
+            " |    |-- struct_inner_col: string (nullable = true)\n"
+        )
+        relation = DatabricksRelation.create(
+            schema="default_schema", identifier="mytable", type=rel_type
+        )
+
+        config = self._get_config()
+        columns = DatabricksAdapter(config, get_context("spawn")).parse_columns_from_information(
+            relation, information
+        )
+        assert len(columns) == 4
+        assert columns[2].to_column_dict(omit_none=False) == {
+            "table_database": None,
+            "table_schema": relation.schema,
+            "table_name": relation.name,
+            "table_type": rel_type,
+            "table_owner": "root",
+            "table_comment": None,
+            "column": "dt",
+            "column_index": 2,
+            "comment": None,
+            "dtype": "date",
+            "numeric_scale": None,
+            "numeric_precision": None,
+            "char_size": None,
+            "stats:bytes:description": "",
+            "stats:bytes:include": True,
+            "stats:bytes:label": "bytes",
+            "stats:bytes:value": 1234567890,
+            "stats:rows:description": "",
+            "stats:rows:include": True,
+            "stats:rows:label": "rows",
+            "stats:rows:value": 12345678,
+        }
+
+        assert columns[3].to_column_dict(omit_none=False) == {
+            "table_database": None,
+            "table_schema": relation.schema,
+            "table_name": relation.name,
+            "table_type": rel_type,
+            "table_owner": "root",
+            "table_comment": None,
+            "column": "struct_col",
+            "column_index": 3,
+            "comment": None,
+            "dtype": "struct",
+            "numeric_scale": None,
+            "numeric_precision": None,
+            "char_size": None,
+            "stats:bytes:description": "",
+            "stats:bytes:include": True,
+            "stats:bytes:label": "bytes",
+            "stats:bytes:value": 1234567890,
+            "stats:rows:description": "",
+            "stats:rows:include": True,
+            "stats:rows:label": "rows",
+            "stats:rows:value": 12345678,
+        }
+
+    def test_describe_table_extended_2048_char_limit(self):
+        """GIVEN a list of table_names whos total character length exceeds 2048 characters
+        WHEN the environment variable DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS is "true"
+        THEN the identifier list is replaced with "*"
+        """
+
+        table_names = set([f"customers_{i}" for i in range(200)])
+
+        # By default, don't limit the number of characters
+        assert get_identifier_list_string(table_names) == "|".join(table_names)
+
+        # If environment variable is set, then limit the number of characters
+        with mock.patch.dict("os.environ", **{"DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS": "true"}):
+            # Long list of table names is capped
+            assert get_identifier_list_string(table_names) == "*"
+
+            # Short list of table names is not capped
+            assert get_identifier_list_string(list(table_names)[:5]) == "|".join(
+                list(table_names)[:5]
+            )
+
+    def test_describe_table_extended_should_not_limit(self):
+        """GIVEN a list of table_names whos total character length exceeds 2048 characters
+        WHEN the environment variable DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS is not set
+        THEN the identifier list is not truncated
+        """
+
+        table_names = set([f"customers_{i}" for i in range(200)])
+
+        # By default, don't limit the number of characters
+        assert get_identifier_list_string(table_names) == "|".join(table_names)
+
+    def test_describe_table_extended_should_limit(self):
+        """GIVEN a list of table_names whos total character length exceeds 2048 characters
+        WHEN the environment variable DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS is "true"
+        THEN the identifier list is replaced with "*"
+        """
+
+        table_names = set([f"customers_{i}" for i in range(200)])
+
+        # If environment variable is set, then limit the number of characters
+        with mock.patch.dict("os.environ", **{"DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS": "true"}):
+            # Long list of table names is capped
+            assert get_identifier_list_string(table_names) == "*"
+
+    def test_describe_table_extended_may_limit(self):
+        """GIVEN a list of table_names whos total character length does not 2048 characters
+        WHEN the environment variable DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS is "true"
+        THEN the identifier list is not truncated
+        """
+
+        table_names = set([f"customers_{i}" for i in range(200)])
+
+        # If environment variable is set, then we may limit the number of characters
+        with mock.patch.dict("os.environ", **{"DBT_DESCRIBE_TABLE_2048_CHAR_BYPASS": "true"}):
+            # But a short list of table names is not capped
+            assert get_identifier_list_string(list(table_names)[:5]) == "|".join(
+                list(table_names)[:5]
+            )
+
+
+class TestCheckNotFound:
+    def test_prefix(self):
+        assert check_not_found_error("Runtime error \n Database 'dbt' not found")
+
+    def test_no_prefix_or_suffix(self):
+        assert check_not_found_error("Database not found")
+
+    def test_quotes(self):
+        assert check_not_found_error("Database '`dbt`' not found")
+
+    def test_suffix(self):
+        assert check_not_found_error("Database not found and \n foo")
+
+    def test_error_condition(self):
+        assert check_not_found_error("[SCHEMA_NOT_FOUND]")
+
+    def test_unexpected_error(self):
+        assert not check_not_found_error("[DATABASE_NOT_FOUND]")
+        assert not check_not_found_error("Schema foo not found")
+        assert not check_not_found_error("Database 'foo' not there")
+
+
+class TestGetPersistDocColumns(DatabricksAdapterBase):
+    @pytest.fixture
+    def adapter(self, setUp) -> DatabricksAdapter:
+        return DatabricksAdapter(self._get_config(), get_context("spawn"))
+
+    def create_column(self, name, comment) -> DatabricksColumn:
+        return DatabricksColumn(
+            column=name,
+            dtype="string",
+            comment=comment,
+        )
+
+    def test_get_persist_doc_columns_empty(self, adapter):
+        assert adapter.get_persist_doc_columns([], {}) == {}
+
+    def test_get_persist_doc_columns_no_match(self, adapter):
+        existing = [self.create_column("col1", "comment1")]
+        column_dict = {"col2": {"name": "col2", "description": "comment2"}}
+        assert adapter.get_persist_doc_columns(existing, column_dict) == {}
+
+    def test_get_persist_doc_columns_full_match(self, adapter):
+        existing = [self.create_column("col1", "comment1")]
+        column_dict = {"col1": {"name": "col1", "description": "comment1"}}
+        assert adapter.get_persist_doc_columns(existing, column_dict) == {}
+
+    def test_get_persist_doc_columns_partial_match(self, adapter):
+        existing = [self.create_column("col1", "comment1")]
+        column_dict = {"col1": {"name": "col1", "description": "comment2"}}
+        assert adapter.get_persist_doc_columns(existing, column_dict) == column_dict
+
+    def test_get_persist_doc_columns_mixed(self, adapter):
+        existing = [
+            self.create_column("col1", "comment1"),
+            self.create_column("col2", "comment2"),
+        ]
+        column_dict = {
+            "col1": {"name": "col1", "description": "comment2"},
+            "col2": {"name": "col2", "description": "comment2"},
         }
-        helper = DatabricksTestHelper({"config": expected_access_control}, DatabricksCredentials())
-        assert helper._update_with_acls({}) == expected_access_control
-
-    def test_non_empty_acl_non_empty_config(self, _):
-        expected_access_control = {
-            "access_control_list": [
-                {"user_name": "user2", "permission_level": "CAN_VIEW"},
-            ]
+        expected = {
+            "col1": {"name": "col1", "description": "comment2"},
         }
-        helper = DatabricksTestHelper({"config": expected_access_control}, DatabricksCredentials())
-        assert helper._update_with_acls({"a": "b"}) == {
-            "a": "b",
-            "access_control_list": expected_access_control["access_control_list"],
-        }
\ No newline at end of file
+        assert adapter.get_persist_doc_columns(existing, column_dict) == expected
\ No newline at end of file

From 737f0218c9981d985d327ce671b2f9e27746bfdd Mon Sep 17 00:00:00 2001
From: eric wang <e.wang@databricks.com>
Date: Thu, 31 Oct 2024 00:01:03 -0700
Subject: [PATCH 05/17] fix token test

---
 tests/unit/test_auth.py | 13 +++++--------
 1 file changed, 5 insertions(+), 8 deletions(-)

diff --git a/tests/unit/test_auth.py b/tests/unit/test_auth.py
index ea2dcc00f..de5359e3d 100644
--- a/tests/unit/test_auth.py
+++ b/tests/unit/test_auth.py
@@ -54,7 +54,6 @@ def test_u2m(self):
         headers2 = headers_fn2()
         assert headers == headers2
 
-@pytest.mark.skip(reason="Broken after rewriting auth")
 class TestTokenAuth:
     def test_token(self):
         host = "my.cloud.databricks.com"
@@ -65,20 +64,18 @@ def test_token(self):
             http_path="http://foo",
             schema="dbt",
         )
-        provider = creds.authenticate(None)
+        credentialManager = creds.authenticate()
+        provider = credentialManager.credentials_provider()
         assert provider is not None
 
-        headers_fn = provider()
+        headers_fn = provider
         headers = headers_fn()
         assert headers is not None
 
-        raw = provider.as_dict()
+        raw = credentialManager._config.as_dict()
         assert raw is not None
 
-        provider_b = creds._provider_from_dict()
-        headers_fn2 = provider_b()
-        headers2 = headers_fn2()
-        assert headers == headers2
+        assert headers == {"Authorization":"Bearer foo"}
 
 
 class TestShardedPassword:

From 8c8417c20d8c6b18ae273d2a259577afea5949bf Mon Sep 17 00:00:00 2001
From: eric wang <e.wang@databricks.com>
Date: Thu, 14 Nov 2024 10:07:05 -0800
Subject: [PATCH 06/17] test

---
 dbt/adapters/databricks/connections.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/dbt/adapters/databricks/connections.py b/dbt/adapters/databricks/connections.py
index 474a6ff29..17351429b 100644
--- a/dbt/adapters/databricks/connections.py
+++ b/dbt/adapters/databricks/connections.py
@@ -1217,3 +1217,4 @@ def _get_max_idle_time(query_header_context: Any, creds: DatabricksCredentials)
             )
 
     return max_idle_time
+

From c4aa1a31d67d9d38e8f60c8d33c26c091d356d2a Mon Sep 17 00:00:00 2001
From: eric wang <e.wang@databricks.com>
Date: Thu, 14 Nov 2024 16:24:58 -0800
Subject: [PATCH 07/17] fix test, add lock

---
 dbt/adapters/databricks/credentials.py | 106 +++++++++++++------------
 tests/unit/test_auth.py                |   4 +-
 2 files changed, 58 insertions(+), 52 deletions(-)

diff --git a/dbt/adapters/databricks/credentials.py b/dbt/adapters/databricks/credentials.py
index 4346a4034..0a51ea799 100644
--- a/dbt/adapters/databricks/credentials.py
+++ b/dbt/adapters/databricks/credentials.py
@@ -141,10 +141,10 @@ def validate_creds(self) -> None:
                     "The config '{}' is required to connect to Databricks".format(key)
                 )
         
-        # if not self.token and self.auth_type != "external-browser":
-        #     raise DbtConfigError(
-        #         ("The config `auth_type: oauth` is required when not using access token")
-        #     )
+        if not self.token and self.auth_type != "oauth":
+            raise DbtConfigError(
+                ("The config `auth_type: oauth` is required when not using access token")
+            )
 
         if not self.client_id and self.client_secret:
             raise DbtConfigError(
@@ -276,7 +276,7 @@ class DatabricksCredentialManager(DataClassDictMixin):
     oauth_scopes: List[str] = field(default_factory=lambda: SCOPES)
     token: Optional[str] = None
     auth_type: Optional[str] = None
-
+    
     @classmethod
     def create_from(cls, credentials: DatabricksCredentials) -> "DatabricksCredentialManager":
         return DatabricksCredentialManager(
@@ -313,52 +313,58 @@ def authenticate_with_azure_client_secret(self):
     )
   
     def __post_init__(self) -> None:
-        if self.token:
-            self._config = Config(
-                host=self.host,
-                token=self.token,
-            )
-        else:
-            auth_methods = {
-                "oauth-m2m": self.authenticate_with_oauth_m2m,
-                "azure-client-secret": self.authenticate_with_azure_client_secret,
-                "external-browser": self.authenticate_with_external_browser
-            }
-
-            auth_type = (
-                "external-browser" if not self.client_secret
-                # if the client_secret starts with "dose" then it's likely using oauth-m2m
-                else "oauth-m2m" if self.client_secret.startswith("dose")
-                else "azure-client-secret"
-            )
-
-            if not self.client_secret:
-                auth_sequence = ["external-browser"]
-            elif self.client_secret.startswith("dose"):
-                auth_sequence = ["oauth-m2m", "azure-client-secret"]
+        self._lock = threading.Lock()
+        with self._lock:
+            if hasattr(self, '_config') and self._config is not None:
+                # _config already exists, so skip initialization
+                return
+                
+            if self.token:
+                self._config = Config(
+                    host=self.host,
+                    token=self.token,
+                )
             else:
-                auth_sequence = ["azure-client-secret", "oauth-m2m"]
-
-            exceptions = []
-            for i, auth_type in enumerate(auth_sequence):
-                try:
-                    self._config = auth_methods[auth_type]()
-                    self._config.authenticate()
-                    break  # Exit loop if authentication is successful
-                except Exception as e:
-                    exceptions.append((auth_type, e))
-                    next_auth_type = auth_sequence[i + 1] if i + 1 < len(auth_sequence) else None
-                    if next_auth_type:
-                        logger.warning(
-                            f"Failed to authenticate with {auth_type}, trying {next_auth_type} next. Error: {e}"
-                        )
-                    else:
-                        logger.error(
-                            f"Failed to authenticate with {auth_type}. No more authentication methods to try. Error: {e}"
-                        )
-                        raise Exception(
-                            f"All authentication methods failed. Details: {exceptions}"
-                        )
+                auth_methods = {
+                    "oauth-m2m": self.authenticate_with_oauth_m2m,
+                    "azure-client-secret": self.authenticate_with_azure_client_secret,
+                    "external-browser": self.authenticate_with_external_browser
+                }
+
+                auth_type = (
+                    "external-browser" if not self.client_secret
+                    # if the client_secret starts with "dose" then it's likely using oauth-m2m
+                    else "oauth-m2m" if self.client_secret.startswith("dose")
+                    else "azure-client-secret"
+                )
+
+                if not self.client_secret:
+                    auth_sequence = ["external-browser"]
+                elif self.client_secret.startswith("dose"):
+                    auth_sequence = ["oauth-m2m", "azure-client-secret"]
+                else:
+                    auth_sequence = ["azure-client-secret", "oauth-m2m"]
+
+                exceptions = []
+                for i, auth_type in enumerate(auth_sequence):
+                    try:
+                        # The Config constructor will implicitly init auth and throw if failed
+                        self._config = auth_methods[auth_type]()
+                        break  # Exit loop if authentication is successful
+                    except Exception as e:
+                        exceptions.append((auth_type, e))
+                        next_auth_type = auth_sequence[i + 1] if i + 1 < len(auth_sequence) else None
+                        if next_auth_type:
+                            logger.warning(
+                                f"Failed to authenticate with {auth_type}, trying {next_auth_type} next. Error: {e}"
+                            )
+                        else:
+                            logger.error(
+                                f"Failed to authenticate with {auth_type}. No more authentication methods to try. Error: {e}"
+                            )
+                            raise Exception(
+                                f"All authentication methods failed. Details: {exceptions}"
+                            )
 
 
     @property
diff --git a/tests/unit/test_auth.py b/tests/unit/test_auth.py
index de5359e3d..199f0ddfa 100644
--- a/tests/unit/test_auth.py
+++ b/tests/unit/test_auth.py
@@ -77,7 +77,7 @@ def test_token(self):
 
         assert headers == {"Authorization":"Bearer foo"}
 
-
+@pytest.mark.skip(reason="Cache moved to databricks sdk TokenCache")
 class TestShardedPassword:
     def test_store_and_delete_short_password(self):
         # set the keyring to mock class
@@ -129,7 +129,7 @@ def test_store_and_delete_long_password(self):
         retrieved_password = creds.get_sharded_password(service, host)
         assert retrieved_password is None
 
-
+@pytest.mark.skip(reason="Cache moved to databricks sdk TokenCache")
 class MockKeyring(keyring.backend.KeyringBackend):
     def __init__(self):
         self.file_location = self._generate_test_root_dir()

From 8dcba15874976ff58c0df374192b6b20fe47bb5b Mon Sep 17 00:00:00 2001
From: eric wang <e.wang@databricks.com>
Date: Fri, 15 Nov 2024 16:24:41 -0800
Subject: [PATCH 08/17] update

---
 dbt/adapters/databricks/auth.py        | 105 -------------------
 dbt/adapters/databricks/connections.py |   1 -
 dbt/adapters/databricks/credentials.py | 140 ++++++++++++++++---------
 tests/profiles.py                      |   2 +
 tests/unit/test_adapter.py             |   8 +-
 tests/unit/test_auth.py                |   5 +-
 tests/unit/test_compute_config.py      |   2 +-
 7 files changed, 105 insertions(+), 158 deletions(-)
 delete mode 100644 dbt/adapters/databricks/auth.py

diff --git a/dbt/adapters/databricks/auth.py b/dbt/adapters/databricks/auth.py
deleted file mode 100644
index 8662f794d..000000000
--- a/dbt/adapters/databricks/auth.py
+++ /dev/null
@@ -1,105 +0,0 @@
-from typing import Any
-from typing import Optional
-
-from databricks.sdk.core import Config
-from databricks.sdk.core import credentials_provider
-from databricks.sdk.core import CredentialsProvider
-from databricks.sdk.core import HeaderFactory
-from databricks.sdk.oauth import ClientCredentials
-from databricks.sdk.oauth import Token
-from databricks.sdk.oauth import TokenSource
-from requests import PreparedRequest
-from requests.auth import AuthBase
-
-
-class token_auth(CredentialsProvider):
-    _token: str
-
-    def __init__(self, token: str) -> None:
-        self._token = token
-
-    def auth_type(self) -> str:
-        return "token"
-
-    def as_dict(self) -> dict:
-        return {"token": self._token}
-
-    @staticmethod
-    def from_dict(raw: Optional[dict]) -> Optional[CredentialsProvider]:
-        if not raw:
-            return None
-        return token_auth(raw["token"])
-
-    def __call__(self, _: Optional[Config] = None) -> HeaderFactory:
-        static_credentials = {"Authorization": f"Bearer {self._token}"}
-
-        def inner() -> dict[str, str]:
-            return static_credentials
-
-        return inner
-
-
-class m2m_auth(CredentialsProvider):
-    _token_source: Optional[TokenSource] = None
-
-    def __init__(self, host: str, client_id: str, client_secret: str) -> None:
-        @credentials_provider("noop", [])
-        def noop_credentials(_: Any):  # type: ignore
-            return lambda: {}
-
-        config = Config(host=host, credentials_provider=noop_credentials)
-        oidc = config.oidc_endpoints
-        scopes = ["all-apis"]
-        if not oidc:
-            raise ValueError(f"{host} does not support OAuth")
-        if config.is_azure:
-            # Azure AD only supports full access to Azure Databricks.
-            scopes = [f"{config.effective_azure_login_app_id}/.default"]
-        self._token_source = ClientCredentials(
-            client_id=client_id,
-            client_secret=client_secret,
-            token_url=oidc.token_endpoint,
-            scopes=scopes,
-            use_header="microsoft" not in oidc.token_endpoint,
-            use_params="microsoft" in oidc.token_endpoint,
-        )
-
-    def auth_type(self) -> str:
-        return "oauth"
-
-    def as_dict(self) -> dict:
-        if self._token_source:
-            return {"token": self._token_source.token().as_dict()}
-        else:
-            return {"token": {}}
-
-    @staticmethod
-    def from_dict(host: str, client_id: str, client_secret: str, raw: dict) -> CredentialsProvider:
-        c = m2m_auth(host=host, client_id=client_id, client_secret=client_secret)
-        c._token_source._token = Token.from_dict(raw["token"])  # type: ignore
-        return c
-
-    def __call__(self, _: Optional[Config] = None) -> HeaderFactory:
-        def inner() -> dict[str, str]:
-            token = self._token_source.token()  # type: ignore
-            return {"Authorization": f"{token.token_type} {token.access_token}"}
-
-        return inner
-
-
-class BearerAuth(AuthBase):
-    """This mix-in is passed to our requests Session to explicitly
-    use the bearer authentication method.
-
-    Without this, a local .netrc file in the user's home directory
-    will override the auth headers provided by our header_factory.
-
-    More details in issue #337.
-    """
-
-    def __init__(self, header_factory: HeaderFactory):
-        self.header_factory = header_factory
-
-    def __call__(self, r: PreparedRequest) -> PreparedRequest:
-        r.headers.update(**self.header_factory())
-        return r
diff --git a/dbt/adapters/databricks/connections.py b/dbt/adapters/databricks/connections.py
index 17351429b..474a6ff29 100644
--- a/dbt/adapters/databricks/connections.py
+++ b/dbt/adapters/databricks/connections.py
@@ -1217,4 +1217,3 @@ def _get_max_idle_time(query_header_context: Any, creds: DatabricksCredentials)
             )
 
     return max_idle_time
-
diff --git a/dbt/adapters/databricks/credentials.py b/dbt/adapters/databricks/credentials.py
index 0a51ea799..b8a711de6 100644
--- a/dbt/adapters/databricks/credentials.py
+++ b/dbt/adapters/databricks/credentials.py
@@ -10,8 +10,6 @@
 from typing import Callable, Dict, List
 from typing import cast
 from typing import Optional
-from typing import Tuple
-from typing import Union
 
 from databricks.sdk import WorkspaceClient
 from databricks.sdk.core import Config
@@ -49,6 +47,8 @@ class DatabricksCredentials(Credentials):
     token: Optional[str] = None
     client_id: Optional[str] = None
     client_secret: Optional[str] = None
+    azure_client_id: Optional[str] = None
+    azure_client_secret: Optional[str] = None
     oauth_redirect_url: Optional[str] = None
     oauth_scopes: Optional[list[str]] = None
     session_properties: Optional[dict[str, Any]] = None
@@ -118,7 +118,9 @@ def __post_init__(self) -> None:
             "_user_agent_entry",
         ):
             if key in connection_parameters:
-                raise DbtValidationError(f"The connection parameter `{key}` is reserved.")
+                raise DbtValidationError(
+                    f"The connection parameter `{key}` is reserved."
+                )
         if "http_headers" in connection_parameters:
             http_headers = connection_parameters["http_headers"]
             if not isinstance(http_headers, dict) or any(
@@ -140,10 +142,12 @@ def validate_creds(self) -> None:
                 raise DbtConfigError(
                     "The config '{}' is required to connect to Databricks".format(key)
                 )
-        
+
         if not self.token and self.auth_type != "oauth":
             raise DbtConfigError(
-                ("The config `auth_type: oauth` is required when not using access token")
+                (
+                    "The config `auth_type: oauth` is required when not using access token"
+                )
             )
 
         if not self.client_id and self.client_secret:
@@ -154,6 +158,16 @@ def validate_creds(self) -> None:
                 )
             )
 
+        if (not self.azure_client_id and self.azure_client_secret) or (
+            self.azure_client_id and not self.azure_client_secret
+        ):
+            raise DbtConfigError(
+                (
+                    "The config 'azure_client_id' and 'azure_client_secret' "
+                    "must be both present or both absent"
+                )
+            )
+
     @classmethod
     def get_invocation_env(cls) -> Optional[str]:
         invocation_env = os.environ.get(DBT_DATABRICKS_INVOCATION_ENV)
@@ -161,11 +175,15 @@ def get_invocation_env(cls) -> Optional[str]:
             # Thrift doesn't allow nested () so we need to ensure
             # that the passed user agent is valid.
             if not DBT_DATABRICKS_INVOCATION_ENV_REGEX.search(invocation_env):
-                raise DbtValidationError(f"Invalid invocation environment: {invocation_env}")
+                raise DbtValidationError(
+                    f"Invalid invocation environment: {invocation_env}"
+                )
         return invocation_env
 
     @classmethod
-    def get_all_http_headers(cls, user_http_session_headers: dict[str, str]) -> dict[str, str]:
+    def get_all_http_headers(
+        cls, user_http_session_headers: dict[str, str]
+    ) -> dict[str, str]:
         http_session_headers_str: Optional[str] = os.environ.get(
             DBT_DATABRICKS_HTTP_SESSION_HEADERS
         )
@@ -200,13 +218,17 @@ def type(self) -> str:
     def unique_field(self) -> str:
         return cast(str, self.host)
 
-    def connection_info(self, *, with_aliases: bool = False) -> Iterable[tuple[str, Any]]:
+    def connection_info(
+        self, *, with_aliases: bool = False
+    ) -> Iterable[tuple[str, Any]]:
         as_dict = self.to_dict(omit_none=False)
         connection_keys = set(self._connection_keys(with_aliases=with_aliases))
         aliases: list[str] = []
         if with_aliases:
             aliases = [k for k, v in self._ALIASES.items() if v in connection_keys]
-        for key in itertools.chain(self._connection_keys(with_aliases=with_aliases), aliases):
+        for key in itertools.chain(
+            self._connection_keys(with_aliases=with_aliases), aliases
+        ):
             if key in as_dict:
                 yield key, as_dict[key]
 
@@ -272,101 +294,125 @@ class DatabricksCredentialManager(DataClassDictMixin):
     host: str
     client_id: str
     client_secret: str
+    azure_client_id: Optional[str] = None
+    azure_client_secret: Optional[str] = None
     oauth_redirect_url: str = REDIRECT_URL
     oauth_scopes: List[str] = field(default_factory=lambda: SCOPES)
     token: Optional[str] = None
     auth_type: Optional[str] = None
-    
+
     @classmethod
-    def create_from(cls, credentials: DatabricksCredentials) -> "DatabricksCredentialManager":
+    def create_from(
+        cls, credentials: DatabricksCredentials
+    ) -> "DatabricksCredentialManager":
+        if credentials.host is None:
+            raise ValueError("host cannot be None")
         return DatabricksCredentialManager(
             host=credentials.host,
             token=credentials.token,
             client_id=credentials.client_id or CLIENT_ID,
             client_secret=credentials.client_secret or "",
+            azure_client_id=credentials.azure_client_id,
+            azure_client_secret=credentials.azure_client_secret,
             oauth_redirect_url=credentials.oauth_redirect_url or REDIRECT_URL,
             oauth_scopes=credentials.oauth_scopes or SCOPES,
             auth_type=credentials.auth_type,
         )
-    def authenticate_with_oauth_m2m(self):
+
+    def authenticate_with_pat(self) -> Config:
+        return Config(
+            host=self.host,
+            token=self.token,
+        )
+
+    def authenticate_with_oauth_m2m(self) -> Config:
         return Config(
             host=self.host,
             client_id=self.client_id,
             client_secret=self.client_secret,
-            auth_type="oauth-m2m"
-    )
+            auth_type="oauth-m2m",
+        )
 
-    def authenticate_with_external_browser(self):
+    def authenticate_with_external_browser(self) -> Config:
         return Config(
             host=self.host,
             client_id=self.client_id,
             client_secret=self.client_secret,
-            auth_type="external-browser"
-    )
+            auth_type="external-browser",
+        )
 
-    def authenticate_with_azure_client_secret(self):
+    def legacy_authenticate_with_azure_client_secret(self) -> Config:
         return Config(
             host=self.host,
             azure_client_id=self.client_id,
             azure_client_secret=self.client_secret,
-            auth_type="azure-client-secret"
-    )
-  
+            auth_type="azure-client-secret",
+        )
+
+    def authenticate_with_azure_client_secret(self) -> Config:
+        return Config(
+            host=self.host,
+            azure_client_id=self.azure_client_id,
+            azure_client_secret=self.azure_client_secret,
+            auth_type="azure-client-secret",
+        )
+
     def __post_init__(self) -> None:
         self._lock = threading.Lock()
         with self._lock:
-            if hasattr(self, '_config') and self._config is not None:
-                # _config already exists, so skip initialization
+            if not hasattr(self, "_config"):
+                self._config: Optional[Config] = None
+            if self._config is not None:
                 return
-                
+
             if self.token:
-                self._config = Config(
-                    host=self.host,
-                    token=self.token,
-                )
+                self._config = self.authenticate_with_pat()
+            elif self.azure_client_id and self.azure_client_secret:
+                self._config = self.authenticate_with_azure_client_secret()
+            elif not self.client_secret:
+                self._config = self.authenticate_with_external_browser()
             else:
                 auth_methods = {
                     "oauth-m2m": self.authenticate_with_oauth_m2m,
-                    "azure-client-secret": self.authenticate_with_azure_client_secret,
-                    "external-browser": self.authenticate_with_external_browser
+                    "legacy-azure-client-secret": self.legacy_authenticate_with_azure_client_secret,
                 }
 
-                auth_type = (
-                    "external-browser" if not self.client_secret
-                    # if the client_secret starts with "dose" then it's likely using oauth-m2m
-                    else "oauth-m2m" if self.client_secret.startswith("dose")
-                    else "azure-client-secret"
-                )
-
-                if not self.client_secret:
-                    auth_sequence = ["external-browser"]
-                elif self.client_secret.startswith("dose"):
-                    auth_sequence = ["oauth-m2m", "azure-client-secret"]
+                # If the secret starts with dose, high chance is it is a databricks secret
+                if self.client_secret.startswith("dose"):
+                    auth_sequence = ["oauth-m2m", "legacy-azure-client-secret"]
                 else:
-                    auth_sequence = ["azure-client-secret", "oauth-m2m"]
+                    auth_sequence = ["legacy-azure-client-secret", "oauth-m2m"]
 
                 exceptions = []
                 for i, auth_type in enumerate(auth_sequence):
                     try:
                         # The Config constructor will implicitly init auth and throw if failed
                         self._config = auth_methods[auth_type]()
+                        if auth_type == "legacy-azure-client-secret":
+                            logger.warning(
+                                "You are using Azure Service Principal, "
+                                "please use 'azure_client_id' and 'azure_client_secret' instead."
+                            )
                         break  # Exit loop if authentication is successful
                     except Exception as e:
                         exceptions.append((auth_type, e))
-                        next_auth_type = auth_sequence[i + 1] if i + 1 < len(auth_sequence) else None
+                        next_auth_type = (
+                            auth_sequence[i + 1] if i + 1 < len(auth_sequence) else None
+                        )
                         if next_auth_type:
                             logger.warning(
-                                f"Failed to authenticate with {auth_type}, trying {next_auth_type} next. Error: {e}"
+                                f"Failed to authenticate with {auth_type}, "
+                                f"trying {next_auth_type} next. Error: {e}"
                             )
                         else:
                             logger.error(
-                                f"Failed to authenticate with {auth_type}. No more authentication methods to try. Error: {e}"
+                                f"Failed to authenticate with {auth_type}. "
+                                f"No more authentication methods to try. Error: {e}"
                             )
                             raise Exception(
                                 f"All authentication methods failed. Details: {exceptions}"
                             )
 
-
     @property
     def api_client(self) -> WorkspaceClient:
         return WorkspaceClient(config=self._config)
@@ -386,4 +432,4 @@ def header_factory(self) -> CredentialsProvider:
 
     @property
     def config(self) -> Config:
-        return self._config
\ No newline at end of file
+        return self._config
diff --git a/tests/profiles.py b/tests/profiles.py
index e34c5073f..37b86f008 100644
--- a/tests/profiles.py
+++ b/tests/profiles.py
@@ -27,6 +27,8 @@ def _build_databricks_cluster_target(
         "token": os.getenv("DBT_DATABRICKS_TOKEN"),
         "client_id": os.getenv("DBT_DATABRICKS_CLIENT_ID"),
         "client_secret": os.getenv("DBT_DATABRICKS_CLIENT_SECRET"),
+        "azure_client_id": os.getenv("DBT_DATABRICKS_AZURE_CLIENT_ID"),
+        "azure_client_secret": os.getenv("DBT_DATABRICKS_AZURE_CLIENT_SECRET"),
         "connect_retries": 3,
         "connect_timeout": 5,
         "retry_all": True,
diff --git a/tests/unit/test_adapter.py b/tests/unit/test_adapter.py
index abdea832c..3d60f7707 100644
--- a/tests/unit/test_adapter.py
+++ b/tests/unit/test_adapter.py
@@ -248,8 +248,10 @@ def connect(
             assert http_path == "sql/protocolv1/o/1234567890123456/1234-567890-test123"
 
             if not (expected_no_token or expected_client_creds):
-               k = credentials_provider()()
-               assert credentials_provider()().get("Authorization") == "Bearer dapiXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX"
+                assert (
+                    credentials_provider()().get("Authorization")
+                    == "Bearer dapiXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX"
+                )
             if expected_client_creds:
                 assert kwargs.get("client_id") == "foo"
                 assert kwargs.get("client_secret") == "bar"
@@ -1023,4 +1025,4 @@ def test_get_persist_doc_columns_mixed(self, adapter):
         expected = {
             "col1": {"name": "col1", "description": "comment2"},
         }
-        assert adapter.get_persist_doc_columns(existing, column_dict) == expected
\ No newline at end of file
+        assert adapter.get_persist_doc_columns(existing, column_dict) == expected
diff --git a/tests/unit/test_auth.py b/tests/unit/test_auth.py
index 199f0ddfa..6571c9cb2 100644
--- a/tests/unit/test_auth.py
+++ b/tests/unit/test_auth.py
@@ -54,6 +54,7 @@ def test_u2m(self):
         headers2 = headers_fn2()
         assert headers == headers2
 
+
 class TestTokenAuth:
     def test_token(self):
         host = "my.cloud.databricks.com"
@@ -75,7 +76,8 @@ def test_token(self):
         raw = credentialManager._config.as_dict()
         assert raw is not None
 
-        assert headers == {"Authorization":"Bearer foo"}
+        assert headers == {"Authorization": "Bearer foo"}
+
 
 @pytest.mark.skip(reason="Cache moved to databricks sdk TokenCache")
 class TestShardedPassword:
@@ -129,6 +131,7 @@ def test_store_and_delete_long_password(self):
         retrieved_password = creds.get_sharded_password(service, host)
         assert retrieved_password is None
 
+
 @pytest.mark.skip(reason="Cache moved to databricks sdk TokenCache")
 class MockKeyring(keyring.backend.KeyringBackend):
     def __init__(self):
diff --git a/tests/unit/test_compute_config.py b/tests/unit/test_compute_config.py
index 625bee9d2..6409bcc7f 100644
--- a/tests/unit/test_compute_config.py
+++ b/tests/unit/test_compute_config.py
@@ -21,7 +21,7 @@ def path(self):
 
     @pytest.fixture
     def creds(self, path):
-          with patch("dbt.adapters.databricks.credentials.Config"):
+        with patch("dbt.adapters.databricks.credentials.Config"):
             return DatabricksCredentials(http_path=path)
 
     @pytest.fixture

From 55de1681cfeda7f19be335b7a115305dbddefc82 Mon Sep 17 00:00:00 2001
From: eric wang <e.wang@databricks.com>
Date: Fri, 15 Nov 2024 17:08:25 -0800
Subject: [PATCH 09/17] update

---
 dbt/adapters/databricks/api_client.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/dbt/adapters/databricks/api_client.py b/dbt/adapters/databricks/api_client.py
index 16e069dd5..2886d0a5d 100644
--- a/dbt/adapters/databricks/api_client.py
+++ b/dbt/adapters/databricks/api_client.py
@@ -499,8 +499,7 @@ def create(
         http_headers = credentials.get_all_http_headers(
             connection_parameters.pop("http_headers", {})
         )
-        credentials_provider = credentials.authenticate().credentials_provider
-        header_factory = credentials_provider()  # type: ignore
+        header_factory = credentials.authenticate().credentials_provider  # type: ignore
         session.auth = BearerAuth(header_factory)
 
         session.headers.update({"User-Agent": user_agent, **http_headers})

From 19b9f4d36b00782430016e7f28acd2163a1ac9fd Mon Sep 17 00:00:00 2001
From: eric wang <e.wang@databricks.com>
Date: Tue, 19 Nov 2024 11:38:13 -0800
Subject: [PATCH 10/17] fix test

---
 dbt/adapters/databricks/api_client.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dbt/adapters/databricks/api_client.py b/dbt/adapters/databricks/api_client.py
index 2886d0a5d..c49ff9bba 100644
--- a/dbt/adapters/databricks/api_client.py
+++ b/dbt/adapters/databricks/api_client.py
@@ -499,7 +499,7 @@ def create(
         http_headers = credentials.get_all_http_headers(
             connection_parameters.pop("http_headers", {})
         )
-        header_factory = credentials.authenticate().credentials_provider  # type: ignore
+        header_factory = credentials.authenticate().credentials_provider()  # type: ignore
         session.auth = BearerAuth(header_factory)
 
         session.headers.update({"User-Agent": user_agent, **http_headers})

From cd5d383b097826daa0a9200a0d49dd9fe5be4b83 Mon Sep 17 00:00:00 2001
From: Eric Wang <e.wang@databricks.com>
Date: Wed, 29 Jan 2025 16:25:08 -0800
Subject: [PATCH 11/17] remove unneeded files

---
 pyproject.toml   | 14 ++++-----
 requirements.txt |  9 ------
 setup.py         | 81 ------------------------------------------------
 3 files changed, 7 insertions(+), 97 deletions(-)
 delete mode 100644 requirements.txt
 delete mode 100644 setup.py

diff --git a/pyproject.toml b/pyproject.toml
index 7ea32d511..52a8e7a0d 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -22,12 +22,12 @@ classifiers = [
     "Programming Language :: Python :: 3.12",
 ]
 dependencies = [
-    "databricks-sdk==0.17.0",
+    "databricks-sdk==0.41.0",
     "databricks-sql-connector>=3.5.0, <4.0.0",
-    "dbt-adapters>=1.9.0, <2.0",
-    "dbt-common>=1.12.0, <2.0",
-    "dbt-core>=1.8.7, <2.0",
-    "dbt-spark>=1.8.0, <2.0",
+    "dbt-adapters>=1.10.3, <2.0",
+    "dbt-common>=1.13.0, <2.0",
+    "dbt-core>=1.9.0rc2, <2.0",
+    "dbt-spark>=1.9.0b1, <2.0",
     "keyring>=23.13.0",
     "pydantic>=1.10.0",
 ]
@@ -65,10 +65,10 @@ check-sdist = [
 [tool.hatch.envs.default]
 dependencies = [
     "dbt_common @ git+https://github.com/dbt-labs/dbt-common.git",
-    "dbt-adapters @ git+https://github.com/dbt-labs/dbt-adapters.git#subdirectory=dbt-adapters",
+    "dbt-adapters @ git+https://github.com/dbt-labs/dbt-adapters.git@main",
     "dbt-core @ git+https://github.com/dbt-labs/dbt-core.git@main#subdirectory=core",
     "dbt-tests-adapter @ git+https://github.com/dbt-labs/dbt-adapters.git@main#subdirectory=dbt-tests-adapter",
-    "dbt-spark @ git+https://github.com/dbt-labs/dbt-adapters.git#subdirectory=dbt-spark",
+    "dbt-spark @ git+https://github.com/dbt-labs/dbt-spark.git@main",
     "pytest",
     "pytest-xdist",
     "pytest-dotenv",
diff --git a/requirements.txt b/requirements.txt
deleted file mode 100644
index 19d9d46fa..000000000
--- a/requirements.txt
+++ /dev/null
@@ -1,9 +0,0 @@
-databricks-sql-connector>=3.5.0, <4.0
-dbt-spark>=1.8.0, <2.0
-dbt-core>=1.8.7, <2.0
-dbt-common>=1.10.0, <2.0
-dbt-adapters>=1.7.0, <2.0
-databricks-sdk==0.36.0
-keyring>=23.13.0
-protobuf<5.0.0
-pydantic>=1.10.0, <2
diff --git a/setup.py b/setup.py
deleted file mode 100644
index e4ff4f297..000000000
--- a/setup.py
+++ /dev/null
@@ -1,81 +0,0 @@
-#!/usr/bin/env python
-import os
-import sys
-
-# require python 3.9 or newer
-if sys.version_info < (3, 9):
-    print("Error: dbt does not support this version of Python.")
-    print("Please upgrade to Python 3.9 or higher.")
-    sys.exit(1)
-
-
-# require version of setuptools that supports find_namespace_packages
-from setuptools import setup
-
-try:
-    from setuptools import find_namespace_packages
-except ImportError:
-    # the user has a downlevel version of setuptools.
-    print("Error: dbt requires setuptools v40.1.0 or higher.")
-    print('Please upgrade setuptools with "pip install --upgrade setuptools" and try again')
-    sys.exit(1)
-
-
-# pull long description from README
-this_directory = os.path.abspath(os.path.dirname(__file__))
-with open(os.path.join(this_directory, "README.md"), "r", encoding="utf8") as f:
-    long_description = f.read()
-
-
-# get this package's version from dbt/adapters/<name>/__version__.py
-def _get_plugin_version() -> str:
-    _version_path = os.path.join(this_directory, "dbt", "adapters", "databricks", "__version__.py")
-    try:
-        exec(open(_version_path).read())
-        return locals()["version"]
-    except IOError:
-        print("Failed to load dbt-databricks version file for packaging.", file=sys.stderr)
-        sys.exit(-1)
-
-
-package_name = "dbt-databricks"
-package_version = _get_plugin_version()
-description = """The Databricks adapter plugin for dbt"""
-
-setup(
-    name=package_name,
-    version=package_version,
-    description=description,
-    long_description=long_description,
-    long_description_content_type="text/markdown",
-    author="Databricks",
-    author_email="feedback@databricks.com",
-    url="https://github.com/databricks/dbt-databricks",
-    packages=find_namespace_packages(include=["dbt", "dbt.*"]),
-    include_package_data=True,
-    install_requires=[
-        "dbt-spark>=1.8.0, <2.0",
-        "dbt-core>=1.8.7, <2.0",
-        "dbt-adapters>=1.7.0, <2.0",
-        "dbt-common>=1.10.0, <2.0",
-        "databricks-sql-connector>=3.5.0, <4.0.0",
-        "databricks-sdk==0.36.0",
-        "keyring>=23.13.0",
-        "pandas<2.2.0",
-        "protobuf<5.0.0",
-        "pydantic>=1.10.0, <2",
-    ],
-    zip_safe=False,
-    classifiers=[
-        "Development Status :: 5 - Production/Stable",
-        "License :: OSI Approved :: Apache Software License",
-        "Operating System :: Microsoft :: Windows",
-        "Operating System :: MacOS :: MacOS X",
-        "Operating System :: POSIX :: Linux",
-        "Programming Language :: Python :: 3.9",
-        "Programming Language :: Python :: 3.10",
-        "Programming Language :: Python :: 3.11",
-        "Programming Language :: Python :: 3.12",
-    ],
-    python_requires=">=3.9",
-)

From e6a6177e620c058cda292c8df78a5dfe62666c0b Mon Sep 17 00:00:00 2001
From: Eric Wang <e.wang@databricks.com>
Date: Wed, 29 Jan 2025 16:30:13 -0800
Subject: [PATCH 12/17] update

---
 pyproject.toml | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 52a8e7a0d..7b8563fdf 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -24,10 +24,10 @@ classifiers = [
 dependencies = [
     "databricks-sdk==0.41.0",
     "databricks-sql-connector>=3.5.0, <4.0.0",
-    "dbt-adapters>=1.10.3, <2.0",
-    "dbt-common>=1.13.0, <2.0",
-    "dbt-core>=1.9.0rc2, <2.0",
-    "dbt-spark>=1.9.0b1, <2.0",
+    "dbt-adapters>=1.9.0, <2.0",
+    "dbt-common>=1.12.0, <2.0",
+    "dbt-core>=1.8.7, <2.0",
+    "dbt-spark>=1.8.0, <2.0",
     "keyring>=23.13.0",
     "pydantic>=1.10.0",
 ]
@@ -65,10 +65,10 @@ check-sdist = [
 [tool.hatch.envs.default]
 dependencies = [
     "dbt_common @ git+https://github.com/dbt-labs/dbt-common.git",
-    "dbt-adapters @ git+https://github.com/dbt-labs/dbt-adapters.git@main",
+    "dbt-adapters @ git+https://github.com/dbt-labs/dbt-adapters.git#subdirectory=dbt-adapters",
     "dbt-core @ git+https://github.com/dbt-labs/dbt-core.git@main#subdirectory=core",
     "dbt-tests-adapter @ git+https://github.com/dbt-labs/dbt-adapters.git@main#subdirectory=dbt-tests-adapter",
-    "dbt-spark @ git+https://github.com/dbt-labs/dbt-spark.git@main",
+    "dbt-spark @ git+https://github.com/dbt-labs/dbt-adapters.git#subdirectory=dbt-spark",
     "pytest",
     "pytest-xdist",
     "pytest-dotenv",

From 4e3acd081a8462f7da440edcadfeb7e2e333568d Mon Sep 17 00:00:00 2001
From: Eric Wang <e.wang@databricks.com>
Date: Thu, 30 Jan 2025 23:21:20 -0800
Subject: [PATCH 13/17] fix test

---
 dbt/adapters/databricks/auth.py        | 100 -------------------------
 dbt/adapters/databricks/connections.py |   6 +-
 dbt/adapters/databricks/credentials.py |  16 ++--
 3 files changed, 12 insertions(+), 110 deletions(-)
 delete mode 100644 dbt/adapters/databricks/auth.py

diff --git a/dbt/adapters/databricks/auth.py b/dbt/adapters/databricks/auth.py
deleted file mode 100644
index 439fa23fd..000000000
--- a/dbt/adapters/databricks/auth.py
+++ /dev/null
@@ -1,100 +0,0 @@
-from typing import Any, Optional
-
-from requests import PreparedRequest
-from requests.auth import AuthBase
-
-from databricks.sdk.core import Config, CredentialsProvider, HeaderFactory, credentials_provider
-from databricks.sdk.oauth import ClientCredentials, Token, TokenSource
-
-
-class token_auth(CredentialsProvider):
-    _token: str
-
-    def __init__(self, token: str) -> None:
-        self._token = token
-
-    def auth_type(self) -> str:
-        return "token"
-
-    def as_dict(self) -> dict:
-        return {"token": self._token}
-
-    @staticmethod
-    def from_dict(raw: Optional[dict]) -> Optional[CredentialsProvider]:
-        if not raw:
-            return None
-        return token_auth(raw["token"])
-
-    def __call__(self, _: Optional[Config] = None) -> HeaderFactory:
-        static_credentials = {"Authorization": f"Bearer {self._token}"}
-
-        def inner() -> dict[str, str]:
-            return static_credentials
-
-        return inner
-
-
-class m2m_auth(CredentialsProvider):
-    _token_source: Optional[TokenSource] = None
-
-    def __init__(self, host: str, client_id: str, client_secret: str) -> None:
-        @credentials_provider("noop", [])
-        def noop_credentials(_: Any):  # type: ignore
-            return lambda: {}
-
-        config = Config(host=host, credentials_provider=noop_credentials)
-        oidc = config.oidc_endpoints
-        scopes = ["all-apis"]
-        if not oidc:
-            raise ValueError(f"{host} does not support OAuth")
-        if config.is_azure:
-            # Azure AD only supports full access to Azure Databricks.
-            scopes = [f"{config.effective_azure_login_app_id}/.default"]
-        self._token_source = ClientCredentials(
-            client_id=client_id,
-            client_secret=client_secret,
-            token_url=oidc.token_endpoint,
-            scopes=scopes,
-            use_header="microsoft" not in oidc.token_endpoint,
-            use_params="microsoft" in oidc.token_endpoint,
-        )
-
-    def auth_type(self) -> str:
-        return "oauth"
-
-    def as_dict(self) -> dict:
-        if self._token_source:
-            return {"token": self._token_source.token().as_dict()}
-        else:
-            return {"token": {}}
-
-    @staticmethod
-    def from_dict(host: str, client_id: str, client_secret: str, raw: dict) -> CredentialsProvider:
-        c = m2m_auth(host=host, client_id=client_id, client_secret=client_secret)
-        c._token_source._token = Token.from_dict(raw["token"])  # type: ignore
-        return c
-
-    def __call__(self, _: Optional[Config] = None) -> HeaderFactory:
-        def inner() -> dict[str, str]:
-            token = self._token_source.token()  # type: ignore
-            return {"Authorization": f"{token.token_type} {token.access_token}"}
-
-        return inner
-
-
-class BearerAuth(AuthBase):
-    """This mix-in is passed to our requests Session to explicitly
-    use the bearer authentication method.
-
-    Without this, a local .netrc file in the user's home directory
-    will override the auth headers provided by our header_factory.
-
-    More details in issue #337.
-    """
-
-    def __init__(self, header_factory: HeaderFactory):
-        self.header_factory = header_factory
-
-    def __call__(self, r: PreparedRequest) -> PreparedRequest:
-        r.headers.update(**self.header_factory())
-        return r
diff --git a/dbt/adapters/databricks/connections.py b/dbt/adapters/databricks/connections.py
index bedd7a980..971a910f7 100644
--- a/dbt/adapters/databricks/connections.py
+++ b/dbt/adapters/databricks/connections.py
@@ -32,7 +32,11 @@
 )
 from dbt.adapters.databricks.__version__ import version as __version__
 from dbt.adapters.databricks.api_client import DatabricksApiClient
-from dbt.adapters.databricks.credentials import BearerAuth, DatabricksCredentials, DatabricksCredentialManager
+from dbt.adapters.databricks.credentials import (
+    BearerAuth,
+    DatabricksCredentials,
+    DatabricksCredentialManager,
+)
 from dbt.adapters.databricks.events.connection_events import (
     ConnectionAcquire,
     ConnectionCancel,
diff --git a/dbt/adapters/databricks/credentials.py b/dbt/adapters/databricks/credentials.py
index b04f5c250..1c897df19 100644
--- a/dbt/adapters/databricks/credentials.py
+++ b/dbt/adapters/databricks/credentials.py
@@ -5,25 +5,23 @@
 import threading
 from collections.abc import Iterable
 from dataclasses import dataclass
-from typing import Any, Optional, Union, cast
+from dataclasses import field
+from typing import Any, Optional, Callable, Dict, List, cast
 
-import keyring
 from dbt_common.exceptions import DbtConfigError, DbtValidationError
 
 from databricks.sdk import WorkspaceClient
 from databricks.sdk.core import Config
 from databricks.sdk.core import CredentialsProvider
-from databricks.sdk.oauth import OAuthClient, SessionCredentials
 from dbt.adapters.contracts.connection import Credentials
-from dbt.adapters.databricks.auth import m2m_auth, token_auth
-from dbt.adapters.databricks.events.credential_events import (
-    CredentialLoadError,
-    CredentialSaveError,
-    CredentialShardEvent,
-)
 from dbt.adapters.databricks.global_state import GlobalState
 from dbt.adapters.databricks.logging import logger
 
+from mashumaro import DataClassDictMixin
+from requests import PreparedRequest
+from requests.auth import AuthBase
+from dbt.adapters.databricks.logging import logger
+
 CATALOG_KEY_IN_SESSION_PROPERTIES = "databricks.catalog"
 DBT_DATABRICKS_INVOCATION_ENV_REGEX = re.compile("^[A-z0-9\\-]+$")
 EXTRACT_CLUSTER_ID_FROM_HTTP_PATH_REGEX = re.compile(r"/?sql/protocolv1/o/\d+/(.*)")

From 8a8d96cae5abc564d8907267536c303a6fba0971 Mon Sep 17 00:00:00 2001
From: Eric Wang <e.wang@databricks.com>
Date: Thu, 30 Jan 2025 23:48:54 -0800
Subject: [PATCH 14/17] fix test

---
 dbt/adapters/databricks/connections.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dbt/adapters/databricks/connections.py b/dbt/adapters/databricks/connections.py
index 971a910f7..f118b8eb8 100644
--- a/dbt/adapters/databricks/connections.py
+++ b/dbt/adapters/databricks/connections.py
@@ -713,7 +713,7 @@ def _open(cls, connection: Connection, query_header_context: Any = None) -> Conn
         timeout = creds.connect_timeout
 
         # gotta keep this so we don't prompt users many times
-        cls.credentials_provider = creds.authenticate(cls.credentials_provider)
+        cls.credentials_manager = creds.authenticate()
 
         invocation_env = creds.get_invocation_env()
         user_agent_entry = cls._user_agent

From 20a199e5c696a61ff5ac911d8d7995f58fb839a7 Mon Sep 17 00:00:00 2001
From: Eric Wang <e.wang@databricks.com>
Date: Fri, 31 Jan 2025 08:47:51 -0800
Subject: [PATCH 15/17] ruff fix

---
 dbt/adapters/databricks/api_client.py  |  3 +--
 dbt/adapters/databricks/connections.py |  3 +--
 dbt/adapters/databricks/credentials.py | 23 ++++++++---------------
 tests/unit/test_idle_config.py         |  1 +
 4 files changed, 11 insertions(+), 19 deletions(-)

diff --git a/dbt/adapters/databricks/api_client.py b/dbt/adapters/databricks/api_client.py
index f636970e6..235e5f52a 100644
--- a/dbt/adapters/databricks/api_client.py
+++ b/dbt/adapters/databricks/api_client.py
@@ -13,8 +13,7 @@
 
 from dbt.adapters.databricks import utils
 from dbt.adapters.databricks.__version__ import version
-from dbt.adapters.databricks.credentials import BearerAuth
-from dbt.adapters.databricks.credentials import DatabricksCredentials
+from dbt.adapters.databricks.credentials import BearerAuth, DatabricksCredentials
 from dbt.adapters.databricks.logging import logger
 
 DEFAULT_POLLING_INTERVAL = 10
diff --git a/dbt/adapters/databricks/connections.py b/dbt/adapters/databricks/connections.py
index f118b8eb8..f38b7e4af 100644
--- a/dbt/adapters/databricks/connections.py
+++ b/dbt/adapters/databricks/connections.py
@@ -33,9 +33,8 @@
 from dbt.adapters.databricks.__version__ import version as __version__
 from dbt.adapters.databricks.api_client import DatabricksApiClient
 from dbt.adapters.databricks.credentials import (
-    BearerAuth,
-    DatabricksCredentials,
     DatabricksCredentialManager,
+    DatabricksCredentials,
 )
 from dbt.adapters.databricks.events.connection_events import (
     ConnectionAcquire,
diff --git a/dbt/adapters/databricks/credentials.py b/dbt/adapters/databricks/credentials.py
index 1c897df19..b4244d88e 100644
--- a/dbt/adapters/databricks/credentials.py
+++ b/dbt/adapters/databricks/credentials.py
@@ -1,27 +1,22 @@
 import itertools
 import json
-import os
 import re
 import threading
 from collections.abc import Iterable
-from dataclasses import dataclass
-from dataclasses import field
-from typing import Any, Optional, Callable, Dict, List, cast
+from dataclasses import dataclass, field
+from typing import Any, Callable, Dict, List, Optional, cast
 
 from dbt_common.exceptions import DbtConfigError, DbtValidationError
+from mashumaro import DataClassDictMixin
+from requests import PreparedRequest
+from requests.auth import AuthBase
 
 from databricks.sdk import WorkspaceClient
-from databricks.sdk.core import Config
-from databricks.sdk.core import CredentialsProvider
+from databricks.sdk.core import Config, CredentialsProvider
 from dbt.adapters.contracts.connection import Credentials
 from dbt.adapters.databricks.global_state import GlobalState
 from dbt.adapters.databricks.logging import logger
 
-from mashumaro import DataClassDictMixin
-from requests import PreparedRequest
-from requests.auth import AuthBase
-from dbt.adapters.databricks.logging import logger
-
 CATALOG_KEY_IN_SESSION_PROPERTIES = "databricks.catalog"
 DBT_DATABRICKS_INVOCATION_ENV_REGEX = re.compile("^[A-z0-9\\-]+$")
 EXTRACT_CLUSTER_ID_FROM_HTTP_PATH_REGEX = re.compile(r"/?sql/protocolv1/o/\d+/(.*)")
@@ -154,10 +149,8 @@ def validate_creds(self) -> None:
             self.azure_client_id and not self.azure_client_secret
         ):
             raise DbtConfigError(
-                (
-                    "The config 'azure_client_id' and 'azure_client_secret' "
-                    "must be both present or both absent"
-                )
+                "The config 'azure_client_id' and 'azure_client_secret' "
+                "must be both present or both absent"
             )
 
     @classmethod
diff --git a/tests/unit/test_idle_config.py b/tests/unit/test_idle_config.py
index 22b9072d8..a733c07d5 100644
--- a/tests/unit/test_idle_config.py
+++ b/tests/unit/test_idle_config.py
@@ -1,4 +1,5 @@
 from unittest.mock import patch
+
 import pytest
 from dbt_common.exceptions import DbtRuntimeError
 

From 7a6f8dd790ff2be2a7f300d3e5ba36b6c67687a7 Mon Sep 17 00:00:00 2001
From: Eric Wang <e.wang@databricks.com>
Date: Fri, 31 Jan 2025 16:38:56 -0800
Subject: [PATCH 16/17] lint

---
 dbt/adapters/databricks/constraints.py | 4 ++--
 dbt/adapters/databricks/credentials.py | 8 ++++----
 2 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/dbt/adapters/databricks/constraints.py b/dbt/adapters/databricks/constraints.py
index 5761dacf5..bce44f8b6 100644
--- a/dbt/adapters/databricks/constraints.py
+++ b/dbt/adapters/databricks/constraints.py
@@ -1,5 +1,5 @@
 from abc import ABC, abstractmethod
-from typing import Any, ClassVar, Optional, Type, TypeVar
+from typing import Any, ClassVar, Optional, TypeVar
 
 from dbt_common.contracts.constraints import (
     ColumnLevelConstraint,
@@ -32,7 +32,7 @@ class TypedConstraint(ModelLevelConstraint, ABC):
     str_type: ClassVar[str]
 
     @classmethod
-    def __post_deserialize__(cls: Type[T], obj: T) -> T:
+    def __post_deserialize__(cls: type[T], obj: T) -> T:
         assert obj.type == cls.str_type, "Mismatched constraint type"
         obj._validate()
         return obj
diff --git a/dbt/adapters/databricks/credentials.py b/dbt/adapters/databricks/credentials.py
index b4244d88e..c68d87044 100644
--- a/dbt/adapters/databricks/credentials.py
+++ b/dbt/adapters/databricks/credentials.py
@@ -4,7 +4,7 @@
 import threading
 from collections.abc import Iterable
 from dataclasses import dataclass, field
-from typing import Any, Callable, Dict, List, Optional, cast
+from typing import Any, Callable, Optional, cast
 
 from dbt_common.exceptions import DbtConfigError, DbtValidationError
 from mashumaro import DataClassDictMixin
@@ -261,7 +261,7 @@ def __call__(self, r: PreparedRequest) -> PreparedRequest:
         return r
 
 
-PySQLCredentialProvider = Callable[[], Callable[[], Dict[str, str]]]
+PySQLCredentialProvider = Callable[[], Callable[[], dict[str, str]]]
 
 
 @dataclass
@@ -272,7 +272,7 @@ class DatabricksCredentialManager(DataClassDictMixin):
     azure_client_id: Optional[str] = None
     azure_client_secret: Optional[str] = None
     oauth_redirect_url: str = REDIRECT_URL
-    oauth_scopes: List[str] = field(default_factory=lambda: SCOPES)
+    oauth_scopes: list[str] = field(default_factory=lambda: SCOPES)
     token: Optional[str] = None
     auth_type: Optional[str] = None
 
@@ -390,7 +390,7 @@ def api_client(self) -> WorkspaceClient:
 
     @property
     def credentials_provider(self) -> PySQLCredentialProvider:
-        def inner() -> Callable[[], Dict[str, str]]:
+        def inner() -> Callable[[], dict[str, str]]:
             return self.header_factory
 
         return inner

From 90a90540a1a6454dcfa9d6e7e873aa9b11f395a2 Mon Sep 17 00:00:00 2001
From: Eric Wang <e.wang@databricks.com>
Date: Fri, 31 Jan 2025 16:58:13 -0800
Subject: [PATCH 17/17] address comments

---
 dbt/adapters/databricks/api_client.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dbt/adapters/databricks/api_client.py b/dbt/adapters/databricks/api_client.py
index 235e5f52a..c5d9add62 100644
--- a/dbt/adapters/databricks/api_client.py
+++ b/dbt/adapters/databricks/api_client.py
@@ -556,7 +556,7 @@ def create(
         http_headers = credentials.get_all_http_headers(
             connection_parameters.pop("http_headers", {})
         )
-        header_factory = credentials.authenticate().credentials_provider()  # type: ignore
+        header_factory = credentials.authenticate().credentials_provider()
         session.auth = BearerAuth(header_factory)
 
         session.headers.update({"User-Agent": user_agent, **http_headers})