From 1382600ec8552eb22bc53e242f1afea1ac38ab01 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=D0=9C=D0=B0=D1=80=D1=82=D1=8B=D0=BD=D0=BE=D0=B2=20=D0=9C?=
 =?UTF-8?q?=D0=B0=D0=BA=D1=81=D0=B8=D0=BC=20=D0=A1=D0=B5=D1=80=D0=B3=D0=B5?=
 =?UTF-8?q?=D0=B5=D0=B2=D0=B8=D1=87?= <msmarty5@mts.ru>
Date: Tue, 20 Aug 2024 11:14:06 +0000
Subject: [PATCH 1/2] Fix documentation build

---
 docs/conf.py          | 3 ---
 requirements/docs.txt | 3 ++-
 2 files changed, 2 insertions(+), 4 deletions(-)

diff --git a/docs/conf.py b/docs/conf.py
index f781dddd..867d4daf 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -120,9 +120,6 @@
     {"rel": "icon", "href": "icon.svg", "type": "image/svg+xml"},
 ]
 
-# TODO: remove after https://github.com/mgeier/sphinx-last-updated-by-git/pull/77
-git_exclude_patterns = ["docs/_static/logo_wide.svg"]
-
 # The master toctree document.
 master_doc = "index"
 
diff --git a/requirements/docs.txt b/requirements/docs.txt
index be2cd127..87768350 100644
--- a/requirements/docs.txt
+++ b/requirements/docs.txt
@@ -9,7 +9,8 @@ sphinx<8
 sphinx-copybutton
 sphinx-design
 sphinx-favicon
-sphinx-last-updated-by-git
+# https://github.com/mgeier/sphinx-last-updated-by-git/pull/77
+sphinx-last-updated-by-git>=0.3.8
 # TODO: uncomment after https://github.com/zqmillet/sphinx-plantuml/pull/4
 # sphinx-plantuml
 sphinx-tabs

From 81d86f61214960c31aff33d7f3c75f2570d35427 Mon Sep 17 00:00:00 2001
From: maxim-lixakov <mvliksako1@mts.ru>
Date: Thu, 15 Aug 2024 18:25:48 +0300
Subject: [PATCH 2/2] [DOP-16999] - add jdbc_dialect logging

---
 docs/changelog/next_release/305.feature.rst   |  1 +
 .../jdbc_connection/connection.py             |  2 +
 .../db_connection/jdbc_mixin/connection.py    | 12 ++++++
 .../test_clickhouse_integration.py            | 35 +++++++++++++++++
 .../test_postgres_integration.py              | 38 +++++++++++++++++++
 5 files changed, 88 insertions(+)
 create mode 100644 docs/changelog/next_release/305.feature.rst

diff --git a/docs/changelog/next_release/305.feature.rst b/docs/changelog/next_release/305.feature.rst
new file mode 100644
index 00000000..c4c44dc6
--- /dev/null
+++ b/docs/changelog/next_release/305.feature.rst
@@ -0,0 +1 @@
+Log the detected Spark JDBC dialect at INFO level before running ``sql``, ``fetch``, ``execute`` and ``get_df_schema``, e.g. ``Detected dialect: 'org.apache.spark.sql.jdbc.MySQLDialect'``
diff --git a/onetl/connection/db_connection/jdbc_connection/connection.py b/onetl/connection/db_connection/jdbc_connection/connection.py
index 9d41298e..32c0b65c 100644
--- a/onetl/connection/db_connection/jdbc_connection/connection.py
+++ b/onetl/connection/db_connection/jdbc_connection/connection.py
@@ -90,6 +90,7 @@ def sql(
 
         query = clear_statement(query)
 
+        log.info("|%s| Detected dialect: '%s'", self.__class__.__name__, self.jdbc_dialect)
         log.info("|%s| Executing SQL query (on executor):", self.__class__.__name__)
         log_lines(log, query)
 
@@ -195,6 +196,7 @@ def get_df_schema(
         columns: list[str] | None = None,
         options: JDBCReadOptions | None = None,
     ) -> StructType:
+        log.info("|%s| Detected dialect: '%s'", self.__class__.__name__, self.jdbc_dialect)
         log.info("|%s| Fetching schema of table %r ...", self.__class__.__name__, source)
 
         query = self.dialect.get_sql_query(source, columns=columns, limit=0, compact=True)
diff --git a/onetl/connection/db_connection/jdbc_mixin/connection.py b/onetl/connection/db_connection/jdbc_mixin/connection.py
index 8ec77d13..5d309e58 100644
--- a/onetl/connection/db_connection/jdbc_mixin/connection.py
+++ b/onetl/connection/db_connection/jdbc_mixin/connection.py
@@ -205,6 +205,7 @@ def fetch(
 
         query = clear_statement(query)
 
+        log.info("|%s| Detected dialect: '%s'", self.__class__.__name__, self.jdbc_dialect)
         log.info("|%s| Executing SQL query (on driver):", self.__class__.__name__)
         log_lines(log, query)
 
@@ -277,6 +278,7 @@ def execute(
 
         statement = clear_statement(statement)
 
+        log.info("|%s| Detected dialect: '%s'", self.__class__.__name__, self.jdbc_dialect)
         log.info("|%s| Executing statement (on driver):", self.__class__.__name__)
         log_lines(log, statement)
 
@@ -308,6 +310,16 @@ def execute(
             log_lines(log, str(metrics))
         return df
 
+    @property
+    def jdbc_dialect(self) -> str:
+        """
+        Return the name of the JDBC dialect which Spark's ``JdbcDialects`` resolves for ``self.jdbc_url``.
+        """
+        jdbc_dialects_package = self.spark._jvm.org.apache.spark.sql.jdbc
+        dialect = jdbc_dialects_package.JdbcDialects.get(self.jdbc_url).toString()
+        # keep only the text before the first "$"; a string without "$" is returned unchanged
+        return dialect.partition("$")[0]
+
     @validator("spark")
     def _check_java_class_imported(cls, spark):
         try:
diff --git a/tests/tests_integration/tests_db_connection_integration/test_clickhouse_integration.py b/tests/tests_integration/tests_db_connection_integration/test_clickhouse_integration.py
index 78656d83..1bd2ebf3 100644
--- a/tests/tests_integration/tests_db_connection_integration/test_clickhouse_integration.py
+++ b/tests/tests_integration/tests_db_connection_integration/test_clickhouse_integration.py
@@ -321,3 +321,38 @@ def func_finalizer():
     # wrong syntax
     with pytest.raises(Exception):
         clickhouse.execute(f"CREATE FUNCTION wrong_function AS (a, b) -> {suffix}")
+
+
+def test_clickhouse_connection_no_jdbc_dialect(spark, processing, load_table_data, caplog):
+    """Check that each JDBC call logs ``NoopDialect`` as the detected dialect for Clickhouse."""
+    clickhouse = Clickhouse(
+        host=processing.host,
+        port=processing.port,
+        user=processing.user,
+        password=processing.password,
+        database=processing.database,
+        spark=spark,
+    )
+
+    table = load_table_data.full_name
+    expected = "Detected dialect: 'org.apache.spark.sql.jdbc.NoopDialect'"
+
+    # each call runs inside at_level(): the log level is lowered only while the context is active
+    with caplog.at_level(logging.INFO):
+        clickhouse.get_df_schema(table)
+        assert expected in caplog.text
+
+    caplog.clear()
+    with caplog.at_level(logging.INFO):
+        clickhouse.sql("SELECT version()")
+        assert expected in caplog.text
+
+    caplog.clear()
+    with caplog.at_level(logging.INFO):
+        clickhouse.fetch("SELECT version()")
+        assert expected in caplog.text
+
+    caplog.clear()
+    with caplog.at_level(logging.INFO):
+        clickhouse.execute(f"TRUNCATE TABLE {table}")
+        assert expected in caplog.text
diff --git a/tests/tests_integration/tests_db_connection_integration/test_postgres_integration.py b/tests/tests_integration/tests_db_connection_integration/test_postgres_integration.py
index 6cea95cc..0b05e7f9 100644
--- a/tests/tests_integration/tests_db_connection_integration/test_postgres_integration.py
+++ b/tests/tests_integration/tests_db_connection_integration/test_postgres_integration.py
@@ -1035,3 +1035,41 @@ def test_postgres_connection_execute_with_legacy_jdbc_options(spark, processing)
 
     options = Postgres.JDBCOptions(query_timeout=30)
     postgres.execute("DROP TABLE IF EXISTS temp_table;", options=options)
+
+
+def test_postgres_connection_jdbc_dialect_usage(spark, processing, load_table_data, caplog):
+    """Check that each JDBC call logs ``PostgresDialect`` as the detected dialect for Postgres."""
+    postgres = Postgres(
+        host=processing.host,
+        port=processing.port,
+        user=processing.user,
+        password=processing.password,
+        database=processing.database,
+        spark=spark,
+    )
+
+    table = load_table_data.full_name
+    expected = "Detected dialect: 'org.apache.spark.sql.jdbc.PostgresDialect'"
+
+    # each call runs inside at_level(): the log level is lowered only while the context is active
+    with caplog.at_level(logging.INFO):
+        postgres.get_df_schema(table)
+        assert expected in caplog.text
+
+    # clear the caplog buffer so the next assertion only sees records from sql()
+    caplog.clear()
+    with caplog.at_level(logging.INFO):
+        postgres.sql("SELECT version()")
+        assert expected in caplog.text
+
+    # clear the caplog buffer so the next assertion only sees records from fetch()
+    caplog.clear()
+    with caplog.at_level(logging.INFO):
+        postgres.fetch("SELECT version()")
+        assert expected in caplog.text
+
+    # clear the caplog buffer so the next assertion only sees records from execute()
+    caplog.clear()
+    with caplog.at_level(logging.INFO):
+        postgres.execute(f"TRUNCATE TABLE {table}")
+        assert expected in caplog.text