pandas-dev · mpak123 · Oct 22, 2025 · Oct 22, 2025 · Oct 22, 2025 · Oct 22, 2025
diff --git a/doc/source/whatsnew/v3.0.0.rst b/doc/source/whatsnew/v3.0.0.rst
@@ -156,6 +156,7 @@ All warnings for upcoming changes in pandas will have the base class :class:`pan
 
 Other enhancements
 ^^^^^^^^^^^^^^^^^^
+- :func:`DataFrame.to_sql` now accepts a ``hints`` parameter to pass database-specific query hints for optimizing insert performance. The hints are specified as a dictionary mapping dialect names to hint strings (e.g., ``{'oracle': '/*+ APPEND PARALLEL(4) */', 'mysql': 'DELAYED'}``). Users are responsible for providing correctly formatted hint strings for their target database (:issue:`61370`)
 - :func:`pandas.merge` propagates the ``attrs`` attribute to the result if all
   inputs have identical ``attrs``, as has so far already been the case for
   :func:`pandas.concat`.

diff --git a/pandas/core/generic.py b/pandas/core/generic.py
@@ -2798,6 +2798,7 @@ def to_sql(
         chunksize: int | None = None,
         dtype: DtypeArg | None = None,
         method: Literal["multi"] | Callable | None = None,
+        hints: dict[str, str] | None = None,
     ) -> int | None:
         """
         Write records stored in a DataFrame to a SQL database.
@@ -2861,6 +2862,21 @@ def to_sql(
 
             Details and a sample callable implementation can be found in the
             section :ref:`insert method <io.sql.method>`.
+        hints : dict[str, str], optional
+            Dictionary of SQL hints to optimize insertion performance, keyed by
+            database dialect name (e.g., 'oracle', 'mysql', 'postgresql', 'mssql').
+            Each value should be a complete hint string formatted exactly as required
+            by the target database. The user is responsible for providing correctly
+            formatted hint strings.
+
+            Examples: ``{'oracle': '/*+ APPEND PARALLEL(4) */', 'mysql': 'DELAYED'}``
+
+            .. note::
+                - Hints are database-specific and ignored for unsupported dialects.
+                - SQLite raises a ``UserWarning`` (hints not supported).
+                - ADBC connections raise ``NotImplementedError``.
+
+            .. versionadded:: 3.0.0
 
         Returns
         -------
@@ -3044,6 +3060,7 @@ def to_sql(
             chunksize=chunksize,
             dtype=dtype,
             method=method,
+            hints=hints,
         )
 
     @final

diff --git a/pandas/io/sql.py b/pandas/io/sql.py
@@ -18,7 +18,6 @@
     datetime,
     time,
 )
-from functools import partial
 import re
 from typing import (
     TYPE_CHECKING,
@@ -235,6 +234,18 @@ def _wrap_result_adbc(
     return df
 
 
+def _process_sql_hints(hints: dict[str, str] | None, dialect_name: str) -> str | None:
+    if hints is None:
+        return None
+
+    dialect_name = dialect_name.lower()
+    for key, value in hints.items():
+        if key.lower() == dialect_name:
+            return value
+
+    return None
+
+
 # -----------------------------------------------------------------------------
 # -- Read and write to DataFrames
 
@@ -753,6 +764,7 @@ def to_sql(
     dtype: DtypeArg | None = None,
     method: Literal["multi"] | Callable | None = None,
     engine: str = "auto",
+    hints: dict[str, str] | None = None,
     **engine_kwargs,
 ) -> int | None:
     """
@@ -813,6 +825,23 @@ def to_sql(
 
         .. versionadded:: 1.3.0
 
+    hints : dict[str, str], optional
+        SQL hints to optimize insertion performance, keyed by database dialect name.
+        Each hint should be a complete string formatted exactly as required by the
+        target database. The user is responsible for constructing dialect-specific
+        syntax.
+
+        Examples: ``{'oracle': '/*+ APPEND PARALLEL(4) */'}``
+                  ``{'mysql': 'DELAYED'}``
+                  ``{'mssql': 'WITH (TABLOCK)'}``
+
+        .. note::
+            - Hints are database-specific and will be ignored for unsupported dialects
+            - SQLite will raise a UserWarning (hints not supported)
+            - ADBC connections will raise NotImplementedError
+
+        .. versionadded:: 3.0.0
+
     **engine_kwargs
         Any additional kwargs are passed to the engine.
 
@@ -855,6 +884,7 @@ def to_sql(
             dtype=dtype,
             method=method,
             engine=engine,
+            hints=hints,
             **engine_kwargs,
         )
 
@@ -1004,7 +1034,13 @@ def create(self) -> None:
         else:
             self._execute_create()
 
-    def _execute_insert(self, conn, keys: list[str], data_iter) -> int:
+    def _execute_insert(
+        self,
+        conn,
+        keys: list[str],
+        data_iter,
+        hint_str: str | None = None,
+    ) -> int:
         """
         Execute SQL statement inserting data
 
@@ -1016,11 +1052,23 @@ def _execute_insert(self, conn, keys: list[str], data_iter) -> int:
         data_iter : generator of list
            Each item contains a list of values to be inserted
         """
-        data = [dict(zip(keys, row, strict=True)) for row in data_iter]
-        result = self.pd_sql.execute(self.table.insert(), data)
+        data = [dict(zip(keys, row, strict=False)) for row in data_iter]
+
+        if hint_str:
+            stmt = self.table.insert().prefix_with(hint_str)
+        else:
+            stmt = self.table.insert()
+
+        result = self.pd_sql.execute(stmt, data)
         return result.rowcount
 
-    def _execute_insert_multi(self, conn, keys: list[str], data_iter) -> int:
+    def _execute_insert_multi(
+        self,
+        conn,
+        keys: list[str],
+        data_iter,
+        hint_str: str | None = None,
+    ) -> int:
         """
         Alternative to _execute_insert for DBs support multi-value INSERT.
 
@@ -1029,11 +1077,15 @@ def _execute_insert_multi(self, conn, keys: list[str], data_iter) -> int:
         but performance degrades quickly with increase of columns.
 
         """
-
         from sqlalchemy import insert
 
-        data = [dict(zip(keys, row, strict=True)) for row in data_iter]
-        stmt = insert(self.table).values(data)
+        data = [dict(zip(keys, row, strict=False)) for row in data_iter]
+
+        if hint_str:
+            stmt = insert(self.table).values(data).prefix_with(hint_str)
+        else:
+            stmt = insert(self.table).values(data)
+
         result = self.pd_sql.execute(stmt)
         return result.rowcount
 
@@ -1090,14 +1142,20 @@ def insert(
         self,
         chunksize: int | None = None,
         method: Literal["multi"] | Callable | None = None,
+        hints: dict[str, str] | None = None,
+        dialect_name: str | None = None,
     ) -> int | None:
         # set insert method
         if method is None:
             exec_insert = self._execute_insert
         elif method == "multi":
             exec_insert = self._execute_insert_multi
         elif callable(method):
-            exec_insert = partial(method, self)
+
+            def callable_wrapper(conn, keys, data_iter, hint_str=None):
+                return method(self, conn, keys, data_iter)
+
+            exec_insert = callable_wrapper
         else:
             raise ValueError(f"Invalid parameter `method`: {method}")
 
@@ -1114,6 +1172,9 @@ def insert(
             raise ValueError("chunksize argument should be non-zero")
 
         chunks = (nrows // chunksize) + 1
+
+        hint_str = _process_sql_hints(hints, dialect_name) if dialect_name else None
+
         total_inserted = None
         with self.pd_sql.run_transaction() as conn:
             for i in range(chunks):
@@ -1125,7 +1186,7 @@ def insert(
                 chunk_iter = zip(
                     *(arr[start_i:end_i] for arr in data_list), strict=True
                 )
-                num_inserted = exec_insert(conn, keys, chunk_iter)
+                num_inserted = exec_insert(conn, keys, chunk_iter, hint_str)
                 # GH 46891
                 if num_inserted is not None:
                     if total_inserted is None:
@@ -1509,6 +1570,7 @@ def to_sql(
         chunksize: int | None = None,
         dtype: DtypeArg | None = None,
         method: Literal["multi"] | Callable | None = None,
+        hints: dict[str, str] | None = None,
         engine: str = "auto",
         **engine_kwargs,
     ) -> int | None:
@@ -1545,6 +1607,8 @@ def insert_records(
         schema=None,
         chunksize: int | None = None,
         method=None,
+        hints: dict[str, str] | None = None,
+        dialect_name: str | None = None,
         **engine_kwargs,
     ) -> int | None:
         """
@@ -1569,6 +1633,8 @@ def insert_records(
         schema=None,
         chunksize: int | None = None,
         method=None,
+        hints: dict[str, str] | None = None,
+        dialect_name: str | None = None,
         **engine_kwargs,
     ) -> int | None:
         from sqlalchemy import exc
@@ -1980,6 +2046,7 @@ def to_sql(
         chunksize: int | None = None,
         dtype: DtypeArg | None = None,
         method: Literal["multi"] | Callable | None = None,
+        hints: dict[str, str] | None = None,
         engine: str = "auto",
         **engine_kwargs,
     ) -> int | None:
@@ -2053,6 +2120,8 @@ def to_sql(
             schema=schema,
             chunksize=chunksize,
             method=method,
+            hints=hints,
+            dialect_name=self.con.dialect.name,
             **engine_kwargs,
         )
 
@@ -2344,6 +2413,7 @@ def to_sql(
         chunksize: int | None = None,
         dtype: DtypeArg | None = None,
         method: Literal["multi"] | Callable | None = None,
+        hints: dict[str, str] | None = None,
         engine: str = "auto",
         **engine_kwargs,
     ) -> int | None:
@@ -2394,6 +2464,8 @@ def to_sql(
             raise NotImplementedError(
                 "engine != 'auto' not implemented for ADBC drivers"
             )
+        if hints:
+            raise NotImplementedError("'hints' is not implemented for ADBC drivers")
 
         if schema:
             table_name = f"{schema}.{name}"
@@ -2575,7 +2647,9 @@ def insert_statement(self, *, num_rows: int) -> str:
         )
         return insert_statement
 
-    def _execute_insert(self, conn, keys, data_iter) -> int:
+    def _execute_insert(
+        self, conn, keys: list[str], data_iter, hint_str: str | None = None
+    ) -> int:
         from sqlite3 import Error
 
         data_list = list(data_iter)
@@ -2585,7 +2659,9 @@ def _execute_insert(self, conn, keys, data_iter) -> int:
             raise DatabaseError("Execution failed") from exc
         return conn.rowcount
 
-    def _execute_insert_multi(self, conn, keys, data_iter) -> int:
+    def _execute_insert_multi(
+        self, conn, keys: list[str], data_iter, hint_str: str | None = None
+    ) -> int:
         data_list = list(data_iter)
         flattened_data = [x for row in data_list for x in row]
         conn.execute(self.insert_statement(num_rows=len(data_list)), flattened_data)
@@ -2821,6 +2897,7 @@ def to_sql(
         chunksize: int | None = None,
         dtype: DtypeArg | None = None,
         method: Literal["multi"] | Callable | None = None,
+        hints: dict[str, str] | None = None,
         engine: str = "auto",
         **engine_kwargs,
     ) -> int | None:
@@ -2863,6 +2940,13 @@ def to_sql(
             Details and a sample callable implementation can be found in the
             section :ref:`insert method <io.sql.method>`.
         """
+        if hints:
+            warnings.warn(
+                "SQL hints are not supported for SQLite and will be ignored.",
+                UserWarning,
+                stacklevel=find_stack_level(),
+            )
+
         if dtype:
             if not is_dict_like(dtype):
                 # error: Value expression in dictionary comprehension has incompatible