From 4eebf23d3d00a9870b6199d2c8b78a703dca3947 Mon Sep 17 00:00:00 2001
From: JY Tan <jy8230@gmail.com>
Date: Fri, 30 Jan 2026 00:38:40 -0800
Subject: [PATCH 1/2] Commit

---
 .../psycopg/instrumentation.py                |  4 +-
 .../psycopg2/instrumentation.py               |  3 +-
 drift/instrumentation/utils/psycopg_utils.py  | 46 +++++++++++++++++++
 3 files changed, 51 insertions(+), 2 deletions(-)

diff --git a/drift/instrumentation/psycopg/instrumentation.py b/drift/instrumentation/psycopg/instrumentation.py
index f1ede88..bbdcfad 100644
--- a/drift/instrumentation/psycopg/instrumentation.py
+++ b/drift/instrumentation/psycopg/instrumentation.py
@@ -24,7 +24,7 @@
     TuskDriftMode,
 )
 from ..base import InstrumentationBase
-from ..utils.psycopg_utils import deserialize_db_value
+from ..utils.psycopg_utils import deserialize_db_value, restore_row_integer_types
 from ..utils.serialization import serialize_value
 from .mocks import MockConnection, MockCopy
 from .wrappers import TracedCopyWrapper
@@ -1663,6 +1663,7 @@ def _mock_execute_with_data(self, cursor: Any, mock_data: dict[str, Any], is_asy
         mock_rows = actual_data.get("rows", [])
         # Deserialize datetime strings back to datetime objects for consistent Flask serialization
         mock_rows = [deserialize_db_value(row) for row in mock_rows]
+        mock_rows = [restore_row_integer_types(row, description_data) for row in mock_rows]
         cursor._mock_rows = mock_rows  # pyright: ignore[reportAttributeAccessIssue]
         cursor._mock_index = 0  # pyright: ignore[reportAttributeAccessIssue]
 
@@ -1731,6 +1732,7 @@ def _mock_executemany_returning_with_data(self, cursor: Any, mock_data: dict[str
             # Deserialize rows
             mock_rows = result_set.get("rows", [])
             mock_rows = [deserialize_db_value(row) for row in mock_rows]
+            mock_rows = [restore_row_integer_types(row, description_data) for row in mock_rows]
 
             cursor._mock_result_sets.append(  # pyright: ignore[reportAttributeAccessIssue]
                 {
diff --git a/drift/instrumentation/psycopg2/instrumentation.py b/drift/instrumentation/psycopg2/instrumentation.py
index 040a84e..6145e48 100644
--- a/drift/instrumentation/psycopg2/instrumentation.py
+++ b/drift/instrumentation/psycopg2/instrumentation.py
@@ -29,7 +29,7 @@
     TuskDriftMode,
 )
 from ..base import InstrumentationBase
-from ..utils.psycopg_utils import deserialize_db_value
+from ..utils.psycopg_utils import deserialize_db_value, restore_row_integer_types
 from ..utils.serialization import serialize_value
 
 logger = logging.getLogger(__name__)
@@ -890,6 +890,7 @@ def _mock_execute_with_data(self, cursor: Any, mock_data: dict[str, Any]) -> Non
         mock_rows = actual_data.get("rows", [])
         # Deserialize datetime strings back to datetime objects for consistent Flask/Django serialization
         mock_rows = [deserialize_db_value(row) for row in mock_rows]
+        mock_rows = [restore_row_integer_types(row, description_data) for row in mock_rows]
 
         # Check if this is a dict-cursor (like RealDictCursor)
         # First check if cursor has _is_dict_cursor attribute (set by InstrumentedConnection.cursor())
diff --git a/drift/instrumentation/utils/psycopg_utils.py b/drift/instrumentation/utils/psycopg_utils.py
index f3669f0..c700a9d 100644
--- a/drift/instrumentation/utils/psycopg_utils.py
+++ b/drift/instrumentation/utils/psycopg_utils.py
@@ -8,6 +8,17 @@
 from decimal import Decimal
 from typing import Any
 
+# PostgreSQL integer type OIDs
+# These are the type codes for integer columns in PostgreSQL
+# See: https://github.com/postgres/postgres/blob/master/src/include/catalog/pg_type.dat
+POSTGRES_INTEGER_TYPE_CODES = {
+    20,  # BIGINT (int8)
+    21,  # SMALLINT (int2)
+    23,  # INTEGER (int4)
+    26,  # OID
+    28,  # XID
+}
+
 # Try to import psycopg Range type for deserialization support
 try:
     from psycopg.types.range import Range as PsycopgRange  # type: ignore[import-untyped]
@@ -86,3 +97,38 @@ def deserialize_db_value(val: Any) -> Any:
     elif isinstance(val, list):
         return [deserialize_db_value(v) for v in val]
     return val
+
+
+def restore_row_integer_types(row: list[Any], description: list[dict[str, Any]] | None) -> list[Any]:
+    """Restore integer types for database row values using column metadata.
+
+    During the record/replay cycle, integer values are lost due to JSON serialization:
+    - Recording: PostgreSQL INTEGER column → psycopg2 returns int(0) -> JSON stores 0
+    - Replay: CLI parses JSON -> Go float64(0) -> protobuf double -> Python float(0.0)
+
+    This function uses the column type_code from the cursor description to identify
+    which columns should contain integers and converts whole-number floats back to int.
+
+    Args:
+        row: A row of values from the mocked database query.
+        description: Column metadata from the cursor description, containing 'type_code' for each column.
+                    Format: [{"name": "col1", "type_code": 23}, ...]
+
+    Returns:
+        The row with integer types restored for INTEGER columns.
+    """
+    if not description or not row:
+        return row
+
+    result = []
+    for i, value in enumerate(row):
+        if i < len(description):
+            type_code = description[i].get("type_code") if isinstance(description[i], dict) else None
+            # Only convert if this is an INTEGER column and value is a whole-number float
+            if type_code in POSTGRES_INTEGER_TYPE_CODES and isinstance(value, float) and value.is_integer():
+                result.append(int(value))
+            else:
+                result.append(value)
+        else:
+            result.append(value)
+    return result

From f03b3c03365b7b4ed413b880b575329587992327 Mon Sep 17 00:00:00 2001
From: JY Tan <jy8230@gmail.com>
Date: Fri, 30 Jan 2026 00:56:04 -0800
Subject: [PATCH 2/2] Handle dict rows

---
 drift/instrumentation/utils/psycopg_utils.py | 28 +++++++++++++++++---
 1 file changed, 25 insertions(+), 3 deletions(-)

diff --git a/drift/instrumentation/utils/psycopg_utils.py b/drift/instrumentation/utils/psycopg_utils.py
index c700a9d..731996d 100644
--- a/drift/instrumentation/utils/psycopg_utils.py
+++ b/drift/instrumentation/utils/psycopg_utils.py
@@ -99,7 +99,9 @@ def deserialize_db_value(val: Any) -> Any:
     return val
 
 
-def restore_row_integer_types(row: list[Any], description: list[dict[str, Any]] | None) -> list[Any]:
+def restore_row_integer_types(
+    row: list[Any] | dict[str, Any], description: list[dict[str, Any]] | None
+) -> list[Any] | dict[str, Any]:
     """Restore integer types for database row values using column metadata.
 
     During the record/replay cycle, integer values are lost due to JSON serialization:
@@ -110,7 +112,8 @@ def restore_row_integer_types(row: list[Any], description: list[dict[str, Any]]
     which columns should contain integers and converts whole-number floats back to int.
 
     Args:
-        row: A row of values from the mocked database query.
+        row: A row of values from the mocked database query. Can be a list (standard cursor)
+             or dict (dict cursor like RealDictCursor).
         description: Column metadata from the cursor description, containing 'type_code' for each column.
                     Format: [{"name": "col1", "type_code": 23}, ...]
 
@@ -120,11 +123,30 @@ def restore_row_integer_types(row: list[Any], description: list[dict[str, Any]]
     if not description or not row:
         return row
 
+    # Handle dict rows (from dict cursors like RealDictCursor)
+    if isinstance(row, dict):
+        # Build a mapping of column names to type codes
+        type_code_by_name = {}
+        for col in description:
+            if isinstance(col, dict):
+                col_name = col.get("name")
+                if col_name:
+                    type_code_by_name[col_name] = col.get("type_code")
+
+        result = {}
+        for key, value in row.items():
+            type_code = type_code_by_name.get(key)
+            if type_code in POSTGRES_INTEGER_TYPE_CODES and isinstance(value, float) and value.is_integer():
+                result[key] = int(value)
+            else:
+                result[key] = value
+        return result
+
+    # Handle list/tuple rows (standard cursors)
     result = []
     for i, value in enumerate(row):
         if i < len(description):
             type_code = description[i].get("type_code") if isinstance(description[i], dict) else None
-            # Only convert if this is an INTEGER column and value is a whole-number float
             if type_code in POSTGRES_INTEGER_TYPE_CODES and isinstance(value, float) and value.is_integer():
                 result.append(int(value))
             else: