perf(rows): reduce row_factories overhead

author Daniele Varrazzo <daniele.varrazzo@gmail.com>

Tue, 13 Dec 2022 12:49:23 +0000 (12:49 +0000)

committer Daniele Varrazzo <daniele.varrazzo@gmail.com>

Tue, 13 Dec 2022 13:42:30 +0000 (13:42 +0000)
author Daniele Varrazzo <daniele.varrazzo@gmail.com>
Tue, 13 Dec 2022 12:49:23 +0000 (12:49 +0000)
committer Daniele Varrazzo <daniele.varrazzo@gmail.com>
Tue, 13 Dec 2022 13:42:30 +0000 (13:42 +0000)
diff --git a/docs/news.rst b/docs/news.rst

index 6189d7cba6bbb1c45cbc18f4dd619615e8470966..1ef62e165da80ba890d51124a597fc60401bcb67 100644 (file)
--- a/docs/news.rst
+++ b/docs/news.rst
@@ -14,13 +14,14 @@ Psycopg 3.1.5 (unreleased)
  ^^^^^^^^^^^^^^^^^^^^^^^^^^
  
  - Fix array loading slowness compared to psycopg2 (:ticket:`#359`).
-- Performance around network communication improved (:ticket:`#414`).
+- Improve performance around network communication (:ticket:`#414`).
  - Return `!bytes` instead of `!memoryview` from `pq.Encoding` methods
    (:ticket:`#422`).
  - Fix `Cursor.rownumber` to return `!None` when the result has no row to fetch
    (:ticket:`#437`).
-- Avoid error in pyright caused by aliasing TypeAlias (:ticket:`#439`).
+- Avoid error in Pyright caused by aliasing `!TypeAlias` (:ticket:`#439`).
  - Fix `Copy.set_types()` used with `varchar` and `name` types (:ticket:`#452`).
+- Improve performance using :ref:`row-factories` (:ticket:`#457`).
  
  
  Current release
diff --git a/psycopg/psycopg/rows.py b/psycopg/psycopg/rows.py

index bab954d2ccb7d4cab2c920eaa80d9a024d5fec6c..3bd921577003101d39d24504b01ac8e3730e20e1 100644 (file)
--- a/psycopg/psycopg/rows.py
+++ b/psycopg/psycopg/rows.py
@@ -5,11 +5,12 @@ psycopg row factories
  # Copyright (C) 2021 The Psycopg Team
  
  import functools
-from typing import Any, Callable, Dict, NamedTuple, NoReturn, Sequence, Tuple
-from typing import TYPE_CHECKING, Type, TypeVar
+from typing import Any, Callable, Dict, List, Optional, NamedTuple, NoReturn
+from typing import TYPE_CHECKING, Sequence, Tuple, Type, TypeVar
  from collections import namedtuple
  from typing_extensions import TypeAlias
  
+from . import pq
  from . import errors as e
  from ._compat import Protocol
  from ._encodings import _as_python_identifier
@@ -17,6 +18,10 @@ from ._encodings import _as_python_identifier
  if TYPE_CHECKING:
      from .cursor import BaseCursor, Cursor
      from .cursor_async import AsyncCursor
+    from psycopg.pq.abc import PGresult
+
+TUPLES_OK = pq.ExecStatus.TUPLES_OK
+SINGLE_TUPLE = pq.ExecStatus.SINGLE_TUPLE
  
  T = TypeVar("T", covariant=True)
  
@@ -110,14 +115,13 @@ def dict_row(cursor: "BaseCursor[Any, Any]") -> "RowMaker[DictRow]":
  
      The dictionary keys are taken from the column names of the returned columns.
      """
-    desc = cursor.description
-    if desc is None:
+    names = _get_names(cursor)
+    if names is None:
          return no_result
  
-    titles = [c.name for c in desc]
-
      def dict_row_(values: Sequence[Any]) -> Dict[str, Any]:
-        return dict(zip(titles, values))
+        # https://github.com/python/mypy/issues/2608
+        return dict(zip(names, values))  # type: ignore[arg-type]
  
      return dict_row_
  
@@ -130,20 +134,22 @@ def namedtuple_row(
      The field names are taken from the column names of the returned columns,
      with some mangling to deal with invalid names.
      """
-    desc = cursor.description
-    if desc is None:
+    res = cursor.pgresult
+    if not res:
+        return no_result
+
+    nfields = _get_nfields(res)
+    if nfields is None:
          return no_result
  
-    nt = _make_nt(*(c.name for c in desc))
+    nt = _make_nt(cursor._encoding, *(res.fname(i) for i in range(nfields)))
      return nt._make
  
  
  @functools.lru_cache(512)
-def _make_nt(*key: str) -> Type[NamedTuple]:
-    fields = []
-    for s in key:
-        fields.append(_as_python_identifier(s))
-    return namedtuple("Row", fields)  # type: ignore[return-value]
+def _make_nt(enc: str, *names: bytes) -> Type[NamedTuple]:
+    snames = tuple(_as_python_identifier(n.decode(enc)) for n in names)
+    return namedtuple("Row", snames)  # type: ignore[return-value]
  
  
  def class_row(cls: Type[T]) -> BaseRowFactory[T]:
@@ -156,15 +162,13 @@ def class_row(cls: Type[T]) -> BaseRowFactory[T]:
      :rtype: `!Callable[[Cursor],` `RowMaker`\[~T]]
      """
  
-    def class_row_(cur: "BaseCursor[Any, Any]") -> "RowMaker[T]":
-        desc = cur.description
-        if desc is None:
+    def class_row_(cursor: "BaseCursor[Any, Any]") -> "RowMaker[T]":
+        names = _get_names(cursor)
+        if names is None:
              return no_result
  
-        names = [d.name for d in desc]
-
          def class_row__(values: Sequence[Any]) -> T:
-            return cls(**dict(zip(names, values)))
+            return cls(**dict(zip(names, values)))  # type: ignore[arg-type]
  
          return class_row__
  
@@ -194,15 +198,13 @@ def kwargs_row(func: Callable[..., T]) -> BaseRowFactory[T]:
          returned by the query as keyword arguments.
      """
  
-    def kwargs_row_(cur: "BaseCursor[Any, T]") -> "RowMaker[T]":
-        desc = cur.description
-        if desc is None:
+    def kwargs_row_(cursor: "BaseCursor[Any, T]") -> "RowMaker[T]":
+        names = _get_names(cursor)
+        if names is None:
              return no_result
  
-        names = [d.name for d in desc]
-
          def kwargs_row__(values: Sequence[Any]) -> T:
-            return func(**dict(zip(names, values)))
+            return func(**dict(zip(names, values)))  # type: ignore[arg-type]
  
          return kwargs_row__
  
@@ -217,3 +219,32 @@ def no_result(values: Sequence[Any]) -> NoReturn:
      resulting `!RowMaker` never should.
      """
      raise e.InterfaceError("the cursor doesn't have a result")
+
+
+def _get_names(cursor: "BaseCursor[Any, Any]") -> Optional[List[str]]:
+    res = cursor.pgresult
+    if not res:
+        return None
+
+    nfields = _get_nfields(res)
+    if nfields is None:
+        return None
+
+    enc = cursor._encoding
+    return [
+        res.fname(i).decode(enc) for i in range(nfields)  # type: ignore[union-attr]
+    ]
+
+
+def _get_nfields(res: "PGresult") -> Optional[int]:
+    """
+    Return the number of columns in a result, if it returns tuples else None
+
+    Take into account the special case of results with zero columns.
+    """
+    nfields = res.nfields
+
+    if nfields or res.status == TUPLES_OK or res.status == SINGLE_TUPLE:
+        return nfields
+    else:
+        return None
author	Daniele Varrazzo <daniele.varrazzo@gmail.com>
	Tue, 13 Dec 2022 12:49:23 +0000 (12:49 +0000)
committer	Daniele Varrazzo <daniele.varrazzo@gmail.com>
	Tue, 13 Dec 2022 13:42:30 +0000 (13:42 +0000)
docs/news.rst		patch \| blob \| blame \| history
psycopg/psycopg/rows.py		patch \| blob \| blame \| history