Improve compiled extension perf tests

author Federico Caselli <cfederico87@gmail.com>

Thu, 23 Nov 2023 20:58:40 +0000 (21:58 +0100)

committer Federico Caselli <cfederico87@gmail.com>

Wed, 27 Mar 2024 20:12:07 +0000 (21:12 +0100)
author Federico Caselli <cfederico87@gmail.com>
Thu, 23 Nov 2023 20:58:40 +0000 (21:58 +0100)
committer Federico Caselli <cfederico87@gmail.com>
Wed, 27 Mar 2024 20:12:07 +0000 (21:12 +0100)
diff --git a/test/perf/compiled_extensions.py b/test/perf/compiled_extensions.py

deleted file mode 100644 (file)

index 682496a..0000000
--- a/test/perf/compiled_extensions.py
+++ /dev/null
@@ -1,1297 +0,0 @@
-from collections import defaultdict
-from decimal import Decimal
-import re
-from secrets import token_urlsafe
-from textwrap import wrap
-from timeit import timeit
-from types import MappingProxyType
-
-from sqlalchemy import bindparam
-from sqlalchemy import column
-from sqlalchemy.util.langhelpers import load_uncompiled_module
-
-
-def test_case(fn=None, *, number=None):
-    def wrap(fn):
-        fn.__test_case__ = True
-        if number is not None:
-            fn.__number__ = number
-        return fn
-
-    if fn is None:
-        return wrap
-    else:
-        return wrap(fn)
-
-
-class Case:
-    """Base test case. Mark test cases with ``test_case``"""
-
-    IMPLEMENTATIONS = {}
-    "Keys are the impl name, values are callable to load it"
-    NUMBER = 1_000_000
-
-    _CASES = []
-
-    def __init__(self, impl):
-        self.impl = impl
-        self.init_objects()
-
-    def __init_subclass__(cls):
-        if not cls.__name__.startswith("_"):
-            Case._CASES.append(cls)
-
-    def init_objects(self):
-        pass
-
-    @classmethod
-    def _load(cls, fn):
-        try:
-            return fn()
-        except Exception as e:
-            print(f"Error loading {fn}: {e!r}")
-
-    @classmethod
-    def import_object(cls):
-        impl = []
-        for name, fn in cls.IMPLEMENTATIONS.items():
-            obj = cls._load(fn)
-            if obj:
-                impl.append((name, obj))
-        return impl
-
-    @classmethod
-    def _divide_results(cls, results, num, div, name):
-        "utility method to create ratios of two implementation"
-        if div in results and num in results:
-            results[name] = {
-                m: results[num][m] / results[div][m] for m in results[div]
-            }
-
-    @classmethod
-    def update_results(cls, results):
-        pass
-
-    @classmethod
-    def run_case(cls, factor, filter_):
-        objects = cls.import_object()
-        number = max(1, int(cls.NUMBER * factor))
-
-        stack = [c for c in cls.mro() if c not in {object, Case}]
-        methods = []
-        while stack:
-            curr = stack.pop(0)
-            # dict keeps the definition order, dir is instead sorted
-            methods += [
-                m
-                for m, fn in curr.__dict__.items()
-                if hasattr(fn, "__test_case__")
-            ]
-
-        if filter_:
-            methods = [m for m in methods if re.search(filter_, m)]
-
-        results = defaultdict(dict)
-        for name, impl in objects:
-            print(f"Running {name:<10} ", end="", flush=True)
-            impl_case = cls(impl)
-            fails = []
-            for m in methods:
-                call = getattr(impl_case, m)
-                try:
-                    t_num = number
-                    fn_num = getattr(call, "__number__", None)
-                    if fn_num is not None:
-                        t_num = max(1, int(fn_num * factor))
-                    value = timeit(call, number=t_num)
-                    print(".", end="", flush=True)
-                except Exception as e:
-                    fails.append(f"{name}::{m} error: {e}")
-                    print("x", end="", flush=True)
-                    value = float("nan")
-
-                results[name][m] = value
-            print(" Done")
-            for f in fails:
-                print("\t", f)
-
-        cls.update_results(results)
-        return results
-
-
-class ImmutableDict(Case):
-    @staticmethod
-    def python():
-        from sqlalchemy.util import _immutabledict_cy
-
-        py_immutabledict = load_uncompiled_module(_immutabledict_cy)
-        assert not py_immutabledict._is_compiled()
-        return py_immutabledict.immutabledict
-
-    @staticmethod
-    def c():
-        from sqlalchemy.cimmutabledict import immutabledict
-
-        return immutabledict
-
-    @staticmethod
-    def cython():
-        from sqlalchemy.util import _immutabledict_cy
-
-        assert _immutabledict_cy._is_compiled()
-        return _immutabledict_cy.immutabledict
-
-    IMPLEMENTATIONS = {
-        "python": python.__func__,
-        "c": c.__func__,
-        "cython": cython.__func__,
-    }
-
-    def init_objects(self):
-        self.small = {"a": 5, "b": 4}
-        self.large = {f"k{i}": f"v{i}" for i in range(50)}
-        self.d1 = self.impl({"x": 5, "y": 4})
-        self.d2 = self.impl({f"key{i}": f"value{i}" for i in range(50)})
-
-    @classmethod
-    def update_results(cls, results):
-        cls._divide_results(results, "c", "python", "c / py")
-        cls._divide_results(results, "cython", "python", "cy / py")
-        cls._divide_results(results, "cython", "c", "cy / c")
-
-    @test_case
-    def init_empty(self):
-        self.impl()
-
-    @test_case
-    def init(self):
-        self.impl(self.small)
-
-    @test_case
-    def init_large(self):
-        self.impl(self.large)
-
-    @test_case
-    def len(self):
-        len(self.d1) + len(self.d2)
-
-    @test_case
-    def getitem(self):
-        self.d1["x"]
-        self.d2["key42"]
-
-    @test_case
-    def union(self):
-        self.d1.union(self.small)
-        self.d1.union(self.small.items())
-
-    @test_case
-    def union_large(self):
-        self.d2.union(self.large)
-
-    @test_case
-    def merge_with(self):
-        self.d1.merge_with(self.small)
-        self.d1.merge_with(self.small.items())
-
-    @test_case
-    def merge_with_large(self):
-        self.d2.merge_with(self.large)
-
-    @test_case
-    def get(self):
-        self.d1.get("x")
-        self.d2.get("key42")
-
-    @test_case
-    def get_miss(self):
-        self.d1.get("xxx")
-        self.d2.get("xxx")
-
-    @test_case
-    def keys(self):
-        self.d1.keys()
-        self.d2.keys()
-
-    @test_case
-    def items(self):
-        self.d1.items()
-        self.d2.items()
-
-    @test_case
-    def values(self):
-        self.d1.values()
-        self.d2.values()
-
-    @test_case
-    def iter(self):
-        list(self.d1)
-        list(self.d2)
-
-    @test_case
-    def in_case(self):
-        "x" in self.d1
-        "key42" in self.d1
-
-    @test_case
-    def in_miss(self):
-        "xx" in self.d1
-        "xx" in self.d1
-
-    @test_case
-    def eq(self):
-        self.d1 == self.d1
-        self.d2 == self.d2
-
-    @test_case
-    def eq_dict(self):
-        self.d1 == dict(self.d1)
-        self.d2 == dict(self.d2)
-
-    @test_case
-    def eq_other(self):
-        self.d1 == self.d2
-        self.d1 == "foo"
-
-    @test_case
-    def ne(self):
-        self.d1 != self.d1
-        self.d2 != self.d2
-
-    @test_case
-    def ne_dict(self):
-        self.d1 != dict(self.d1)
-        self.d2 != dict(self.d2)
-
-    @test_case
-    def ne_other(self):
-        self.d1 != self.d2
-        self.d1 != "foo"
-
-
-class Processors(Case):
-    @staticmethod
-    def python():
-        from sqlalchemy.engine import _processors_cy
-
-        py_processors = load_uncompiled_module(_processors_cy)
-        assert not py_processors._is_compiled()
-        return py_processors
-
-    @staticmethod
-    def c():
-        from sqlalchemy import cprocessors as mod
-
-        mod.to_decimal_processor_factory = (
-            lambda t, s: mod.DecimalResultProcessor(t, "%%.%df" % s).process
-        )
-
-        return mod
-
-    @staticmethod
-    def cython():
-        from sqlalchemy.engine import _processors_cy
-
-        assert _processors_cy._is_compiled()
-        return _processors_cy
-
-    IMPLEMENTATIONS = {
-        "python": python.__func__,
-        "c": c.__func__,
-        "cython": cython.__func__,
-    }
-    NUMBER = 500_000
-
-    def init_objects(self):
-        self.to_dec = self.impl.to_decimal_processor_factory(Decimal, 3)
-
-    @classmethod
-    def update_results(cls, results):
-        cls._divide_results(results, "c", "python", "c / py")
-        cls._divide_results(results, "cython", "python", "cy / py")
-        cls._divide_results(results, "cython", "c", "cy / c")
-
-    @test_case
-    def int_to_boolean(self):
-        self.impl.int_to_boolean(None)
-        self.impl.int_to_boolean(10)
-        self.impl.int_to_boolean(1)
-        self.impl.int_to_boolean(-10)
-        self.impl.int_to_boolean(0)
-
-    @test_case
-    def to_str(self):
-        self.impl.to_str(None)
-        self.impl.to_str(123)
-        self.impl.to_str(True)
-        self.impl.to_str(self)
-        self.impl.to_str("self")
-
-    @test_case
-    def to_float(self):
-        self.impl.to_float(None)
-        self.impl.to_float(123)
-        self.impl.to_float(True)
-        self.impl.to_float(42)
-        self.impl.to_float(0)
-        self.impl.to_float(42.0)
-        self.impl.to_float("nan")
-        self.impl.to_float("42")
-        self.impl.to_float("42.0")
-
-    @test_case
-    def str_to_datetime(self):
-        self.impl.str_to_datetime(None)
-        self.impl.str_to_datetime("2020-01-01 20:10:34")
-        self.impl.str_to_datetime("2030-11-21 01:04:34.123456")
-
-    @test_case
-    def str_to_time(self):
-        self.impl.str_to_time(None)
-        self.impl.str_to_time("20:10:34")
-        self.impl.str_to_time("01:04:34.123456")
-
-    @test_case
-    def str_to_date(self):
-        self.impl.str_to_date(None)
-        self.impl.str_to_date("2020-01-01")
-
-    @test_case
-    def to_decimal_call(self):
-        assert self.to_dec(None) is None
-        self.to_dec(123.44)
-        self.to_dec(99)
-        self.to_dec(1 / 3)
-
-    @test_case
-    def to_decimal_pf_make(self):
-        self.impl.to_decimal_processor_factory(Decimal, 3)
-        self.impl.to_decimal_processor_factory(Decimal, 7)
-
-
-class DistillParam(Case):
-    NUMBER = 2_000_000
-
-    @staticmethod
-    def python():
-        from sqlalchemy.engine import _util_cy
-
-        py_util = load_uncompiled_module(_util_cy)
-        assert not py_util._is_compiled()
-        return py_util
-
-    @staticmethod
-    def cython():
-        from sqlalchemy.engine import _util_cy
-
-        assert _util_cy._is_compiled()
-        return _util_cy
-
-    IMPLEMENTATIONS = {
-        "python": python.__func__,
-        "cython": cython.__func__,
-    }
-
-    def init_objects(self):
-        self.tup_tup = tuple(tuple(range(10)) for _ in range(100))
-        self.list_tup = list(self.tup_tup)
-        self.dict = {f"c{i}": i for i in range(100)}
-        self.mapping = MappingProxyType(self.dict)
-        self.tup_dic = (self.dict, self.dict)
-        self.list_dic = [self.dict, self.dict]
-
-    @classmethod
-    def update_results(cls, results):
-        cls._divide_results(results, "c", "python", "c / py")
-        cls._divide_results(results, "cython", "python", "cy / py")
-        cls._divide_results(results, "cython", "c", "cy / c")
-
-    @test_case
-    def none_20(self):
-        self.impl._distill_params_20(None)
-
-    @test_case
-    def empty_sequence_20(self):
-        self.impl._distill_params_20(())
-        self.impl._distill_params_20([])
-
-    @test_case
-    def list_20(self):
-        self.impl._distill_params_20(self.list_tup)
-
-    @test_case
-    def tuple_20(self):
-        self.impl._distill_params_20(self.tup_tup)
-
-    @test_case
-    def list_dict_20(self):
-        self.impl._distill_params_20(self.list_tup)
-
-    @test_case
-    def tuple_dict_20(self):
-        self.impl._distill_params_20(self.dict)
-
-    @test_case
-    def mapping_20(self):
-        self.impl._distill_params_20(self.mapping)
-
-    @test_case
-    def raw_none(self):
-        self.impl._distill_raw_params(None)
-
-    @test_case
-    def raw_empty_sequence(self):
-        self.impl._distill_raw_params(())
-        self.impl._distill_raw_params([])
-
-    @test_case
-    def raw_list(self):
-        self.impl._distill_raw_params(self.list_tup)
-
-    @test_case
-    def raw_tuple(self):
-        self.impl._distill_raw_params(self.tup_tup)
-
-    @test_case
-    def raw_list_dict(self):
-        self.impl._distill_raw_params(self.list_tup)
-
-    @test_case
-    def raw_tuple_dict(self):
-        self.impl._distill_raw_params(self.dict)
-
-    @test_case
-    def raw_mapping(self):
-        self.impl._distill_raw_params(self.mapping)
-
-
-class IdentitySet(Case):
-    @staticmethod
-    def set_fn():
-        return set
-
-    @staticmethod
-    def python():
-        from sqlalchemy.util import _collections_cy
-
-        py_coll = load_uncompiled_module(_collections_cy)
-        assert not py_coll._is_compiled()
-        return py_coll.IdentitySet
-
-    @staticmethod
-    def cython():
-        from sqlalchemy.util import _collections_cy
-
-        assert _collections_cy._is_compiled()
-        return _collections_cy.IdentitySet
-
-    IMPLEMENTATIONS = {
-        "set": set_fn.__func__,
-        "python": python.__func__,
-        "cython": cython.__func__,
-    }
-    NUMBER = 10
-
-    def init_objects(self):
-        self.val1 = list(range(10))
-        self.val2 = list(wrap(token_urlsafe(4 * 2048), 4))
-        self.imp_1 = self.impl(self.val1)
-        self.imp_2 = self.impl(self.val2)
-
-    @classmethod
-    def update_results(cls, results):
-        cls._divide_results(results, "python", "set", "py / set")
-        cls._divide_results(results, "cython", "python", "cy / py")
-        cls._divide_results(results, "cython", "set", "cy / set")
-
-    @test_case(number=2_500_000)
-    def init_empty(self):
-        self.impl()
-
-    @test_case(number=2_500)
-    def init(self):
-        self.impl(self.val1)
-        self.impl(self.val2)
-
-    @test_case(number=5_000)
-    def init_from_impl(self):
-        self.impl(self.imp_2)
-
-    @test_case(number=100)
-    def add(self):
-        ii = self.impl()
-        x = 25_000
-        for i in range(x):
-            ii.add(str(i % (x / 2)))
-
-    @test_case
-    def contains(self):
-        ii = self.impl(self.val2)
-        for _ in range(1_000):
-            for x in self.val1 + self.val2:
-                x in ii
-
-    @test_case(number=200)
-    def remove(self):
-        v = [str(i) for i in range(7500)]
-        ii = self.impl(v)
-        for x in v[:5000]:
-            ii.remove(x)
-
-    @test_case(number=200)
-    def discard(self):
-        v = [str(i) for i in range(7500)]
-        ii = self.impl(v)
-        for x in v[:5000]:
-            ii.discard(x)
-
-    @test_case
-    def pop(self):
-        for x in range(50_000):
-            ii = self.impl(self.val1)
-            for x in self.val1:
-                ii.pop()
-
-    @test_case
-    def clear(self):
-        i, v = self.impl, self.val1
-        for _ in range(125_000):
-            ii = i(v)
-            ii.clear()
-
-    @test_case(number=2_500_000)
-    def eq(self):
-        self.imp_1 == self.imp_1
-        self.imp_1 == self.imp_2
-        self.imp_1 == self.val2
-
-    @test_case(number=2_500_000)
-    def ne(self):
-        self.imp_1 != self.imp_1
-        self.imp_1 != self.imp_2
-        self.imp_1 != self.val2
-
-    @test_case(number=20_000)
-    def issubset(self):
-        self.imp_1.issubset(self.imp_1)
-        self.imp_1.issubset(self.imp_2)
-        self.imp_1.issubset(self.val1)
-        self.imp_1.issubset(self.val2)
-
-    @test_case(number=50_000)
-    def le(self):
-        self.imp_1 <= self.imp_1
-        self.imp_1 <= self.imp_2
-        self.imp_2 <= self.imp_1
-        self.imp_2 <= self.imp_2
-
-    @test_case(number=2_500_000)
-    def lt(self):
-        self.imp_1 < self.imp_1
-        self.imp_1 < self.imp_2
-        self.imp_2 < self.imp_1
-        self.imp_2 < self.imp_2
-
-    @test_case(number=20_000)
-    def issuperset(self):
-        self.imp_1.issuperset(self.imp_1)
-        self.imp_1.issuperset(self.imp_2)
-        self.imp_1.issubset(self.val1)
-        self.imp_1.issubset(self.val2)
-
-    @test_case(number=50_000)
-    def ge(self):
-        self.imp_1 >= self.imp_1
-        self.imp_1 >= self.imp_2
-        self.imp_2 >= self.imp_1
-        self.imp_2 >= self.imp_2
-
-    @test_case(number=2_500_000)
-    def gt(self):
-        self.imp_1 > self.imp_1
-        self.imp_2 > self.imp_2
-        self.imp_2 > self.imp_1
-        self.imp_2 > self.imp_2
-
-    @test_case(number=10_000)
-    def union(self):
-        self.imp_1.union(self.imp_2)
-
-    @test_case(number=10_000)
-    def or_test(self):
-        self.imp_1 | self.imp_2
-
-    @test_case
-    def update(self):
-        ii = self.impl(self.val1)
-        for _ in range(1_000):
-            ii.update(self.imp_2)
-
-    @test_case
-    def ior(self):
-        ii = self.impl(self.val1)
-        for _ in range(1_000):
-            ii |= self.imp_2
-
-    @test_case
-    def difference(self):
-        for _ in range(2_500):
-            self.imp_1.difference(self.imp_2)
-            self.imp_1.difference(self.val2)
-
-    @test_case(number=250_000)
-    def sub(self):
-        self.imp_1 - self.imp_2
-
-    @test_case
-    def difference_update(self):
-        ii = self.impl(self.val1)
-        for _ in range(2_500):
-            ii.difference_update(self.imp_2)
-            ii.difference_update(self.val2)
-
-    @test_case
-    def isub(self):
-        ii = self.impl(self.val1)
-        for _ in range(250_000):
-            ii -= self.imp_2
-
-    @test_case(number=20_000)
-    def intersection(self):
-        self.imp_1.intersection(self.imp_2)
-        self.imp_1.intersection(self.val2)
-
-    @test_case(number=250_000)
-    def and_test(self):
-        self.imp_1 & self.imp_2
-
-    @test_case
-    def intersection_up(self):
-        ii = self.impl(self.val1)
-        for _ in range(2_500):
-            ii.intersection_update(self.imp_2)
-            ii.intersection_update(self.val2)
-
-    @test_case
-    def iand(self):
-        ii = self.impl(self.val1)
-        for _ in range(250_000):
-            ii &= self.imp_2
-
-    @test_case(number=2_500)
-    def symmetric_diff(self):
-        self.imp_1.symmetric_difference(self.imp_2)
-        self.imp_1.symmetric_difference(self.val2)
-
-    @test_case(number=2_500)
-    def xor(self):
-        self.imp_1 ^ self.imp_2
-
-    @test_case
-    def symmetric_diff_up(self):
-        ii = self.impl(self.val1)
-        for _ in range(125):
-            ii.symmetric_difference_update(self.imp_2)
-            ii.symmetric_difference_update(self.val2)
-
-    @test_case
-    def ixor(self):
-        ii = self.impl(self.val1)
-        for _ in range(250):
-            ii ^= self.imp_2
-
-    @test_case(number=25_000)
-    def copy(self):
-        self.imp_1.copy()
-        self.imp_2.copy()
-
-    @test_case(number=2_500_000)
-    def len(self):
-        len(self.imp_1)
-        len(self.imp_2)
-
-    @test_case(number=25_000)
-    def iter(self):
-        list(self.imp_1)
-        list(self.imp_2)
-
-    @test_case(number=10_000)
-    def repr(self):
-        str(self.imp_1)
-        str(self.imp_2)
-
-
-class OrderedSet(IdentitySet):
-    @staticmethod
-    def set_fn():
-        return set
-
-    @staticmethod
-    def python():
-        from sqlalchemy.util import _collections_cy
-
-        py_coll = load_uncompiled_module(_collections_cy)
-        assert not py_coll._is_compiled()
-        return py_coll.OrderedSet
-
-    @staticmethod
-    def cython():
-        from sqlalchemy.util import _collections_cy
-
-        assert _collections_cy._is_compiled()
-        return _collections_cy.OrderedSet
-
-    @staticmethod
-    def ordered_lib():
-        from orderedset import OrderedSet
-
-        return OrderedSet
-
-    IMPLEMENTATIONS = {
-        "set": set_fn.__func__,
-        "python": python.__func__,
-        "cython": cython.__func__,
-        "ordsetlib": ordered_lib.__func__,
-    }
-
-    @classmethod
-    def update_results(cls, results):
-        super().update_results(results)
-        cls._divide_results(results, "ordsetlib", "set", "ordlib/set")
-        cls._divide_results(results, "cython", "ordsetlib", "cy / ordlib")
-
-    @test_case
-    def add_op(self):
-        ii = self.impl(self.val1)
-        v2 = self.impl(self.val2)
-        for _ in range(500):
-            ii + v2
-
-    @test_case
-    def getitem(self):
-        ii = self.impl(self.val1)
-        for _ in range(250_000):
-            for i in range(len(self.val1)):
-                ii[i]
-
-    @test_case
-    def insert(self):
-        for _ in range(5):
-            ii = self.impl(self.val1)
-            for i in range(5_000):
-                ii.insert(i // 2, i)
-                ii.insert(-i % 2, i)
-
-
-class UniqueList(Case):
-    @staticmethod
-    def python():
-        from sqlalchemy.util import _collections_cy
-
-        py_coll = load_uncompiled_module(_collections_cy)
-        assert not py_coll._is_compiled()
-        return py_coll.unique_list
-
-    @staticmethod
-    def cython():
-        from sqlalchemy.util import _collections_cy
-
-        assert _collections_cy._is_compiled()
-        return _collections_cy.unique_list
-
-    IMPLEMENTATIONS = {
-        "python": python.__func__,
-        "cython": cython.__func__,
-    }
-
-    @classmethod
-    def update_results(cls, results):
-        cls._divide_results(results, "cython", "python", "cy / py")
-
-    def init_objects(self):
-        self.int_small = list(range(10))
-        self.int_vlarge = list(range(25_000)) * 2
-        d = wrap(token_urlsafe(100 * 2048), 4)
-        assert len(d) > 50_000
-        self.vlarge = d[:50_000]
-        self.large = d[:500]
-        self.small = d[:15]
-
-    @test_case
-    def small_str(self):
-        self.impl(self.small)
-
-    @test_case(number=50_000)
-    def large_str(self):
-        self.impl(self.large)
-
-    @test_case(number=250)
-    def vlarge_str(self):
-        self.impl(self.vlarge)
-
-    @test_case
-    def small_range(self):
-        self.impl(range(10))
-
-    @test_case
-    def small_int(self):
-        self.impl(self.int_small)
-
-    @test_case(number=25_000)
-    def large_int(self):
-        self.impl([1, 1, 1, 2, 3] * 100)
-        self.impl(range(1000))
-
-    @test_case(number=250)
-    def vlarge_int(self):
-        self.impl(self.int_vlarge)
-
-
-class TupleGetter(Case):
-    NUMBER = 2_000_000
-
-    @staticmethod
-    def python():
-        from sqlalchemy.engine import _util_cy
-
-        py_util = load_uncompiled_module(_util_cy)
-        assert not py_util._is_compiled()
-        return py_util.tuplegetter
-
-    @staticmethod
-    def c():
-        from sqlalchemy import cresultproxy
-
-        return cresultproxy.tuplegetter
-
-    @staticmethod
-    def cython():
-        from sqlalchemy.engine import _util_cy
-
-        assert _util_cy._is_compiled()
-        return _util_cy.tuplegetter
-
-    IMPLEMENTATIONS = {
-        "python": python.__func__,
-        "c": c.__func__,
-        "cython": cython.__func__,
-    }
-
-    def init_objects(self):
-        self.impl_tg = self.impl
-
-        self.tuple = tuple(range(1000))
-        self.tg_inst = self.impl_tg(42)
-        self.tg_inst_m = self.impl_tg(42, 420, 99, 9, 1)
-        self.tg_inst_seq = self.impl_tg(*range(70, 75))
-
-    @classmethod
-    def update_results(cls, results):
-        cls._divide_results(results, "c", "python", "c / py")
-        cls._divide_results(results, "cython", "python", "cy / py")
-        cls._divide_results(results, "cython", "c", "cy / c")
-
-    @test_case
-    def tuplegetter_one(self):
-        self.tg_inst(self.tuple)
-
-    @test_case
-    def tuplegetter_many(self):
-        self.tg_inst_m(self.tuple)
-
-    @test_case
-    def tuplegetter_seq(self):
-        self.tg_inst_seq(self.tuple)
-
-    @test_case
-    def tuplegetter_new_one(self):
-        self.impl_tg(42)(self.tuple)
-
-    @test_case
-    def tuplegetter_new_many(self):
-        self.impl_tg(42, 420, 99, 9, 1)(self.tuple)
-
-    @test_case
-    def tuplegetter_new_seq(self):
-        self.impl_tg(40, 41, 42, 43, 44)(self.tuple)
-
-
-class BaseRow(Case):
-    @staticmethod
-    def python():
-        from sqlalchemy.engine import _row_cy
-
-        py_res = load_uncompiled_module(_row_cy)
-        assert not py_res._is_compiled()
-        return py_res.BaseRow
-
-    @staticmethod
-    def c():
-        from sqlalchemy.cresultproxy import BaseRow
-
-        return BaseRow
-
-    @staticmethod
-    def cython():
-        from sqlalchemy.engine import _row_cy
-
-        assert _row_cy._is_compiled()
-        return _row_cy.BaseRow
-
-    IMPLEMENTATIONS = {
-        "python": python.__func__,
-        # "c": c.__func__,
-        "cython": cython.__func__,
-    }
-
-    def init_objects(self):
-        from sqlalchemy.engine.result import SimpleResultMetaData
-        from string import ascii_letters
-
-        self.parent = SimpleResultMetaData(("a", "b", "c"))
-        self.row_args = (
-            self.parent,
-            self.parent._processors,
-            self.parent._key_to_index,
-            (1, 2, 3),
-        )
-        self.parent_long = SimpleResultMetaData(tuple(ascii_letters))
-        self.row_long_args = (
-            self.parent_long,
-            self.parent_long._processors,
-            self.parent_long._key_to_index,
-            tuple(range(len(ascii_letters))),
-        )
-        self.row = self.impl(*self.row_args)
-        self.row_long = self.impl(*self.row_long_args)
-        assert isinstance(self.row, self.impl), type(self.row)
-
-        class Row(self.impl):
-            pass
-
-        self.Row = Row
-        self.row_sub = Row(*self.row_args)
-
-        self.row_state = self.row.__getstate__()
-        self.row_long_state = self.row_long.__getstate__()
-
-        assert len(ascii_letters) == 52
-        _proc = [None, int, float, None, str] * 10
-        _proc += [int, float]
-        self.parent_proc = SimpleResultMetaData(
-            tuple(ascii_letters),
-            _processors=_proc,
-        )
-        self.row_proc_args = (
-            self.parent_proc,
-            self.parent_proc._processors,
-            self.parent_proc._key_to_index,
-            tuple(range(len(ascii_letters))),
-        )
-
-        self.parent_proc_none = SimpleResultMetaData(
-            tuple(ascii_letters), _processors=[None] * 52
-        )
-        self.row_proc_none_args = (
-            self.parent_proc_none,
-            # NOTE: usually the code calls _effective_processors that returns
-            # None for this case of all None.
-            self.parent_proc_none._processors,
-            self.parent_proc_none._key_to_index,
-            tuple(range(len(ascii_letters))),
-        )
-
-    @classmethod
-    def update_results(cls, results):
-        cls._divide_results(results, "c", "python", "c / py")
-        cls._divide_results(results, "cython", "python", "cy / py")
-        cls._divide_results(results, "cython", "c", "cy / c")
-
-    @test_case
-    def base_row_new(self):
-        self.impl(*self.row_args)
-        self.impl(*self.row_long_args)
-
-    @test_case
-    def row_new(self):
-        self.Row(*self.row_args)
-        self.Row(*self.row_long_args)
-
-    @test_case
-    def base_row_new_proc(self):
-        self.impl(*self.row_proc_args)
-
-    @test_case
-    def row_new_proc(self):
-        self.Row(*self.row_proc_args)
-
-    @test_case
-    def brow_new_proc_none(self):
-        self.impl(*self.row_proc_none_args)
-
-    @test_case
-    def row_new_proc_none(self):
-        self.Row(*self.row_proc_none_args)
-
-    @test_case
-    def row_dumps(self):
-        self.row.__getstate__()
-        self.row_long.__getstate__()
-
-    @test_case
-    def row_loads(self):
-        self.impl.__new__(self.impl).__setstate__(self.row_state)
-        self.impl.__new__(self.impl).__setstate__(self.row_long_state)
-
-    @test_case
-    def row_values_impl(self):
-        self.row._values_impl()
-        self.row_long._values_impl()
-
-    @test_case
-    def row_iter(self):
-        list(self.row)
-        list(self.row_long)
-
-    @test_case
-    def row_len(self):
-        len(self.row)
-        len(self.row_long)
-
-    @test_case
-    def row_hash(self):
-        hash(self.row)
-        hash(self.row_long)
-
-    @test_case
-    def getitem(self):
-        self.row[0]
-        self.row[1]
-        self.row[-1]
-        self.row_long[0]
-        self.row_long[1]
-        self.row_long[-1]
-
-    @test_case
-    def getitem_slice(self):
-        self.row[0:1]
-        self.row[1:-1]
-        self.row_long[0:1]
-        self.row_long[1:-1]
-
-    @test_case
-    def get_by_key(self):
-        self.row._get_by_key_impl_mapping("a")
-        self.row._get_by_key_impl_mapping("b")
-        self.row_long._get_by_key_impl_mapping("s")
-        self.row_long._get_by_key_impl_mapping("a")
-
-    @test_case
-    def getattr(self):
-        self.row.a
-        self.row.b
-        self.row_long.x
-        self.row_long.y
-
-    @test_case(number=25_000)
-    def get_by_key_recreate(self):
-        self.init_objects()
-        row = self.row
-        for _ in range(25):
-            row._get_by_key_impl_mapping("a")
-        l_row = self.row_long
-        for _ in range(25):
-            l_row._get_by_key_impl_mapping("f")
-            l_row._get_by_key_impl_mapping("o")
-            l_row._get_by_key_impl_mapping("r")
-            l_row._get_by_key_impl_mapping("t")
-            l_row._get_by_key_impl_mapping("y")
-            l_row._get_by_key_impl_mapping("t")
-            l_row._get_by_key_impl_mapping("w")
-            l_row._get_by_key_impl_mapping("o")
-
-    @test_case(number=10_000)
-    def getattr_recreate(self):
-        self.init_objects()
-        row = self.row
-        for _ in range(25):
-            row.a
-        l_row = self.row_long
-        for _ in range(25):
-            l_row.f
-            l_row.o
-            l_row.r
-            l_row.t
-            l_row.y
-            l_row.t
-            l_row.w
-            l_row.o
-
-
-class AnonMap(Case):
-    @staticmethod
-    def python():
-        from sqlalchemy.sql import _util_cy
-
-        py_util = load_uncompiled_module(_util_cy)
-        assert not py_util._is_compiled()
-        return py_util.anon_map
-
-    @staticmethod
-    def cython():
-        from sqlalchemy.sql import _util_cy
-
-        assert _util_cy._is_compiled()
-        return _util_cy.anon_map
-
-    IMPLEMENTATIONS = {"python": python.__func__, "cython": cython.__func__}
-
-    NUMBER = 1000000
-
-    def init_objects(self):
-        self.object_1 = column("x")
-        self.object_2 = bindparam("y")
-
-        self.impl_w_non_present = self.impl()
-        self.impl_w_present = iwp = self.impl()
-        iwp.get_anon(self.object_1)
-        iwp.get_anon(self.object_2)
-
-    @classmethod
-    def update_results(cls, results):
-        cls._divide_results(results, "cython", "python", "cy / py")
-
-    @test_case
-    def test_make(self):
-        self.impl()
-
-    @test_case
-    def test_get_anon_np(self):
-        self.impl_w_non_present.get_anon(self.object_1)
-
-    @test_case
-    def test_get_anon_p(self):
-        self.impl_w_present.get_anon(self.object_1)
-
-    @test_case
-    def test_has_key_np(self):
-        id(self.object_1) in self.impl_w_non_present
-
-    @test_case
-    def test_has_key_p(self):
-        id(self.object_1) in self.impl_w_present
-
-
-class PrefixAnonMap(Case):
-    @staticmethod
-    def python():
-        from sqlalchemy.sql import _util_cy
-
-        py_util = load_uncompiled_module(_util_cy)
-        assert not py_util._is_compiled()
-        return py_util.prefix_anon_map
-
-    @staticmethod
-    def cython():
-        from sqlalchemy.sql import _util_cy
-
-        assert _util_cy._is_compiled()
-        return _util_cy.prefix_anon_map
-
-    IMPLEMENTATIONS = {"python": python.__func__, "cython": cython.__func__}
-
-    NUMBER = 1000000
-
-    def init_objects(self):
-        from sqlalchemy.sql.elements import _anonymous_label
-
-        self.name = _anonymous_label.safe_construct(58243, "some_column_name")
-
-        self.impl_w_non_present = self.impl()
-        self.impl_w_present = iwp = self.impl()
-        self.name.apply_map(iwp)
-
-    @classmethod
-    def update_results(cls, results):
-        cls._divide_results(results, "cython", "python", "cy / py")
-
-    @test_case
-    def test_make(self):
-        self.impl()
-
-    @test_case
-    def test_apply_np(self):
-        self.name.apply_map(self.impl_w_non_present)
-
-    @test_case
-    def test_apply_p(self):
-        self.name.apply_map(self.impl_w_present)
-
-
-def tabulate(results, inverse):
-    dim = 11
-    header = "{:<20}|" + (" {:<%s} |" % dim) * len(results)
-    num_format = "{:<%s.9f}" % dim
-    row = "{:<20}|" + " {} |" * len(results)
-    names = list(results)
-    print(header.format("", *names))
-
-    for meth in inverse:
-        strings = [
-            num_format.format(inverse[meth][name])[:dim] for name in names
-        ]
-        print(row.format(meth, *strings))
-
-
-def main():
-    import argparse
-
-    cases = Case._CASES
-
-    parser = argparse.ArgumentParser(
-        description="Compare implementation between them"
-    )
-    parser.add_argument(
-        "case",
-        help="Case to run",
-        nargs="+",
-        choices=["all"] + [c.__name__ for c in cases],
-    )
-    parser.add_argument("--filter", help="filter the test for this regexp")
-    parser.add_argument(
-        "--factor", help="scale number passed to timeit", type=float, default=1
-    )
-    parser.add_argument("--csv", help="save to csv", action="store_true")
-
-    args = parser.parse_args()
-
-    if "all" in args.case:
-        to_run = cases
-    else:
-        to_run = [c for c in cases if c.__name__ in args.case]
-
-    for case in to_run:
-        print("Running case", case.__name__)
-        result = case.run_case(args.factor, args.filter)
-
-        inverse = defaultdict(dict)
-        for name in result:
-            for meth in result[name]:
-                inverse[meth][name] = result[name][meth]
-
-        tabulate(result, inverse)
-
-        if args.csv:
-            import csv
-
-            file_name = f"{case.__name__}.csv"
-            with open(file_name, "w", newline="") as f:
-                w = csv.DictWriter(f, ["", *result])
-                w.writeheader()
-                for n in inverse:
-                    w.writerow({"": n, **inverse[n]})
-            print("Wrote file", file_name)
-
-
-if __name__ == "__main__":
-    main()
diff --git a/test/perf/compiled_extensions/__init__.py b/test/perf/compiled_extensions/__init__.py

new file mode 100644 (file)

index 0000000..e69de29
diff --git a/test/perf/compiled_extensions/__main__.py b/test/perf/compiled_extensions/__main__.py

new file mode 100644 (file)

index 0000000..15696fb
--- /dev/null
+++ b/test/perf/compiled_extensions/__main__.py
@@ -0,0 +1,11 @@
+from pathlib import Path
+import sys
+
+parent_dir = Path(__file__).parent.parent
+sys.path.insert(0, str(parent_dir.absolute()))
+if True:
+    from compiled_extensions import command
+
+
+if __name__ == "__main__":
+    command.main()
diff --git a/test/perf/compiled_extensions/base.py b/test/perf/compiled_extensions/base.py

new file mode 100644 (file)

index 0000000..fd6c419
--- /dev/null
+++ b/test/perf/compiled_extensions/base.py
@@ -0,0 +1,123 @@
+from collections import defaultdict
+import math
+import re
+from timeit import timeit
+
+
+def test_case(fn=None, *, number=None):
+    "Flag ``fn`` as a timed case; ``number`` overrides the timeit count"
+
+    def mark(target):
+        target.__test_case__ = True
+        if number is not None:
+            target.__number__ = number
+        return target
+
+    # bare ``@test_case`` receives the function, ``@test_case(...)`` does not
+    return mark if fn is None else mark(fn)
+
+
+class Case:
+    """Base test case. Mark test cases with ``test_case``"""
+
+    IMPLEMENTATIONS = {}
+    "Keys are the impl name, values are callable to load it"
+    NUMBER = 1_000_000
+
+    _CASES = []
+
+    def __init__(self, impl):
+        self.impl = impl
+        self.init_objects()
+
+    def __init_subclass__(cls):
+        if not cls.__name__.startswith("_"):
+            Case._CASES.append(cls)
+
+    def init_objects(self):
+        pass
+
+    @classmethod
+    def init_class(cls):
+        pass
+
+    @classmethod
+    def _load(cls, fn):
+        try:
+            return fn()
+        except Exception as e:
+            print(f"Error loading {fn}: {e!r}")
+
+    @classmethod
+    def import_impl(cls):
+        "Return ``(name, object)`` for each implementation that loaded"
+        loaded = (
+            (name, cls._load(fn)) for name, fn in cls.IMPLEMENTATIONS.items()
+        )
+        # ``_load`` gives None, that is falsy, when the loader raised
+        return [(name, obj) for name, obj in loaded if obj]
+
+    @classmethod
+    def _divide_results(cls, results, num, div, name):
+        "Store in ``results[name]`` the ``num / div`` ratios and their mean"
+        avg_str = "> mean of values"
+        if div in results and num in results:
+            num_dict, div_dict = results[num], results[div]
+            assert avg_str not in num_dict and avg_str not in div_dict
+            assert num_dict.keys() == div_dict.keys()
+            results[name] = {m: num_dict[m] / div_dict[m] for m in div_dict}
+            not_na = [v for v in results[name].values() if not math.isnan(v)]
+            # every ratio is NaN when all the timings of one side failed
+            avg = sum(not_na) / len(not_na) if not_na else math.nan
+            results[name][avg_str] = avg
+
+    @classmethod
+    def update_results(cls, results):
+        pass
+
+    @classmethod
+    def run_case(cls, factor, filter_):
+        "Time every test case of each implementation; NaN marks a failure"
+        objects = cls.import_impl()
+        cls.init_class()
+        number = max(1, int(cls.NUMBER * factor))
+
+        # walk the mro so inherited cases run too. ``__dict__`` keeps the
+        # definition order (dir is instead sorted); the dict keys drop the
+        # repeated name of a case overridden in a subclass
+        methods = {}
+        for curr in cls.mro():
+            if curr in (object, Case):
+                continue
+            for m, fn in curr.__dict__.items():
+                if hasattr(fn, "__test_case__"):
+                    methods[m] = None
+        if filter_:
+            methods = [m for m in methods if re.search(filter_, m)]
+
+        results = defaultdict(dict)
+        for name, impl in objects:
+            print(f"Running {name:<10} ", end="", flush=True)
+            impl_case = cls(impl)
+            fails = []
+            for m in methods:
+                call = getattr(impl_case, m)
+                try:
+                    # a per-method ``__number__`` replaces the class default
+                    fn_num = getattr(call, "__number__", None)
+                    t_num = number
+                    if fn_num is not None:
+                        t_num = max(1, int(fn_num * factor))
+                    value = timeit(call, number=t_num)
+                    print(".", end="", flush=True)
+                except Exception as e:
+                    fails.append(f"{name}::{m} error: {e}")
+                    print("x", end="", flush=True)
+                    value = float("nan")
+                results[name][m] = value
+            print(" Done")
+            for f in fails:
+                print("\t", f)
+
+        cls.update_results(results)
+        return results
diff --git a/test/perf/compiled_extensions/cache_key.py b/test/perf/compiled_extensions/cache_key.py

new file mode 100644 (file)

index 0000000..ddc8f58
--- /dev/null
+++ b/test/perf/compiled_extensions/cache_key.py
@@ -0,0 +1,243 @@
+from types import SimpleNamespace
+
+import sqlalchemy as sa
+from sqlalchemy import orm
+from sqlalchemy.dialects.oracle.base import OracleDialect
+from sqlalchemy.dialects.postgresql.base import PGDialect
+from sqlalchemy.engine import ObjectKind
+from sqlalchemy.engine import ObjectScope
+from .base import Case
+from .base import test_case
+
+
+class CacheKey(Case):
+    NUMBER = 50_000
+
+    @staticmethod
+    def traversal():
+        from sqlalchemy.sql.cache_key import HasCacheKey
+
+        return HasCacheKey._generate_cache_key
+
+    IMPLEMENTATIONS = {
+        "traversal": traversal.__func__,
+    }
+
+    @classmethod
+    def init_class(cls):
+        cls.objects = setup_objects()
+        cls.statements = setup_statements(cls.objects)
+
+        for name in (
+            "parent_table",
+            "parent_orm",
+            "parent_orm_join",
+            "many_types",
+        ):
+            cls.make_test_cases(name, cls.statements.__dict__[name])
+
+        oracle = OracleDialect()
+        oracle.server_version_info = (21, 0, 0)
+        for name, stmt, num in (
+            (
+                "_all_objects_query",
+                oracle._all_objects_query(
+                    "scott", ObjectScope.DEFAULT, ObjectKind.ANY, False, False
+                ),
+                None,
+            ),
+            (
+                "_table_options_query",
+                oracle._table_options_query(
+                    "scott", ObjectScope.DEFAULT, ObjectKind.ANY, False, False
+                ),
+                None,
+            ),
+            ("_column_query", oracle._column_query("scott"), 15_000),
+            (
+                "_comment_query",
+                oracle._comment_query(
+                    "scott", ObjectScope.DEFAULT, ObjectKind.ANY, False
+                ),
+                20_000,
+            ),
+            ("_index_query", oracle._index_query("scott"), 20_000),
+            ("_constraint_query", oracle._constraint_query("scott"), 20_000),
+        ):
+            cls.make_test_cases("oracle" + name, stmt, num)
+
+        pg = PGDialect()
+        pg.server_version_info = (16, 0, 0)
+        for name, stmt, num in (
+            ("_has_table_query", pg._has_table_query("scott"), 30_000),
+            (
+                "_columns_query",
+                pg._columns_query(
+                    "scott", False, ObjectScope.DEFAULT, ObjectKind.ANY
+                ),
+                10_000,
+            ),
+            (
+                "_table_oids_query",
+                pg._table_oids_query(
+                    "scott", False, ObjectScope.DEFAULT, ObjectKind.ANY
+                ),
+                30_000,
+            ),
+            ("_index_query", pg._index_query, 7_000),
+            ("_constraint_query", pg._constraint_query(True), 10_000),
+            (
+                "_foreing_key_query",
+                pg._foreing_key_query(
+                    "scott", False, ObjectScope.DEFAULT, ObjectKind.ANY
+                ),
+                15_000,
+            ),
+            (
+                "_comment_query",
+                pg._comment_query(
+                    "scott", False, ObjectScope.DEFAULT, ObjectKind.ANY
+                ),
+                25_000,
+            ),
+            (
+                "_check_constraint_query",
+                pg._check_constraint_query(
+                    "scott", False, ObjectScope.DEFAULT, ObjectKind.ANY
+                ),
+                20_000,
+            ),
+            ("_enum_query", pg._enum_query("scott"), 20_000),
+            ("_domain_query", pg._domain_query("scott"), 15_000),
+        ):
+            cls.make_test_cases("pg" + name, stmt, num)
+
+    @classmethod
+    def make_test_cases(cls, name, obj, number=None):
+        def go(self):
+            assert self.impl(obj) is not None
+
+        go.__name__ = name
+        setattr(cls, name, test_case(go, number=number))
+
+    @test_case
+    def check_not_caching(self):
+        c1 = self.impl(self.statements.parent_table)
+        c2 = self.impl(self.statements.parent_table)
+        assert c1 is not None
+        assert c2 is not None
+        assert c1 is not c2
+        assert c1 == c2
+
+
+def setup_objects():
+    metadata = sa.MetaData()
+    parent = sa.Table(
+        "parent",
+        metadata,
+        sa.Column("id", sa.Integer, primary_key=True),
+        sa.Column("data", sa.String(20)),
+    )
+    child = sa.Table(
+        "child",
+        metadata,
+        sa.Column("id", sa.Integer, primary_key=True),
+        sa.Column("data", sa.String(20)),
+        sa.Column(
+            "parent_id", sa.Integer, sa.ForeignKey("parent.id"), nullable=False
+        ),
+    )
+
+    class Parent:
+        pass
+
+    class Child:
+        pass
+
+    registry = orm.registry()
+    registry.map_imperatively(
+        Parent,
+        parent,
+        properties={"children": orm.relationship(Child, backref="parent")},
+    )
+    registry.map_imperatively(Child, child)
+
+    many_types = sa.Table(
+        "large",
+        metadata,
+        sa.Column("col_ARRAY", sa.ARRAY(sa.Integer)),
+        sa.Column("col_BIGINT", sa.BIGINT),
+        sa.Column("col_BigInteger", sa.BigInteger),
+        sa.Column("col_BINARY", sa.BINARY),
+        sa.Column("col_BLOB", sa.BLOB),
+        sa.Column("col_BOOLEAN", sa.BOOLEAN),
+        sa.Column("col_Boolean", sa.Boolean),
+        sa.Column("col_CHAR", sa.CHAR),
+        sa.Column("col_CLOB", sa.CLOB),
+        sa.Column("col_DATE", sa.DATE),
+        sa.Column("col_Date", sa.Date),
+        sa.Column("col_DATETIME", sa.DATETIME),
+        sa.Column("col_DateTime", sa.DateTime),
+        sa.Column("col_DECIMAL", sa.DECIMAL),
+        sa.Column("col_DOUBLE", sa.DOUBLE),
+        sa.Column("col_Double", sa.Double),
+        sa.Column("col_DOUBLE_PRECISION", sa.DOUBLE_PRECISION),
+        sa.Column("col_Enum", sa.Enum),
+        sa.Column("col_FLOAT", sa.FLOAT),
+        sa.Column("col_Float", sa.Float),
+        sa.Column("col_INT", sa.INT),
+        sa.Column("col_INTEGER", sa.INTEGER),
+        sa.Column("col_Integer", sa.Integer),
+        sa.Column("col_Interval", sa.Interval),
+        sa.Column("col_JSON", sa.JSON),
+        sa.Column("col_LargeBinary", sa.LargeBinary),
+        sa.Column("col_NCHAR", sa.NCHAR),
+        sa.Column("col_NUMERIC", sa.NUMERIC),
+        sa.Column("col_Numeric", sa.Numeric),
+        sa.Column("col_NVARCHAR", sa.NVARCHAR),
+        sa.Column("col_PickleType", sa.PickleType),
+        sa.Column("col_REAL", sa.REAL),
+        sa.Column("col_SMALLINT", sa.SMALLINT),
+        sa.Column("col_SmallInteger", sa.SmallInteger),
+        sa.Column("col_String", sa.String),
+        sa.Column("col_TEXT", sa.TEXT),
+        sa.Column("col_Text", sa.Text),
+        sa.Column("col_TIME", sa.TIME),
+        sa.Column("col_Time", sa.Time),
+        sa.Column("col_TIMESTAMP", sa.TIMESTAMP),
+        sa.Column("col_TupleType", sa.TupleType),
+        sa.Column("col_Unicode", sa.Unicode),
+        sa.Column("col_UnicodeText", sa.UnicodeText),
+        sa.Column("col_UUID", sa.UUID),
+        sa.Column("col_Uuid", sa.Uuid),
+        sa.Column("col_VARBINARY", sa.VARBINARY),
+        sa.Column("col_VARCHAR", sa.VARCHAR),
+    )
+
+    registry.configure()
+
+    return SimpleNamespace(**locals())
+
+
+def setup_statements(setup: SimpleNamespace):
+    parent_table = sa.select(setup.parent).where(setup.parent.c.id == 42)
+
+    parent_orm = (
+        sa.select(setup.Parent)
+        .order_by(setup.Parent.id)
+        .where(setup.Parent.data.like("cat"))
+    )
+
+    parent_orm_join = (
+        sa.select(setup.Parent.id, setup.Child.id)
+        .select_from(
+            orm.join(setup.Parent, setup.Child, setup.Parent.children)
+        )
+        .where(setup.Child.id == 5)
+    )
+
+    many_types = sa.select(setup.many_types).where(
+        setup.many_types.c.col_Boolean
+    )
+
+    return SimpleNamespace(**locals())
diff --git a/test/perf/compiled_extensions/collections.py b/test/perf/compiled_extensions/collections.py

new file mode 100644 (file)

index 0000000..7643bd1
--- /dev/null
+++ b/test/perf/compiled_extensions/collections.py
@@ -0,0 +1,531 @@
+from secrets import token_urlsafe
+from textwrap import wrap
+
+from sqlalchemy.util.langhelpers import load_uncompiled_module
+from .base import Case
+from .base import test_case
+
+
+class ImmutableDict(Case):
+    @staticmethod
+    def python():
+        from sqlalchemy.util import _immutabledict_cy
+
+        py_immutabledict = load_uncompiled_module(_immutabledict_cy)
+        assert not py_immutabledict._is_compiled()
+        return py_immutabledict.immutabledict
+
+    @staticmethod
+    def cython():
+        from sqlalchemy.util import _immutabledict_cy
+
+        assert _immutabledict_cy._is_compiled()
+        return _immutabledict_cy.immutabledict
+
+    IMPLEMENTATIONS = {
+        "python": python.__func__,
+        "cython": cython.__func__,
+    }
+
+    def init_objects(self):
+        self.small = {"a": 5, "b": 4}
+        self.large = {f"k{i}": f"v{i}" for i in range(50)}
+        self.d1 = self.impl({"x": 5, "y": 4})
+        self.d2 = self.impl({f"key{i}": f"value{i}" for i in range(50)})
+
+    @classmethod
+    def update_results(cls, results):
+        cls._divide_results(results, "c", "python", "c / py")
+        cls._divide_results(results, "cython", "python", "cy / py")
+        cls._divide_results(results, "cython", "c", "cy / c")
+
+    @test_case
+    def init_empty(self):
+        self.impl()
+
+    @test_case
+    def init(self):
+        self.impl(self.small)
+
+    @test_case
+    def init_large(self):
+        self.impl(self.large)
+
+    @test_case
+    def len(self):
+        len(self.d1) + len(self.d2)
+
+    @test_case
+    def getitem(self):
+        self.d1["x"]
+        self.d2["key42"]
+
+    @test_case
+    def union(self):
+        self.d1.union(self.small)
+        self.d1.union(self.small.items())
+
+    @test_case
+    def union_large(self):
+        self.d2.union(self.large)
+
+    @test_case
+    def merge_with(self):
+        self.d1.merge_with(self.small)
+        self.d1.merge_with(self.small.items())
+
+    @test_case
+    def merge_with_large(self):
+        self.d2.merge_with(self.large)
+
+    @test_case
+    def get(self):
+        self.d1.get("x")
+        self.d2.get("key42")
+
+    @test_case
+    def get_miss(self):
+        self.d1.get("xxx")
+        self.d2.get("xxx")
+
+    @test_case
+    def keys(self):
+        self.d1.keys()
+        self.d2.keys()
+
+    @test_case
+    def items(self):
+        self.d1.items()
+        self.d2.items()
+
+    @test_case
+    def values(self):
+        self.d1.values()
+        self.d2.values()
+
+    @test_case
+    def iter(self):
+        list(self.d1)
+        list(self.d2)
+
+    @test_case
+    def in_case(self):
+        "x" in self.d1  # hit in the 2 items dict
+        "key42" in self.d2  # hit in the 50 items dict
+
+    @test_case
+    def in_miss(self):
+        "xx" in self.d1  # miss in the 2 items dict
+        "xx" in self.d2  # miss in the 50 items dict
+
+    @test_case
+    def eq(self):
+        self.d1 == self.d1
+        self.d2 == self.d2
+
+    @test_case
+    def eq_dict(self):
+        self.d1 == dict(self.d1)
+        self.d2 == dict(self.d2)
+
+    @test_case
+    def eq_other(self):
+        self.d1 == self.d2
+        self.d1 == "foo"
+
+    @test_case
+    def ne(self):
+        self.d1 != self.d1
+        self.d2 != self.d2
+
+    @test_case
+    def ne_dict(self):
+        self.d1 != dict(self.d1)
+        self.d2 != dict(self.d2)
+
+    @test_case
+    def ne_other(self):
+        self.d1 != self.d2
+        self.d1 != "foo"
+
+
+class IdentitySet(Case):
+    @staticmethod
+    def set_fn():
+        return set
+
+    @staticmethod
+    def python():
+        from sqlalchemy.util import _collections_cy
+
+        py_coll = load_uncompiled_module(_collections_cy)
+        assert not py_coll._is_compiled()
+        return py_coll.IdentitySet
+
+    @staticmethod
+    def cython():
+        from sqlalchemy.util import _collections_cy
+
+        assert _collections_cy._is_compiled()
+        return _collections_cy.IdentitySet
+
+    IMPLEMENTATIONS = {
+        "set": set_fn.__func__,
+        "python": python.__func__,
+        "cython": cython.__func__,
+    }
+    NUMBER = 10
+
+    def init_objects(self):
+        self.val1 = list(range(10))
+        self.val2 = list(wrap(token_urlsafe(4 * 2048), 4))
+        self.imp_1 = self.impl(self.val1)
+        self.imp_2 = self.impl(self.val2)
+
+    @classmethod
+    def update_results(cls, results):
+        cls._divide_results(results, "python", "set", "py / set")
+        cls._divide_results(results, "cython", "python", "cy / py")
+        cls._divide_results(results, "cython", "set", "cy / set")
+
+    @test_case(number=2_500_000)
+    def init_empty(self):
+        self.impl()
+
+    @test_case(number=2_500)
+    def init(self):
+        self.impl(self.val1)
+        self.impl(self.val2)
+
+    @test_case(number=5_000)
+    def init_from_impl(self):
+        self.impl(self.imp_2)
+
+    @test_case(number=100)
+    def add(self):
+        ii = self.impl()
+        x = 25_000
+        for i in range(x):
+            ii.add(str(i % (x / 2)))
+
+    @test_case
+    def contains(self):
+        ii = self.impl(self.val2)
+        for _ in range(1_000):
+            for x in self.val1 + self.val2:
+                x in ii
+
+    @test_case(number=200)
+    def remove(self):
+        v = [str(i) for i in range(7500)]
+        ii = self.impl(v)
+        for x in v[:5000]:
+            ii.remove(x)
+
+    @test_case(number=200)
+    def discard(self):
+        v = [str(i) for i in range(7500)]
+        ii = self.impl(v)
+        for x in v[:5000]:
+            ii.discard(x)
+
+    @test_case
+    def pop(self):
+        for _ in range(50_000):
+            ii = self.impl(self.val1)
+            for _ in range(len(self.val1)):  # empty the set, one pop each
+                ii.pop()
+
+    @test_case
+    def clear(self):
+        i, v = self.impl, self.val1
+        for _ in range(125_000):
+            ii = i(v)
+            ii.clear()
+
+    @test_case(number=2_500_000)
+    def eq(self):
+        self.imp_1 == self.imp_1
+        self.imp_1 == self.imp_2
+        self.imp_1 == self.val2
+
+    @test_case(number=2_500_000)
+    def ne(self):
+        self.imp_1 != self.imp_1
+        self.imp_1 != self.imp_2
+        self.imp_1 != self.val2
+
+    @test_case(number=20_000)
+    def issubset(self):
+        self.imp_1.issubset(self.imp_1)
+        self.imp_1.issubset(self.imp_2)
+        self.imp_1.issubset(self.val1)
+        self.imp_1.issubset(self.val2)
+
+    @test_case(number=50_000)
+    def le(self):
+        self.imp_1 <= self.imp_1
+        self.imp_1 <= self.imp_2
+        self.imp_2 <= self.imp_1
+        self.imp_2 <= self.imp_2
+
+    @test_case(number=2_500_000)
+    def lt(self):
+        self.imp_1 < self.imp_1
+        self.imp_1 < self.imp_2
+        self.imp_2 < self.imp_1
+        self.imp_2 < self.imp_2
+
+    @test_case(number=20_000)
+    def issuperset(self):
+        self.imp_1.issuperset(self.imp_1)
+        self.imp_1.issuperset(self.imp_2)
+        self.imp_1.issuperset(self.val1)  # plain list arguments
+        self.imp_1.issuperset(self.val2)
+
+    @test_case(number=50_000)
+    def ge(self):
+        self.imp_1 >= self.imp_1
+        self.imp_1 >= self.imp_2
+        self.imp_2 >= self.imp_1
+        self.imp_2 >= self.imp_2
+
+    @test_case(number=2_500_000)
+    def gt(self):
+        self.imp_1 > self.imp_1
+        self.imp_1 > self.imp_2  # same four pairs used by lt, le and ge
+        self.imp_2 > self.imp_1
+        self.imp_2 > self.imp_2
+
+    @test_case(number=10_000)
+    def union(self):
+        self.imp_1.union(self.imp_2)
+
+    @test_case(number=10_000)
+    def or_test(self):
+        self.imp_1 | self.imp_2
+
+    @test_case
+    def update(self):
+        ii = self.impl(self.val1)
+        for _ in range(1_000):
+            ii.update(self.imp_2)
+
+    @test_case
+    def ior(self):
+        ii = self.impl(self.val1)
+        for _ in range(1_000):
+            ii |= self.imp_2
+
+    @test_case
+    def difference(self):
+        for _ in range(2_500):
+            self.imp_1.difference(self.imp_2)
+            self.imp_1.difference(self.val2)
+
+    @test_case(number=250_000)
+    def sub(self):
+        self.imp_1 - self.imp_2
+
+    @test_case
+    def difference_update(self):
+        ii = self.impl(self.val1)
+        for _ in range(2_500):
+            ii.difference_update(self.imp_2)
+            ii.difference_update(self.val2)
+
+    @test_case
+    def isub(self):
+        ii = self.impl(self.val1)
+        for _ in range(250_000):
+            ii -= self.imp_2
+
+    @test_case(number=20_000)
+    def intersection(self):
+        self.imp_1.intersection(self.imp_2)
+        self.imp_1.intersection(self.val2)
+
+    @test_case(number=250_000)
+    def and_test(self):
+        self.imp_1 & self.imp_2
+
+    @test_case
+    def intersection_up(self):
+        ii = self.impl(self.val1)
+        for _ in range(2_500):
+            ii.intersection_update(self.imp_2)
+            ii.intersection_update(self.val2)
+
+    @test_case
+    def iand(self):
+        ii = self.impl(self.val1)
+        for _ in range(250_000):
+            ii &= self.imp_2
+
+    @test_case(number=2_500)
+    def symmetric_diff(self):
+        self.imp_1.symmetric_difference(self.imp_2)
+        self.imp_1.symmetric_difference(self.val2)
+
+    @test_case(number=2_500)
+    def xor(self):
+        self.imp_1 ^ self.imp_2
+
+    @test_case
+    def symmetric_diff_up(self):
+        ii = self.impl(self.val1)
+        for _ in range(125):
+            ii.symmetric_difference_update(self.imp_2)
+            ii.symmetric_difference_update(self.val2)
+
+    @test_case
+    def ixor(self):
+        ii = self.impl(self.val1)
+        for _ in range(250):
+            ii ^= self.imp_2
+
+    @test_case(number=25_000)
+    def copy(self):
+        self.imp_1.copy()
+        self.imp_2.copy()
+
+    @test_case(number=2_500_000)
+    def len(self):
+        len(self.imp_1)
+        len(self.imp_2)
+
+    @test_case(number=25_000)
+    def iter(self):
+        list(self.imp_1)
+        list(self.imp_2)
+
+    @test_case(number=10_000)
+    def repr(self):
+        str(self.imp_1)
+        str(self.imp_2)
+
+
+class OrderedSet(IdentitySet):
+    @staticmethod
+    def set_fn():
+        return set
+
+    @staticmethod
+    def python():
+        from sqlalchemy.util import _collections_cy
+
+        py_coll = load_uncompiled_module(_collections_cy)
+        assert not py_coll._is_compiled()
+        return py_coll.OrderedSet
+
+    @staticmethod
+    def cython():
+        from sqlalchemy.util import _collections_cy
+
+        assert _collections_cy._is_compiled()
+        return _collections_cy.OrderedSet
+
+    @staticmethod
+    def ordered_lib():
+        from orderedset import OrderedSet
+
+        return OrderedSet
+
+    IMPLEMENTATIONS = {
+        "set": set_fn.__func__,
+        "python": python.__func__,
+        "cython": cython.__func__,
+        "ordsetlib": ordered_lib.__func__,
+    }
+
+    @classmethod
+    def update_results(cls, results):
+        super().update_results(results)
+        cls._divide_results(results, "ordsetlib", "set", "ordlib/set")
+        cls._divide_results(results, "cython", "ordsetlib", "cy / ordlib")
+
+    @test_case
+    def add_op(self):
+        ii = self.impl(self.val1)
+        v2 = self.impl(self.val2)
+        for _ in range(500):
+            ii + v2
+
+    @test_case
+    def getitem(self):
+        ii = self.impl(self.val1)
+        for _ in range(250_000):
+            for i in range(len(self.val1)):
+                ii[i]
+
+    @test_case
+    def insert(self):
+        for _ in range(5):
+            ii = self.impl(self.val1)
+            for i in range(5_000):
+                ii.insert(i // 2, i)
+                ii.insert(-i % 2, i)
+
+
+class UniqueList(Case):
+    @staticmethod
+    def python():
+        from sqlalchemy.util import _collections_cy
+
+        py_coll = load_uncompiled_module(_collections_cy)
+        assert not py_coll._is_compiled()
+        return py_coll.unique_list
+
+    @staticmethod
+    def cython():
+        from sqlalchemy.util import _collections_cy
+
+        assert _collections_cy._is_compiled()
+        return _collections_cy.unique_list
+
+    IMPLEMENTATIONS = {
+        "python": python.__func__,
+        "cython": cython.__func__,
+    }
+
+    @classmethod
+    def update_results(cls, results):
+        cls._divide_results(results, "cython", "python", "cy / py")
+
+    def init_objects(self):
+        self.int_small = list(range(10))
+        self.int_vlarge = list(range(25_000)) * 2
+        d = wrap(token_urlsafe(100 * 2048), 4)
+        assert len(d) > 50_000
+        self.vlarge = d[:50_000]
+        self.large = d[:500]
+        self.small = d[:15]
+
+    @test_case
+    def small_str(self):
+        self.impl(self.small)
+
+    @test_case(number=50_000)
+    def large_str(self):
+        self.impl(self.large)
+
+    @test_case(number=250)
+    def vlarge_str(self):
+        self.impl(self.vlarge)
+
+    @test_case
+    def small_range(self):
+        self.impl(range(10))
+
+    @test_case
+    def small_int(self):
+        self.impl(self.int_small)
+
+    @test_case(number=25_000)
+    def large_int(self):
+        self.impl([1, 1, 1, 2, 3] * 100)
+        self.impl(range(1000))
+
+    @test_case(number=250)
+    def vlarge_int(self):
+        self.impl(self.int_vlarge)
diff --git a/test/perf/compiled_extensions/command.py b/test/perf/compiled_extensions/command.py

new file mode 100644 (file)

index 0000000..21fc1ca
--- /dev/null
+++ b/test/perf/compiled_extensions/command.py
@@ -0,0 +1,89 @@
+from collections import defaultdict
+
+from .base import Case
+
+if True:
+    from . import cache_key  # noqa: F401
+    from . import collections  # noqa: F401
+    from . import misc  # noqa: F401
+    from . import row  # noqa: F401
+
+
+def tabulate(
+    result_by_impl: dict[str, dict[str, float]],
+    result_by_method: dict[str, dict[str, float]],
+):
+    "Print one row per method and one column per implementation"
+    if not result_by_method:
+        return
+    dim = 11
+    names = list(result_by_impl)
+    width = max(20, *(len(m) + 1 for m in result_by_method))
+
+    # cells are left aligned and ``dim`` characters wide
+    first_col = "{:<%s}|" % width
+    string_cell = "{:<%s}" % dim
+    num_format = "{:<%s.9f}" % dim
+    header = first_col + f" {string_cell} |" * len(names)
+    line = first_col + " {} |" * len(names)
+    print(header.format("", *names))
+
+    for meth, data in result_by_method.items():
+        cells = []
+        for name in names:
+            if name in data:
+                # the slice keeps large numbers inside the column
+                cells.append(num_format.format(data[name])[:dim])
+            else:
+                cells.append(string_cell.format("—"))
+        print(line.format(meth, *cells))
+
+
+def main():
+    import argparse
+
+    cases = Case._CASES
+
+    parser = argparse.ArgumentParser(
+        description="Compare implementation between them"
+    )
+    parser.add_argument(
+        "case",
+        help="Case to run",
+        nargs="+",
+        choices=["all"] + sorted(c.__name__ for c in cases),
+    )
+    parser.add_argument("--filter", help="filter the test for this regexp")
+    parser.add_argument(
+        "--factor", help="scale number passed to timeit", type=float, default=1
+    )
+    parser.add_argument("--csv", help="save to csv", action="store_true")
+
+    args = parser.parse_args()
+
+    if "all" in args.case:
+        to_run = cases
+    else:
+        to_run = [c for c in cases if c.__name__ in args.case]
+
+    for case in to_run:
+        print("Running case", case.__name__)
+        result_by_impl = case.run_case(args.factor, args.filter)
+
+        result_by_method = defaultdict(dict)
+        for name in result_by_impl:
+            for meth in result_by_impl[name]:
+                result_by_method[meth][name] = result_by_impl[name][meth]
+
+        tabulate(result_by_impl, result_by_method)
+
+        if args.csv:
+            import csv
+
+            file_name = f"{case.__name__}.csv"
+            with open(file_name, "w", newline="") as f:
+                w = csv.DictWriter(f, ["", *result_by_impl])
+                w.writeheader()
+                for n in result_by_method:
+                    w.writerow({"": n, **result_by_method[n]})
+            print("Wrote file", file_name)
diff --git a/test/perf/compiled_extensions/misc.py b/test/perf/compiled_extensions/misc.py

new file mode 100644 (file)

index 0000000..01ff055
--- /dev/null
+++ b/test/perf/compiled_extensions/misc.py
@@ -0,0 +1,303 @@
+from decimal import Decimal
+from types import MappingProxyType
+
+from sqlalchemy import bindparam
+from sqlalchemy import column
+from sqlalchemy.util.langhelpers import load_uncompiled_module
+from .base import Case
+from .base import test_case
+
+
+class Processors(Case):
+    """Benchmark case for the functions of ``_processors_cy``.
+
+    Compares the module returned by ``load_uncompiled_module`` with the
+    regularly imported (compiled) module.
+    """
+
+    @staticmethod
+    def python():
+        """Return the uncompiled variant of ``_processors_cy``."""
+        from sqlalchemy.engine import _processors_cy
+
+        py_processors = load_uncompiled_module(_processors_cy)
+        # make sure the loaded module really is the non compiled one
+        assert not py_processors._is_compiled()
+        return py_processors
+
+    @staticmethod
+    def cython():
+        """Return ``_processors_cy``, asserting that it is compiled."""
+        from sqlalchemy.engine import _processors_cy
+
+        assert _processors_cy._is_compiled()
+        return _processors_cy
+
+    # ``__func__`` unwraps the staticmethod objects, which are not yet
+    # bound while the class body is executing
+    IMPLEMENTATIONS = {
+        "python": python.__func__,
+        "cython": cython.__func__,
+    }
+    NUMBER = 500_000
+
+    def init_objects(self):
+        """Create the decimal processor used by ``to_decimal_call``."""
+        self.to_dec = self.impl.to_decimal_processor_factory(Decimal, 3)
+
+    @classmethod
+    def update_results(cls, results):
+        """Add the ratio entries between implementations to ``results``."""
+        # NOTE(review): IMPLEMENTATIONS above registers no "c" entry, so
+        # the two ratios involving "c" look like leftovers - confirm how
+        # _divide_results treats a missing implementation
+        cls._divide_results(results, "c", "python", "c / py")
+        cls._divide_results(results, "cython", "python", "cy / py")
+        cls._divide_results(results, "cython", "c", "cy / c")
+
+    @test_case
+    def int_to_boolean(self):
+        self.impl.int_to_boolean(None)
+        self.impl.int_to_boolean(10)
+        self.impl.int_to_boolean(1)
+        self.impl.int_to_boolean(-10)
+        self.impl.int_to_boolean(0)
+
+    @test_case
+    def to_str(self):
+        self.impl.to_str(None)
+        self.impl.to_str(123)
+        self.impl.to_str(True)
+        # the case instance itself serves as an arbitrary object
+        self.impl.to_str(self)
+        self.impl.to_str("self")
+
+    @test_case
+    def to_float(self):
+        # mixes None, int, bool, float and string inputs
+        self.impl.to_float(None)
+        self.impl.to_float(123)
+        self.impl.to_float(True)
+        self.impl.to_float(42)
+        self.impl.to_float(0)
+        self.impl.to_float(42.0)
+        self.impl.to_float("nan")
+        self.impl.to_float("42")
+        self.impl.to_float("42.0")
+
+    @test_case
+    def str_to_datetime(self):
+        # None, a value without and a value with fractional seconds
+        self.impl.str_to_datetime(None)
+        self.impl.str_to_datetime("2020-01-01 20:10:34")
+        self.impl.str_to_datetime("2030-11-21 01:04:34.123456")
+
+    @test_case
+    def str_to_time(self):
+        # None, a value without and a value with fractional seconds
+        self.impl.str_to_time(None)
+        self.impl.str_to_time("20:10:34")
+        self.impl.str_to_time("01:04:34.123456")
+
+    @test_case
+    def str_to_date(self):
+        self.impl.str_to_date(None)
+        self.impl.str_to_date("2020-01-01")
+
+    @test_case
+    def to_decimal_call(self):
+        """Call the processor created in ``init_objects``."""
+        # this assert is part of the test body and runs on every call
+        assert self.to_dec(None) is None
+        self.to_dec(123.44)
+        self.to_dec(99)
+        self.to_dec(1 / 3)
+
+    @test_case
+    def to_decimal_pf_make(self):
+        """Create new processors, without calling them."""
+        self.impl.to_decimal_processor_factory(Decimal, 3)
+        self.impl.to_decimal_processor_factory(Decimal, 7)
+
+
+class DistillParam(Case):
+    """Benchmark case for ``_distill_params_20`` / ``_distill_raw_params``.
+
+    Compares the ``sqlalchemy.engine._util_cy`` module returned by
+    ``load_uncompiled_module`` with the regularly imported (compiled) one.
+    """
+
+    NUMBER = 2_000_000
+
+    @staticmethod
+    def python():
+        """Return the uncompiled variant of ``_util_cy``."""
+        from sqlalchemy.engine import _util_cy
+
+        py_util = load_uncompiled_module(_util_cy)
+        # make sure the loaded module really is the non compiled one
+        assert not py_util._is_compiled()
+        return py_util
+
+    @staticmethod
+    def cython():
+        """Return ``_util_cy``, asserting that it is compiled."""
+        from sqlalchemy.engine import _util_cy
+
+        assert _util_cy._is_compiled()
+        return _util_cy
+
+    # ``__func__`` unwraps the staticmethod objects, which are not yet
+    # bound while the class body is executing
+    IMPLEMENTATIONS = {
+        "python": python.__func__,
+        "cython": cython.__func__,
+    }
+
+    def init_objects(self):
+        """Create the parameter collections passed to the functions."""
+        self.tup_tup = tuple(tuple(range(10)) for _ in range(100))
+        self.list_tup = list(self.tup_tup)
+        self.dict = {f"c{i}": i for i in range(100)}
+        self.mapping = MappingProxyType(self.dict)
+        self.tup_dic = (self.dict, self.dict)
+        self.list_dic = [self.dict, self.dict]
+
+    @classmethod
+    def update_results(cls, results):
+        """Add the ratio entries between implementations to ``results``."""
+        # NOTE(review): IMPLEMENTATIONS above registers no "c" entry, so
+        # the two ratios involving "c" look like leftovers - confirm how
+        # _divide_results treats a missing implementation
+        cls._divide_results(results, "c", "python", "c / py")
+        cls._divide_results(results, "cython", "python", "cy / py")
+        cls._divide_results(results, "cython", "c", "cy / c")
+
+    @test_case
+    def none_20(self):
+        self.impl._distill_params_20(None)
+
+    @test_case
+    def empty_sequence_20(self):
+        self.impl._distill_params_20(())
+        self.impl._distill_params_20([])
+
+    @test_case
+    def list_20(self):
+        self.impl._distill_params_20(self.list_tup)
+
+    @test_case
+    def tuple_20(self):
+        self.impl._distill_params_20(self.tup_tup)
+
+    @test_case
+    def list_dict_20(self):
+        # list of dicts; previously passed ``list_tup``, which made this
+        # test a duplicate of ``list_20``
+        self.impl._distill_params_20(self.list_dic)
+
+    @test_case
+    def tuple_dict_20(self):
+        # tuple of dicts; previously passed the plain dict
+        self.impl._distill_params_20(self.tup_dic)
+
+    @test_case
+    def mapping_20(self):
+        self.impl._distill_params_20(self.mapping)
+
+    @test_case
+    def raw_none(self):
+        self.impl._distill_raw_params(None)
+
+    @test_case
+    def raw_empty_sequence(self):
+        self.impl._distill_raw_params(())
+        self.impl._distill_raw_params([])
+
+    @test_case
+    def raw_list(self):
+        self.impl._distill_raw_params(self.list_tup)
+
+    @test_case
+    def raw_tuple(self):
+        self.impl._distill_raw_params(self.tup_tup)
+
+    @test_case
+    def raw_list_dict(self):
+        # list of dicts; previously passed ``list_tup``, which made this
+        # test a duplicate of ``raw_list``
+        self.impl._distill_raw_params(self.list_dic)
+
+    @test_case
+    def raw_tuple_dict(self):
+        # tuple of dicts; previously passed the plain dict
+        self.impl._distill_raw_params(self.tup_dic)
+
+    @test_case
+    def raw_mapping(self):
+        self.impl._distill_raw_params(self.mapping)
+
+
+class AnonMap(Case):
+    """Benchmark case for ``anon_map`` of ``sqlalchemy.sql._util_cy``.
+
+    The ``_np`` tests use a map where the object is "non present", the
+    ``_p`` tests a map that was populated in ``init_objects``.
+    """
+
+    NUMBER = 5_000_000
+
+    @staticmethod
+    def python():
+        """Return ``anon_map`` from the uncompiled ``_util_cy`` module."""
+        from sqlalchemy.sql import _util_cy
+
+        py_util = load_uncompiled_module(_util_cy)
+        # make sure the loaded module really is the non compiled one
+        assert not py_util._is_compiled()
+        return py_util.anon_map
+
+    @staticmethod
+    def cython():
+        """Return ``anon_map`` from the compiled ``_util_cy`` module."""
+        from sqlalchemy.sql import _util_cy
+
+        assert _util_cy._is_compiled()
+        return _util_cy.anon_map
+
+    # ``__func__`` unwraps the staticmethod objects, which are not yet
+    # bound while the class body is executing
+    IMPLEMENTATIONS = {"python": python.__func__, "cython": cython.__func__}
+
+    def init_objects(self):
+        """Create the looked up objects, an empty and a populated map."""
+        self.object_1 = column("x")
+        self.object_2 = bindparam("y")
+
+        self.impl_w_non_present = self.impl()
+        self.impl_w_present = iwp = self.impl()
+        # register both objects in the "present" map
+        iwp.get_anon(self.object_1)
+        iwp.get_anon(self.object_2)
+
+    @classmethod
+    def update_results(cls, results):
+        """Add the cython / python ratio entry to ``results``."""
+        cls._divide_results(results, "cython", "python", "cy / py")
+
+    @test_case
+    def test_make(self):
+        self.impl()
+
+    @test_case
+    def test_get_anon_np(self):
+        self.impl_w_non_present.get_anon(self.object_1)
+        # empty the map again so that the next call still misses
+        self.impl_w_non_present.clear()
+
+    @test_case
+    def test_get_anon_p(self):
+        self.impl_w_present.get_anon(self.object_1)
+
+    @test_case
+    def test_get_item_np(self):
+        self.impl_w_non_present[self.object_1]
+        # empty the map again so that the next call still misses
+        self.impl_w_non_present.clear()
+
+    @test_case
+    def test_get_item_p(self):
+        self.impl_w_present[self.object_1]
+
+    @test_case
+    def test_has_key_np(self):
+        # membership is tested with the ``id()`` of the object
+        id(self.object_1) in self.impl_w_non_present
+
+    @test_case
+    def test_has_key_p(self):
+        # membership is tested with the ``id()`` of the object
+        id(self.object_1) in self.impl_w_present
+
+
+class PrefixAnonMap(Case):
+    """Benchmark case for ``prefix_anon_map`` of ``sqlalchemy.sql._util_cy``.
+
+    ``test_apply_np`` applies an anonymous label to a map where it is
+    "non present", ``test_apply_p`` to a map that was populated in
+    ``init_objects``.
+    """
+
+    @staticmethod
+    def python():
+        """Return ``prefix_anon_map`` from the uncompiled ``_util_cy``."""
+        from sqlalchemy.sql import _util_cy
+
+        py_util = load_uncompiled_module(_util_cy)
+        # make sure the loaded module really is the non compiled one
+        assert not py_util._is_compiled()
+        return py_util.prefix_anon_map
+
+    @staticmethod
+    def cython():
+        """Return ``prefix_anon_map`` from the compiled ``_util_cy``."""
+        from sqlalchemy.sql import _util_cy
+
+        assert _util_cy._is_compiled()
+        return _util_cy.prefix_anon_map
+
+    # ``__func__`` unwraps the staticmethod objects, which are not yet
+    # bound while the class body is executing
+    IMPLEMENTATIONS = {"python": python.__func__, "cython": cython.__func__}
+
+    NUMBER = 1_000_000
+
+    def init_objects(self):
+        """Create the anonymous label, an empty and a populated map."""
+        from sqlalchemy.sql.elements import _anonymous_label
+
+        self.name = _anonymous_label.safe_construct(58243, "some_column_name")
+
+        self.impl_w_non_present = self.impl()
+        self.impl_w_present = iwp = self.impl()
+        # register the label in the "present" map
+        self.name.apply_map(iwp)
+
+    @classmethod
+    def update_results(cls, results):
+        """Add the cython / python ratio entry to ``results``."""
+        cls._divide_results(results, "cython", "python", "cy / py")
+
+    @test_case
+    def test_make(self):
+        self.impl()
+
+    @test_case
+    def test_apply_np(self):
+        self.name.apply_map(self.impl_w_non_present)
+        # empty the map again, as AnonMap does in its ``_np`` tests;
+        # without it only the very first call measures a miss and every
+        # following one repeats ``test_apply_p``
+        self.impl_w_non_present.clear()
+
+    @test_case
+    def test_apply_p(self):
+        self.name.apply_map(self.impl_w_present)
diff --git a/test/perf/compiled_extensions/row.py b/test/perf/compiled_extensions/row.py

new file mode 100644 (file)

index 0000000..7fe8d00
--- /dev/null
+++ b/test/perf/compiled_extensions/row.py
@@ -0,0 +1,277 @@
+from sqlalchemy.util.langhelpers import load_uncompiled_module
+from .base import Case
+from .base import test_case
+
+
+class TupleGetter(Case):
+    """Benchmark case for the ``tuplegetter`` callable.
+
+    Times both calling already created getters and creating a getter
+    followed by a single call (the ``tuplegetter_new_*`` tests).
+    """
+
+    NUMBER = 2_000_000
+
+    @staticmethod
+    def python():
+        """Return ``tuplegetter`` from the uncompiled ``_util_cy`` module."""
+        from sqlalchemy.engine import _util_cy
+
+        py_util = load_uncompiled_module(_util_cy)
+        # make sure the loaded module really is the non compiled one
+        assert not py_util._is_compiled()
+        return py_util.tuplegetter
+
+    @staticmethod
+    def c():
+        """Return ``tuplegetter`` from the ``cresultproxy`` module."""
+        # NOTE(review): this import raises when ``cresultproxy`` is not
+        # available; ``Case._load`` catches and prints loader errors -
+        # confirm that the implementation is then just left out
+        from sqlalchemy import cresultproxy
+
+        return cresultproxy.tuplegetter
+
+    @staticmethod
+    def cython():
+        """Return ``tuplegetter`` from the compiled ``_util_cy`` module."""
+        from sqlalchemy.engine import _util_cy
+
+        assert _util_cy._is_compiled()
+        return _util_cy.tuplegetter
+
+    # ``__func__`` unwraps the staticmethod objects, which are not yet
+    # bound while the class body is executing
+    IMPLEMENTATIONS = {
+        "python": python.__func__,
+        "c": c.__func__,
+        "cython": cython.__func__,
+    }
+
+    def init_objects(self):
+        """Create the source tuple and the reusable getter instances."""
+        self.impl_tg = self.impl
+
+        self.tuple = tuple(range(1000))
+        # single index, scattered indexes and consecutive indexes
+        self.tg_inst = self.impl_tg(42)
+        self.tg_inst_m = self.impl_tg(42, 420, 99, 9, 1)
+        self.tg_inst_seq = self.impl_tg(*range(70, 75))
+
+    @classmethod
+    def update_results(cls, results):
+        """Add the ratio entries between implementations to ``results``."""
+        cls._divide_results(results, "c", "python", "c / py")
+        cls._divide_results(results, "cython", "python", "cy / py")
+        cls._divide_results(results, "cython", "c", "cy / c")
+
+    @test_case
+    def tuplegetter_one(self):
+        self.tg_inst(self.tuple)
+
+    @test_case
+    def tuplegetter_many(self):
+        self.tg_inst_m(self.tuple)
+
+    @test_case
+    def tuplegetter_seq(self):
+        self.tg_inst_seq(self.tuple)
+
+    @test_case
+    def tuplegetter_new_one(self):
+        self.impl_tg(42)(self.tuple)
+
+    @test_case
+    def tuplegetter_new_many(self):
+        self.impl_tg(42, 420, 99, 9, 1)(self.tuple)
+
+    @test_case
+    def tuplegetter_new_seq(self):
+        # consecutive indexes 40..44, while ``tg_inst_seq`` uses 70..74
+        self.impl_tg(40, 41, 42, 43, 44)(self.tuple)
+
+
+class BaseRow(Case):
+    """Benchmark case for ``BaseRow`` of ``sqlalchemy.engine._row_cy``.
+
+    Most tests run against a 3 column row and a 52 column row, both
+    created in ``init_objects``.
+    """
+
+    @staticmethod
+    def python():
+        """Return ``BaseRow`` from the uncompiled ``_row_cy`` module."""
+        from sqlalchemy.engine import _row_cy
+
+        py_res = load_uncompiled_module(_row_cy)
+        # make sure the loaded module really is the non compiled one
+        assert not py_res._is_compiled()
+        return py_res.BaseRow
+
+    @staticmethod
+    def cython():
+        """Return ``BaseRow`` from the compiled ``_row_cy`` module."""
+        from sqlalchemy.engine import _row_cy
+
+        assert _row_cy._is_compiled()
+        return _row_cy.BaseRow
+
+    # ``__func__`` unwraps the staticmethod objects, which are not yet
+    # bound while the class body is executing
+    IMPLEMENTATIONS = {
+        "python": python.__func__,
+        "cython": cython.__func__,
+    }
+
+    def init_objects(self):
+        """Create the metadata, constructor arguments and row instances."""
+        from sqlalchemy.engine.result import SimpleResultMetaData
+        from string import ascii_letters
+
+        # short row: columns "a", "b", "c" with values 1, 2, 3
+        self.parent = SimpleResultMetaData(("a", "b", "c"))
+        self.row_args = (
+            self.parent,
+            self.parent._processors,
+            self.parent._key_to_index,
+            (1, 2, 3),
+        )
+        # long row: one column per ascii letter, valued 0..51
+        self.parent_long = SimpleResultMetaData(tuple(ascii_letters))
+        self.row_long_args = (
+            self.parent_long,
+            self.parent_long._processors,
+            self.parent_long._key_to_index,
+            tuple(range(len(ascii_letters))),
+        )
+        self.row = self.impl(*self.row_args)
+        self.row_long = self.impl(*self.row_long_args)
+        assert isinstance(self.row, self.impl), type(self.row)
+
+        # python subclass of the implementation, used by the ``row_new*``
+        # tests
+        class Row(self.impl):
+            pass
+
+        self.Row = Row
+        self.row_sub = Row(*self.row_args)
+
+        # states restored by ``row_loads``
+        self.row_state = self.row.__getstate__()
+        self.row_long_state = self.row_long.__getstate__()
+
+        assert len(ascii_letters) == 52
+        # 5 * 10 + 2 = 52 entries, one for every column
+        _proc = [None, int, float, None, str] * 10
+        _proc += [int, float]
+        self.parent_proc = SimpleResultMetaData(
+            tuple(ascii_letters),
+            _processors=_proc,
+        )
+        self.row_proc_args = (
+            self.parent_proc,
+            self.parent_proc._processors,
+            self.parent_proc._key_to_index,
+            tuple(range(len(ascii_letters))),
+        )
+
+        self.parent_proc_none = SimpleResultMetaData(
+            tuple(ascii_letters), _processors=[None] * 52
+        )
+        self.row_proc_none_args = (
+            self.parent_proc_none,
+            # NOTE: usually the code calls _effective_processors that returns
+            # None for this case of all None.
+            self.parent_proc_none._processors,
+            self.parent_proc_none._key_to_index,
+            tuple(range(len(ascii_letters))),
+        )
+
+    @classmethod
+    def update_results(cls, results):
+        """Add the ratio entries between implementations to ``results``."""
+        # NOTE(review): IMPLEMENTATIONS above registers no "c" entry, so
+        # the two ratios involving "c" look like leftovers - confirm how
+        # _divide_results treats a missing implementation
+        cls._divide_results(results, "c", "python", "c / py")
+        cls._divide_results(results, "cython", "python", "cy / py")
+        cls._divide_results(results, "cython", "c", "cy / c")
+
+    @test_case
+    def base_row_new(self):
+        self.impl(*self.row_args)
+        self.impl(*self.row_long_args)
+
+    @test_case
+    def row_new(self):
+        self.Row(*self.row_args)
+        self.Row(*self.row_long_args)
+
+    @test_case
+    def base_row_new_proc(self):
+        self.impl(*self.row_proc_args)
+
+    @test_case
+    def row_new_proc(self):
+        self.Row(*self.row_proc_args)
+
+    # NOTE(review): named ``brow_`` while the sibling tests use
+    # ``base_row_``; the name is presumably also the label shown in the
+    # results, so it is left as is - confirm before renaming
+    @test_case
+    def brow_new_proc_none(self):
+        self.impl(*self.row_proc_none_args)
+
+    @test_case
+    def row_new_proc_none(self):
+        self.Row(*self.row_proc_none_args)
+
+    @test_case
+    def row_dumps(self):
+        self.row.__getstate__()
+        self.row_long.__getstate__()
+
+    @test_case
+    def row_loads(self):
+        # ``__new__`` creates the instance without calling ``__init__``;
+        # the state captured in ``init_objects`` is then restored on it
+        self.impl.__new__(self.impl).__setstate__(self.row_state)
+        self.impl.__new__(self.impl).__setstate__(self.row_long_state)
+
+    @test_case
+    def row_values_impl(self):
+        self.row._values_impl()
+        self.row_long._values_impl()
+
+    @test_case
+    def row_iter(self):
+        list(self.row)
+        list(self.row_long)
+
+    @test_case
+    def row_len(self):
+        len(self.row)
+        len(self.row_long)
+
+    @test_case
+    def row_hash(self):
+        hash(self.row)
+        hash(self.row_long)
+
+    @test_case
+    def getitem(self):
+        self.row[0]
+        self.row[1]
+        self.row[-1]
+        self.row_long[0]
+        self.row_long[1]
+        self.row_long[-1]
+
+    @test_case
+    def getitem_slice(self):
+        self.row[0:1]
+        self.row[1:-1]
+        self.row_long[0:1]
+        self.row_long[1:-1]
+
+    @test_case
+    def get_by_key(self):
+        self.row._get_by_key_impl_mapping("a")
+        self.row._get_by_key_impl_mapping("b")
+        self.row_long._get_by_key_impl_mapping("s")
+        self.row_long._get_by_key_impl_mapping("a")
+
+    @test_case
+    def getattr(self):
+        self.row.a
+        self.row.b
+        self.row_long.x
+        self.row_long.y
+
+    @test_case(number=25_000)
+    def get_by_key_recreate(self):
+        """Like ``get_by_key``, on objects rebuilt at every call."""
+        # every object is created again, so the lookups below run on
+        # fresh rows; the explicit ``number`` replaces the class default
+        self.init_objects()
+        row = self.row
+        for _ in range(25):
+            row._get_by_key_impl_mapping("a")
+        l_row = self.row_long
+        for _ in range(25):
+            l_row._get_by_key_impl_mapping("f")
+            l_row._get_by_key_impl_mapping("o")
+            l_row._get_by_key_impl_mapping("r")
+            l_row._get_by_key_impl_mapping("t")
+            l_row._get_by_key_impl_mapping("y")
+            l_row._get_by_key_impl_mapping("t")
+            l_row._get_by_key_impl_mapping("w")
+            l_row._get_by_key_impl_mapping("o")
+
+    @test_case(number=10_000)
+    def getattr_recreate(self):
+        """Like ``getattr``, on objects rebuilt at every call."""
+        # every object is created again, so the lookups below run on
+        # fresh rows; the explicit ``number`` replaces the class default
+        self.init_objects()
+        row = self.row
+        for _ in range(25):
+            row.a
+        l_row = self.row_long
+        for _ in range(25):
+            l_row.f
+            l_row.o
+            l_row.r
+            l_row.t
+            l_row.y
+            l_row.t
+            l_row.w
+            l_row.o
author	Federico Caselli <cfederico87@gmail.com>
	Thu, 23 Nov 2023 20:58:40 +0000 (21:58 +0100)
committer	Federico Caselli <cfederico87@gmail.com>
	Wed, 27 Mar 2024 20:12:07 +0000 (21:12 +0100)
test/perf/compiled_extensions.py	[deleted file]	patch \| blob \| blame \| history
test/perf/compiled_extensions/__init__.py	[new file with mode: 0644]	patch \| blob
test/perf/compiled_extensions/__main__.py	[new file with mode: 0644]	patch \| blob
test/perf/compiled_extensions/base.py	[new file with mode: 0644]	patch \| blob
test/perf/compiled_extensions/cache_key.py	[new file with mode: 0644]	patch \| blob
test/perf/compiled_extensions/collections.py	[new file with mode: 0644]	patch \| blob
test/perf/compiled_extensions/command.py	[new file with mode: 0644]	patch \| blob
test/perf/compiled_extensions/misc.py	[new file with mode: 0644]	patch \| blob
test/perf/compiled_extensions/row.py	[new file with mode: 0644]	patch \| blob