The GC for the free threaded build would get slower with each collection due
to effectively double counting objects freed by the GC.
--- /dev/null
+Fix quadratically increasing garbage collection delays in free-threaded
+build.
gc->alloc_count--;
if (gc->alloc_count <= -LOCAL_ALLOC_COUNT_THRESHOLD) {
GCState *gcstate = &tstate->interp->gc;
- _Py_atomic_add_int(&gcstate->young.count, (int)gc->alloc_count);
+ int count = _Py_atomic_load_int_relaxed(&gcstate->young.count);
+ int new_count;
+ do {
+ if (count == 0) {
+ break;
+ }
+ new_count = count + (int)gc->alloc_count;
+ if (new_count < 0) {
+ new_count = 0;
+ }
+ } while (!_Py_atomic_compare_exchange_int(&gcstate->young.count,
+ &count,
+ new_count));
gc->alloc_count = 0;
}
}