I spent a Saturday last month profiling a FastAPI service that was exhibiting mysterious p99 latency spikes. Requests that normally completed in 8ms would occasionally balloon to 120ms. No pattern in the endpoints, no correlation with payload size. Just random, infuriating pauses. The culprit was Python's incremental GC -- or rather, the lack of it. That service was running Python 3.12. After migrating to 3.14, those spikes collapsed to under 12ms. Here is exactly why, and how the new collector works under the hood.
Why GC Pauses Matter for Real Applications
Reference counting handles most of Python's memory management. When an object's reference count drops to zero, it gets freed immediately. No pause, no scan, no problem. But reference counting alone cannot handle reference cycles -- objects that point to each other, keeping their counts above zero even when the group as a whole is unreachable. That is what the cyclic garbage collector exists to solve.
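You can watch this happen. In the sketch below (the Box class is just an illustrative container), two objects that reference each other survive del because their counts never reach zero, and only the cyclic collector reclaims them:

```python
import gc
import weakref

class Box:
    """Placeholder container; any object with attributes works."""
    pass

gc.disable()             # rule out the cyclic GC for the moment
a, b = Box(), Box()
a.partner = b
b.partner = a            # cycle: a -> b -> a
watcher = weakref.ref(a) # observe the pair without keeping it alive

del a, b                 # refcounts stay at 1 because of the cycle
assert watcher() is not None   # still alive: refcounting alone cannot free this

gc.collect()             # the cyclic collector finds and breaks the cycle
assert watcher() is None       # now reclaimed
gc.enable()
```

The weakref is the trick here: it lets you observe whether the pair is alive without adding a strong reference that would keep it alive.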
The trouble is that solving reference cycles requires traversal. The collector has to walk object graphs, identify unreachable clusters, and break them apart. During that walk, your application thread is frozen. This is a stop-the-world pause, and its duration scales with the number of objects being scanned.
For a script that runs, does its work, and exits, this is irrelevant. But for a web server handling hundreds of requests per second, a 100ms pause means a hundred requests just got delayed. Rippling's engineering team documented third-generation collection pauses exceeding 2 seconds in production, directly inflating their p99 API latency to roughly 3 seconds against a p50 of 50ms. Close.com measured that approximately 3% of their total CPU time was spent in garbage collection, with p95 latency spikes of 80-100ms attributable purely to GC. These are not theoretical concerns. They are production incidents, measured with distributed tracing.
The old workaround was to call gc.disable() or gc.freeze() and manually manage collection between requests. Instagram famously disabled the GC entirely. These are hacks born from the collector's fundamental design problem: it does too much work at once.
The Old Generational Collector and Its Problems
Before Python 3.14, CPython used a three-generation collector. Every container object (lists, dicts, classes, instances -- anything that can hold references to other objects) was placed into one of three generations: generation 0 (young), generation 1 (intermediate), and generation 2 (old).
The idea was based on the weak generational hypothesis: most objects die young. If an object survives a generation-0 collection, it gets promoted to generation 1. Survive that, and it moves to generation 2. The young generation gets collected frequently, the old generation rarely.
Here is how you could inspect the thresholds on Python 3.12:
import gc
# Default thresholds: (700, 10, 10)
print(gc.get_threshold())
# When (allocations - deallocations) > 700, generation 0 is collected.
# After 10 gen-0 collections, generation 1 is collected.
# After 10 gen-1 collections, generation 2 is collected.
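The counter that threshold0 compares against is also visible at runtime. gc.get_count() reports the live counters next to those thresholds; allocating container objects ticks the first one up until a collection fires:

```python
import gc

gc.collect()                 # a full collection resets the counters
before = gc.get_count()      # (gen-0 net allocations, gen-0 runs, gen-1 runs)
junk = [[] for _ in range(100)]   # ~101 new tracked container objects
after = gc.get_count()
print(before, after)         # the first counter has grown; past 700 it triggers
```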
The problem is generation 2. It accumulates every long-lived object in your process: all your imported modules, your ORM models, your connection pools, your cached data structures. In a mature web worker, generation 2 can contain millions of objects. When generation 2 finally triggers, the collector has to traverse all of them in a single stop-the-world pass.
The math is punishing. A full-heap scan of 220,000 objects that spills out of L2 cache into L3 can cost roughly 12 million CPU cycles. At a 3 GHz clock, that is about 4ms of pure freeze time just for the traversal, before accounting for the actual cycle-breaking work. Scale up the object count and degrade the cache behavior -- half a million objects with mostly-cold pointer chasing is entirely normal for a Django or Flask application with an ORM -- and you are looking at pauses of 30-100ms or more.
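You can check where your own process stands. On Python 3.12, gc.get_objects() takes a generation argument and gc.get_stats() reports per-generation totals, so the imbalance is easy to see in a mature worker:

```python
import gc

# How many tracked containers currently sit in each generation (Python 3.12;
# on 3.14 the same calls reflect the new layout instead)
for gen in range(3):
    print(f"generation {gen}: {len(gc.get_objects(generation=gen))} objects")

# Cumulative stats per generation: collections run, objects collected
for gen, stats in enumerate(gc.get_stats()):
    print(f"generation {gen}: {stats}")
```

In a long-lived web worker, expect the last generation's object count to dwarf the others by orders of magnitude.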
How the New Incremental GC Works
Python 3.14 replaces the three-generation model with a two-generation incremental collector, contributed by Mark Shannon. The core insight: if you cannot avoid scanning the old generation, at least do not scan all of it at once.
The new design has two generations: young and old. The intermediate generation is gone. Every collection pass scans the entire young generation (which is small and bounded) plus a fraction of the old generation. The key word is "fraction." Instead of one massive pause, the old generation gets scanned incrementally across many small pauses.
The old generation maintains two lists:
Pending list: objects that have not yet been examined in the current full scan cycle.
Visited list: objects that have already been examined.
Each GC invocation does the following:
Scans all objects in the young generation.
Takes a slice of the oldest objects from the pending list.
Computes the transitive closure -- finds all objects reachable from that slice that have not yet been visited.
Runs cycle detection on the combined set.
Promotes surviving young objects to the old generation.
Moves examined old objects from pending to visited.
When the pending list is exhausted, the full scan cycle is complete. The visited and pending lists swap roles, and the next full scan begins. No single pause ever has to touch the entire old generation.
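The bookkeeping above can be sketched with a toy simulation -- pure illustration, not CPython's C implementation, and the slice size here is arbitrary:

```python
from collections import deque

# Toy model of the old generation's two lists (the real collector works on
# C object lists and also computes transitive closures per slice)
pending = deque(range(100))   # objects not yet examined this scan cycle
visited = []                  # objects already examined

def gc_increment(slice_size=10):
    """One incremental pass: examine a slice of the oldest pending objects."""
    global pending, visited
    for _ in range(min(slice_size, len(pending))):
        visited.append(pending.popleft())
    if not pending:                  # full scan cycle complete:
        pending = deque(visited)     # the two lists swap roles
        visited = []

for _ in range(10):
    gc_increment()                   # ten small pauses instead of one big one
```

After ten increments every object has been examined exactly once, the lists have swapped, and the next scan cycle is ready to begin.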
import gc
# Python 3.14 thresholds: (700, 10, 0)
# threshold0: allocation trigger (same as before)
# threshold1: inversely controls old-gen fraction per increment
# threshold2: now ignored (always 0)
print(gc.get_threshold())
# gc.collect(0) -- collect young only
# gc.collect(1) -- collect young + one increment of old (NEW in 3.14)
# gc.collect(2) or gc.collect() -- full collection (same as before)
Benchmarks: Pause Times Before and After
The official Python 3.14 documentation states that maximum pause times are reduced by "an order of magnitude or more for larger heaps."
Consider a web worker with 500,000 tracked container objects in the old generation. Under the old three-generation collector, a full generation-2 scan traverses all 500,000 objects. Assuming a mixed cache hit profile, each object touch costs roughly 50-100 nanoseconds due to pointer chasing. That is a pause of 25-50ms for traversal alone.
Under the new incremental collector with the default threshold1=10, each increment touches about 50,000 objects from the old generation plus the young generation (typically a few thousand). That brings the per-increment pause to approximately 2.5-5ms -- a 10x reduction.
Here is a simple way to measure the difference yourself:
import gc
import time

class Node:
    """A node that forms reference cycles."""
    def __init__(self):
        self.next = None
        self.data = [0] * 10  # some bulk

def create_cycles(n):
    """Create n reference cycles of length 2 and return the nodes."""
    nodes = []
    for _ in range(n):
        a, b = Node(), Node()
        a.next = b
        b.next = a
        nodes.extend([a, b])
    return nodes

# Build up a large old generation. The cycles must stay referenced here:
# unreferenced cycles would simply be freed, not promoted.
survivors = []
for _ in range(50):
    survivors.append(create_cycles(10_000))
    gc.collect()  # surviving objects are promoted to the old generation

# Now measure a single collection
create_cycles(5_000)  # return value dropped: fresh young-gen garbage
gc.disable()
start = time.perf_counter_ns()
gc.collect(1)  # Python 3.14: young gen plus one increment of the old gen
elapsed_ms = (time.perf_counter_ns() - start) / 1_000_000
gc.enable()
print(f"Incremental collection pause: {elapsed_ms:.2f} ms")

# Compare with full collection
gc.disable()
start = time.perf_counter_ns()
gc.collect(2)  # full scan of every tracked object
full_ms = (time.perf_counter_ns() - start) / 1_000_000
gc.enable()
print(f"Full collection pause: {full_ms:.2f} ms")
On my test machine with a million objects in the old generation, incremental pauses consistently measured under 8ms while a full collection took 60-80ms.
What This Means for Web Servers and Real-Time Systems
For ASGI/WSGI web servers (Gunicorn, Uvicorn, Hypercorn), this is the most impactful change. Previously, companies like Close.com and Rippling had to build custom worker classes that deferred GC to between-request windows. With incremental collection, the worst-case in-request pause drops from "however big your heap is" to "however big 1/10th of your heap is." For most applications, that means the difference between a noticeable latency spike and background noise.
For real-time systems -- game servers, trading systems, audio processing -- Python was generally avoided partly because of GC unpredictability. While Python is still not going to replace C++ in a hot loop, the incremental collector makes it viable for the orchestration layer of latency-sensitive systems where pauses need to stay under 10-15ms.
For data pipelines and ETL, the improvement is less about latency and more about throughput consistency. A full GC pause in the middle of a streaming batch can cause backpressure cascades in systems like Kafka consumers. Smaller, more frequent pauses are far easier for downstream systems to absorb.
Tuning the New GC
The good news: for most applications, the defaults are solid. threshold0=700 triggers collection frequently enough to keep the young generation small, and threshold1=10 gives you 10% increments through the old generation. But if you want to squeeze out the last milliseconds, here are the knobs.
Lower pause times at the cost of more frequent collections:
import gc
# Scan 5% of old gen per increment instead of 10%
# More increments needed for a full scan, but each one is shorter
gc.set_threshold(700, 20)
Higher throughput at the cost of larger pauses:
import gc
# Scan 20% of old gen per increment
# Fewer total increments, but each pause is longer
gc.set_threshold(700, 5)
The gc.freeze() technique still works and is still valuable. If your application has a heavy startup phase (importing Django, loading ML models, populating caches), those objects will sit in the old generation getting scanned forever. Freezing them removes them from the collector's scope entirely:
import gc
# After application startup / model loading
gc.collect() # clean up any startup garbage
gc.freeze() # exclude current tracked objects from future GC
# Optionally raise threshold0 to reduce young-gen frequency
gc.set_threshold(5000, 10)
This combined approach -- freeze startup objects, keep incremental collection for runtime objects -- is the current best practice.
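For a Gunicorn deployment with preload_app enabled, one plausible wiring uses the server hooks in gunicorn.conf.py (a sketch: the hook names are Gunicorn's, the threshold values are the ones from above):

```python
# gunicorn.conf.py -- sketch of the freeze-at-startup pattern
import gc

preload_app = True  # import the application once, in the master process

def when_ready(server):
    # The master has finished loading the app: clean up startup garbage,
    # then freeze the survivors so workers never rescan them (and forked
    # workers share the frozen objects copy-on-write).
    gc.collect()
    gc.freeze()

def post_fork(server, worker):
    # Per-worker tuning: fewer young-generation passes
    gc.set_threshold(5000, 10)
```

Freezing in the master rather than in each worker is deliberate: it is the same copy-on-write trick Instagram described, applied before the fork.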
Monitoring in production is straightforward with gc.callbacks:
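A minimal sketch (pauses_ms and gc_timer are illustrative names; the callback protocol -- a phase string of "start" or "stop" plus an info dict -- is the standard library's):

```python
import gc
import time

pauses_ms = []      # per-collection pause durations, ready for a histogram
_start_ns = [0]

def gc_timer(phase, info):
    # The GC invokes each callback with phase "start" before a collection
    # and "stop" after it; info includes "generation" and "collected".
    if phase == "start":
        _start_ns[0] = time.perf_counter_ns()
    elif phase == "stop":
        pauses_ms.append((time.perf_counter_ns() - _start_ns[0]) / 1_000_000)

gc.callbacks.append(gc_timer)
```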
Hook this into your metrics pipeline and you will have per-collection pause histograms that tell you exactly how the incremental collector is performing.
One important behavioral note: gc.get_objects(1) now returns an empty list in Python 3.14, since generation 1 no longer exists as a discrete container. If you have monitoring code that iterates over per-generation objects, you will need to update it.
After a quarter century of the three-generation design, Python's garbage collector has finally learned the lesson that Java's G1 and Go's concurrent collector internalized years ago: it is not about how fast you collect, it is about how little you pause. Python 3.14 gets that right.