@@ -0,0 +1,226 @@ |
| 1 | +"""Unit tests for :class:`dlm_sway.serve.cache.BackendCache`. |
| 2 | + |
| 3 | +The cache is the daemon's heart: an LRU of warm differential backends |
| 4 | +keyed by the identity tuple over ``ModelSpec``. These tests exercise: |
| 5 | + |
| 6 | +* hit / miss / LRU eviction order |
| 7 | +* concurrent ``get_or_load`` for the same key only loads once |
| 8 | +* ``close()`` runs on eviction (and tolerates close failures) |
| 9 | +* ``cache_key_for`` is stable across spec field permutations that |
| 10 | + don't change identity |
| 11 | +""" |
| 12 | + |
| 13 | +from __future__ import annotations |
| 14 | + |
| 15 | +import threading |
| 16 | +import time |
| 17 | +from pathlib import Path |
| 18 | +from typing import Any |
| 19 | + |
| 20 | +import pytest |
| 21 | + |
| 22 | +from dlm_sway.core.model import ModelSpec |
| 23 | +from dlm_sway.serve.cache import BackendCache, CachedBackend, cache_key_for |
| 24 | + |
| 25 | + |
| 26 | +class _StubBackend: |
| 27 | + """Minimal stand-in implementing the loader contract. |
| 28 | + |
| 29 | + Tracks how many times :meth:`close` was called so eviction tests |
| 30 | + can assert the call happened. Doesn't need to satisfy the full |
| 31 | + ``DifferentialBackend`` Protocol — the cache only ever calls |
| 32 | + ``.close()`` on it, and tests look up ``.tag`` to identify entries. |
| 33 | + """ |
| 34 | + |
| 35 | + def __init__(self, tag: str) -> None: |
| 36 | + self.tag = tag |
| 37 | + self.close_count = 0 |
| 38 | + |
| 39 | + def close(self) -> None: |
| 40 | + self.close_count += 1 |
| 41 | + |
| 42 | + |
def _spec(base: str, *, adapter: Path | None = None) -> ModelSpec:
    """Build a dummy-kind ``ModelSpec`` for *base*, optionally with an adapter."""
    return ModelSpec(kind="dummy", base=base, adapter=adapter)
| 45 | + |
| 46 | + |
def _seed(cache: BackendCache, spec: ModelSpec, tag: str) -> _StubBackend:
    """Insert a stub backend under *spec*'s identity key and return it.

    Writes straight into the cache's internal dict (under its lock) so
    the build path is never triggered.  Touching ``_entries`` is fine in
    unit tests; production code goes through ``get_or_load``.
    """
    stub = _StubBackend(tag)
    identity = cache_key_for(spec)
    entry = CachedBackend(
        key=identity,
        backend=stub,  # type: ignore[arg-type]
        model_spec=spec,
        load_seconds=0.0,
    )
    with cache._lock:  # noqa: SLF001
        cache._entries[identity] = entry  # noqa: SLF001
    return stub
| 63 | + |
| 64 | + |
class TestCacheKey:
    """Identity-key behaviour of :func:`cache_key_for`."""

    def test_key_is_stable_across_equivalent_specs(self) -> None:
        first, second = _spec("modelA"), _spec("modelA")
        assert cache_key_for(first) == cache_key_for(second)

    def test_key_differs_on_base(self) -> None:
        key_a = cache_key_for(_spec("modelA"))
        key_b = cache_key_for(_spec("modelB"))
        assert key_a != key_b

    def test_key_differs_on_adapter(self, tmp_path: Path) -> None:
        adapter_dir = tmp_path / "ad"
        adapter_dir.mkdir()
        keyed_with = cache_key_for(_spec("modelA", adapter=adapter_dir))
        keyed_without = cache_key_for(_spec("modelA"))
        assert keyed_with != keyed_without

    def test_key_ignores_trust_remote_code(self) -> None:
        """Two specs differing only in non-identity fields hash equal."""
        plain = ModelSpec(base="modelA", kind="dummy")
        trust = ModelSpec(base="modelA", kind="dummy", trust_remote_code=True)
        assert cache_key_for(plain) == cache_key_for(trust)
| 86 | + |
| 87 | + |
class TestCacheLRU:
    """LRU ordering, eviction, and ``close()`` semantics of the cache."""

    def test_max_size_validation(self) -> None:
        with pytest.raises(ValueError, match="max_size must be >= 1"):
            BackendCache(max_size=0)

    def test_hit_promotes_to_mru(self) -> None:
        cache = BackendCache(max_size=2)
        spec_first, spec_second = _spec("A"), _spec("B")
        stub_first = _seed(cache, spec_first, "A")
        _seed(cache, spec_second, "B")

        # A hit via get_or_load must move the entry to the MRU end.
        hit = cache.get_or_load(spec_first)
        assert hit.backend is stub_first

        order = cache.loaded_keys()
        assert order[0] == cache_key_for(spec_second)
        assert order[-1] == cache_key_for(spec_first)

    def test_eviction_closes_lru_backend(self) -> None:
        """With cap=2 and two warm entries, loading a third must close the LRU."""
        import dlm_sway.serve.cache as cache_mod

        cache = BackendCache(max_size=2)
        spec_a, spec_b = _spec("A"), _spec("B")
        lru_backend = _seed(cache, spec_a, "A")
        _seed(cache, spec_b, "B")

        # Stub the builder so no real backend is constructed.
        newcomer = _StubBackend("C")

        def _stub_build_entry(spec: ModelSpec, *, key: Any, adapter_path: Any) -> CachedBackend:
            del adapter_path  # unused by the stub
            return CachedBackend(
                key=key,
                backend=newcomer,  # type: ignore[arg-type]
                model_spec=spec,
                load_seconds=0.0,
            )

        saved = cache_mod._build_entry  # noqa: SLF001
        cache_mod._build_entry = _stub_build_entry  # type: ignore[assignment]
        try:
            cache.get_or_load(_spec("C"))
        finally:
            cache_mod._build_entry = saved  # type: ignore[assignment]

        assert lru_backend.close_count == 1, "LRU eviction should call close()"
        remaining = cache.loaded_keys()
        assert cache_key_for(spec_a) not in remaining
        assert cache_key_for(spec_b) in remaining
        assert cache_key_for(_spec("C")) in remaining

    def test_evict_all_closes_every_backend(self) -> None:
        cache = BackendCache(max_size=3)
        stubs = [_seed(cache, _spec(f"M{i}"), f"M{i}") for i in range(3)]
        cache.evict_all()
        assert cache.loaded_keys() == []
        assert all(stub.close_count == 1 for stub in stubs)

    def test_close_failure_is_swallowed(self, caplog: pytest.LogCaptureFixture) -> None:
        """A backend whose close() raises should not crash the daemon."""
        cache = BackendCache(max_size=1)
        stub = _seed(cache, _spec("boom"), "boom")

        def _boom() -> None:
            raise RuntimeError("close failed")

        stub.close = _boom  # type: ignore[method-assign]

        with caplog.at_level("WARNING"):
            cache.evict_all()

        # The failure is logged as a warning, never propagated.
        assert any("close raised" in record.message for record in caplog.records)
        assert cache.loaded_keys() == []
| 174 | + |
| 175 | + |
class TestSingleFlight:
    def test_concurrent_get_or_load_loads_once(self) -> None:
        """Concurrent requests for the same spec must build exactly once.

        Four threads race on a cold cache while ``_build_entry`` is
        patched with a slow, counting builder.  Single-flight semantics
        require exactly one build, with every caller receiving the same
        backend instance.
        """
        import dlm_sway.serve.cache as cache_mod

        cache = BackendCache(max_size=2)

        build_count = 0
        build_lock = threading.Lock()
        backend = _StubBackend("solo")

        def _slow_build_entry(spec: ModelSpec, *, key: Any, adapter_path: Any) -> CachedBackend:
            nonlocal build_count
            with build_lock:
                build_count += 1
            # Sleep OUTSIDE the counter lock: holding the lock here would
            # serialize racing builds, narrowing the very window this
            # delay exists to widen for threads to observe a miss.
            time.sleep(0.05)
            return CachedBackend(
                key=key,
                backend=backend,  # type: ignore[arg-type]
                model_spec=spec,
                load_seconds=0.0,
            )

        spec = _spec("solo")
        results: list[CachedBackend] = []
        errs: list[BaseException] = []

        def _worker() -> None:
            try:
                results.append(cache.get_or_load(spec))
            except BaseException as exc:  # noqa: BLE001
                errs.append(exc)

        # Patch immediately before the try so the restore in finally is
        # guaranteed to run — previously setup code sat between the two.
        original = cache_mod._build_entry  # noqa: SLF001
        cache_mod._build_entry = _slow_build_entry  # type: ignore[assignment]
        try:
            threads = [threading.Thread(target=_worker) for _ in range(4)]
            for t in threads:
                t.start()
            for t in threads:
                t.join(timeout=5.0)
        finally:
            cache_mod._build_entry = original  # type: ignore[assignment]

        # Guard against deadlock: join() with a timeout returns silently,
        # so a hung worker would otherwise let the remaining assertions
        # pass on partial results.
        assert all(not t.is_alive() for t in threads), "worker thread(s) hung"
        assert errs == []
        assert build_count == 1, f"single-flight broken: built {build_count} times"
        assert len(results) == 4, "every worker must produce a result"
        assert all(r.backend is backend for r in results)