tenseleyflow/documentlanguagemodel / fd7e9a0

Raise all coverage gates to 100%

* Cover store edge branches

* Cover hardware edge branches

* Cover CLI reporter branches

* Cover eval edge branches

* Cover export helper branches

* Cover export target helper branches

* Cover export runner branches

* Cover export helper modules

* Cover multimodal export branches

* Finish export coverage sweep

* Cover mlx backend staging refusal

* Cover replay decode edge cases

* Cover preference phase plumbing

* Finish doc and registry edge coverage

* Cover data helper edge branches

* Finish data resample coverage

* Cover train cache toggles

* Cover tokenization coercion edges

* Finish checkpoint commit coverage

* Cover RPC validation edges

* Finish state sidecar coverage

* Finish train helper coverage sweep

* Finish trainer helper coverage

* Finish metrics coverage sweep

* Finish directives coverage sweep

* Cover synth apply and pending

* Finish synth prompt and filter coverage

* Finish synth run coverage

* Cover synth teacher helpers

* Cover synth teacher runtime helpers

* Finish synth teacher coverage

* Retry transient empty lockfiles

* Skip peer roundtrip when bind denied

* Cover preference pending helpers

* Finish preference judge coverage

* Finish preference mine coverage

* Cover modality wrapper modules

* Cover repl and watch helpers

* Cover scaffold and template edges

* Cover app and harvest helpers

* Finish share helper coverage

* Cover share pull orchestrator

* Cover share push orchestrator

* Cover peer token edge cases

* Cover peer runtime flow

* Cover control apply edge branches

* Cover init helper edge cases

* Cover train validation edge cases

* Cover train watch edge cases

* Cover prompt edge cases

* Cover GPU resolve failure

* Cover export edge paths

* Cover export runtime targets

* Cover export run errors

* Cover audio probe generic processor load failure

* Raise coverage gates from 95% to 100%

* Fix import sort order in test_state_sidecar and test_tokenization

* Apply ruff format to 16 test files

* Cover vllm platform helpers on all OS targets

---------

Co-authored-by: mfwolffe <wolffemf@dukes.jmu.edu>
Authored by espadonne
Committed by GitHub
SHA: fd7e9a0261360741d0d6496010c1727f55375496
Parents: 20cfe6f
Tree: 874199c

121 changed files

Status  File  +  -
M .github/workflows/ci.yml 32 32
M scripts/coverage-gates.sh 1 1
M src/dlm/eval/probes.py 0 1
M src/dlm/store/lock.py 8 3
M src/dlm/synth/run.py 0 2
M src/dlm/train/cpt/schedule.py 0 2
M tests/integration/share/test_peer_roundtrip.py 10 3
M tests/unit/base_models/test_probes.py 16 0
A tests/unit/cli/test_app_core.py 91 0
A tests/unit/cli/test_export_edge_paths.py 258 0
A tests/unit/cli/test_export_run_errors.py 191 0
A tests/unit/cli/test_export_target_runtime_paths.py 352 0
A tests/unit/cli/test_init_edges.py 157 0
A tests/unit/cli/test_prompt_edges.py 291 0
M tests/unit/cli/test_reporter.py 27 1
M tests/unit/cli/test_scaffold.py 16 0
M tests/unit/cli/test_train_prompt_repl_coverage.py 10 0
A tests/unit/cli/test_train_validation_edges.py 217 0
A tests/unit/cli/test_train_watch_edges.py 260 0
M tests/unit/control/test_apply.py 34 0
M tests/unit/data/test_audio_cache.py 30 0
M tests/unit/data/test_audio_resample.py 68 22
M tests/unit/data/test_dataset_builder.py 17 0
M tests/unit/data/test_sections_to_rows.py 14 0
M tests/unit/data/test_vl_cache.py 30 0
M tests/unit/data/test_weighted_rows.py 28 0
M tests/unit/directives/test_cache.py 182 0
M tests/unit/directives/test_cache_key.py 14 1
M tests/unit/directives/test_discovery.py 37 0
M tests/unit/directives/test_expand.py 64 0
M tests/unit/directives/test_ignore_parser.py 7 0
M tests/unit/directives/test_merge.py 23 0
M tests/unit/doc/test_parser_roundtrip.py 29 0
M tests/unit/doc/test_serializer_edges.py 12 0
M tests/unit/eval/test_mode_split.py 37 1
M tests/unit/eval/test_probes.py 33 1
M tests/unit/export/ollama/test_modelfile.py 5 0
M tests/unit/export/targets/test_llama_server_argv.py 128 1
M tests/unit/export/targets/test_mlx_serve_argv.py 95 0
M tests/unit/export/targets/test_vllm_argv.py 47 0
M tests/unit/export/test_arch_probe.py 17 0
M tests/unit/export/test_audio_snapshot.py 81 0
M tests/unit/export/test_draft_registry.py 14 0
M tests/unit/export/test_embedding_sync.py 34 0
M tests/unit/export/test_gate_fallback_resolve.py 50 1
A tests/unit/export/test_gguf_io.py 33 0
M tests/unit/export/test_gguf_tensors.py 63 0
M tests/unit/export/test_imatrix.py 99 0
A tests/unit/export/test_merge.py 21 0
M tests/unit/export/test_precision_safety.py 4 0
M tests/unit/export/test_preflight.py 45 0
M tests/unit/export/test_runner.py 274 0
M tests/unit/export/test_smoke.py 21 0
M tests/unit/export/test_vendoring.py 31 0
M tests/unit/export/test_vl_gguf.py 113 1
M tests/unit/export/test_vl_snapshot.py 77 0
M tests/unit/hardware/test_capabilities.py 57 1
M tests/unit/hardware/test_plan.py 52 1
M tests/unit/harvest/test_sway_reader.py 12 0
M tests/unit/inference/test_mlx_backend.py 20 1
M tests/unit/lock/test_mismatch_policy.py 7 0
M tests/unit/metrics/test_queries.py 217 1
M tests/unit/metrics/test_recorder.py 54 2
A tests/unit/metrics/test_sinks.py 168 0
A tests/unit/modality/test_dispatch_modules.py 136 0
A tests/unit/modality/test_vl_contract.py 72 0
M tests/unit/preference/test_cli_judge.py 66 0
M tests/unit/preference/test_hf_reward_judge.py 225 2
M tests/unit/preference/test_mine_dedup.py 69 0
A tests/unit/preference/test_pending.py 199 0
A tests/unit/preference/test_sway_bridge.py 262 0
A tests/unit/repl/test_app_helpers.py 10 0
M tests/unit/repl/test_commands.py 6 1
A tests/unit/repl/test_streaming.py 64 0
M tests/unit/replay/test_corpus.py 15 0
M tests/unit/replay/test_sampler.py 26 1
M tests/unit/share/test_hf_sink.py 21 0
A tests/unit/share/test_peer_runtime.py 388 0
M tests/unit/share/test_peer_tokens.py 41 0
M tests/unit/share/test_provenance.py 63 0
A tests/unit/share/test_pull.py 393 0
A tests/unit/share/test_push.py 435 0
M tests/unit/share/test_signing.py 140 0
M tests/unit/share/test_url_sink.py 81 0
M tests/unit/store/test_blobs.py 26 0
M tests/unit/store/test_inspect.py 56 1
M tests/unit/store/test_lock.py 47 2
M tests/unit/store/test_paths.py 36 1
A tests/unit/synth/test_apply_pending.py 337 0
M tests/unit/synth/test_filter.py 48 0
M tests/unit/synth/test_prompts.py 19 5
M tests/unit/synth/test_run_dry_run.py 118 2
M tests/unit/synth/test_teachers.py 871 22
M tests/unit/templates/test_init.py 28 0
M tests/unit/templates/test_registry.py 16 0
M tests/unit/test_io_atomic.py 39 0
A tests/unit/test_main.py 15 0
A tests/unit/test_package_init.py 24 0
M tests/unit/train/cpt/test_embed_warmup.py 16 0
M tests/unit/train/distributed/test_gpus.py 12 0
M tests/unit/train/distributed/test_rank_env.py 4 0
M tests/unit/train/distributed/test_rank_io.py 5 0
M tests/unit/train/gate/test_module.py 23 0
M tests/unit/train/gate/test_orchestrator.py 16 0
M tests/unit/train/gate/test_trainer.py 18 0
M tests/unit/train/multi_adapter/test_orchestrator.py 66 0
M tests/unit/train/preference/test_dpo_phase.py 30 0
M tests/unit/train/preference/test_orpo_phase.py 30 0
M tests/unit/train/preference/test_phase_orchestrator.py 28 0
A tests/unit/train/test_cache.py 38 0
M tests/unit/train/test_checkpoint_commit.py 82 0
M tests/unit/train/test_inject.py 4 0
M tests/unit/train/test_integrity.py 3 0
M tests/unit/train/test_logger.py 18 0
M tests/unit/train/test_rpc.py 108 0
M tests/unit/train/test_state_sidecar.py 67 0
M tests/unit/train/test_tokenization.py 18 0
M tests/unit/train/test_trainer_helpers.py 300 9
M tests/unit/watch/test_debounce.py 7 0
M tests/unit/watch/test_watcher_filter.py 31 0
A tests/unit/watch/test_watcher_loop.py 55 0
.github/workflows/ci.yml (modified, 165 lines changed)

@@ -63,133 +63,133 @@ jobs:
       - name: Pytest (unit + integration, non-slow)
        run: uv run pytest

-      - name: Coverage gate — src/dlm/doc ≥ 95% (audit 02 M4)
+      - name: Coverage gate — src/dlm/doc = 100% (audit 02 M4)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/doc \
            --cov=src/dlm/doc \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/store ≥ 95% (Sprint 04)
+      - name: Coverage gate — src/dlm/store = 100% (Sprint 04)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/store \
            --cov=src/dlm/store \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/hardware ≥ 95% (Sprint 05)
+      - name: Coverage gate — src/dlm/hardware = 100% (Sprint 05)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/hardware \
            --cov=src/dlm/hardware \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/base_models ≥ 95% (Sprint 06)
+      - name: Coverage gate — src/dlm/base_models = 100% (Sprint 06)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/base_models \
            --cov=src/dlm/base_models \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/data ≥ 95% (Sprint 07)
+      - name: Coverage gate — src/dlm/data = 100% (Sprint 07)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/data \
            --cov=src/dlm/data \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/replay ≥ 95% (Sprint 08)
+      - name: Coverage gate — src/dlm/replay = 100% (Sprint 08)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/replay \
            --cov=src/dlm/replay \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/train ≥ 95% (Sprint 09)
+      - name: Coverage gate — src/dlm/train = 100% (Sprint 09)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/train \
            --cov=src/dlm/train \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/train/preference ≥ 95%
+      - name: Coverage gate — src/dlm/train/preference = 100%
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/train/preference \
            --cov=src/dlm/train/preference \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/eval ≥ 95% (Sprint 10)
+      - name: Coverage gate — src/dlm/eval = 100% (Sprint 10)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/eval \
            --cov=src/dlm/eval \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/inference ≥ 95% (Sprint 10)
+      - name: Coverage gate — src/dlm/inference = 100% (Sprint 10)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/inference \
            --cov=src/dlm/inference \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/export ≥ 95% (Sprint 11)
+      - name: Coverage gate — src/dlm/export = 100% (Sprint 11)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/export \
            --cov=src/dlm/export \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/export/ollama ≥ 95% (Sprint 12)
+      - name: Coverage gate — src/dlm/export/ollama = 100% (Sprint 12)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/export/ollama \
            --cov=src/dlm/export/ollama \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/cli/reporter ≥ 95% (Sprint 13)
+      - name: Coverage gate — src/dlm/cli/reporter = 100% (Sprint 13)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/cli \
            --cov=dlm.cli.reporter \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/io/ulid ≥ 95% (Sprint 13)
+      - name: Coverage gate — src/dlm/io/ulid = 100% (Sprint 13)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/test_io_ulid.py \
            --cov=dlm.io.ulid \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/pack ≥ 95% (Sprint 14)
+      - name: Coverage gate — src/dlm/pack = 100% (Sprint 14)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/pack tests/integration/pack \
            --cov=src/dlm/pack \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

-      - name: Coverage gate — src/dlm/lock ≥ 95% (Sprint 15)
+      - name: Coverage gate — src/dlm/lock = 100% (Sprint 15)
        if: matrix.os == 'ubuntu-latest'
        run: |
          uv run pytest tests/unit/lock \
            --cov=src/dlm/lock \
            --cov-report=term-missing \
-            --cov-fail-under=95
+            --cov-fail-under=100

   no-network-sandbox:
     # audit F13: dlm init / doctor / show must work with zero outbound network.
scripts/coverage-gates.sh (modified, 8 lines changed)

@@ -93,7 +93,7 @@ for gate in "${gates[@]}"; do
        "${tests_arr[@]}" \
        --cov="$cov" \
        --cov-report=term-missing \
-        --cov-fail-under=95 \
+        --cov-fail-under=100 \
        -q
    echo
 done
src/dlm/eval/probes.py (modified, 7 lines changed)

@@ -120,7 +120,6 @@ def _normalize_probe_markers(body: str) -> str:
             # Find the first non-blank body line and prefix it.
             i += 1
             while i < len(lines) and lines[i].strip() == "":
-                rewritten.append(lines[i])
                 i += 1
             if i < len(lines):
                 rewritten.append(f"{_PROBE_MARKER}:{lines[i]}")
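The hunk's effect is that blank lines between a probe header and its body are now dropped rather than copied through, so the marker lands on the first non-blank body line with no gap. A minimal sketch of that behavior (the `## probe` header predicate and the `_PROBE_MARKER` value are hypothetical; only the blank-skipping loop and the marker-prefix line appear in the diff):

```python
_PROBE_MARKER = "PROBE"  # assumed value; the real constant is not shown in the diff


def normalize_probe_markers(lines):
    """Prefix the first non-blank line after a probe header with the marker."""
    rewritten = []
    i = 0
    while i < len(lines):
        if lines[i].startswith("## probe"):  # hypothetical header predicate
            rewritten.append(lines[i])
            i += 1
            # Blanks are skipped without being re-appended (the fixed branch).
            while i < len(lines) and lines[i].strip() == "":
                i += 1
            if i < len(lines):
                rewritten.append(f"{_PROBE_MARKER}:{lines[i]}")
                i += 1
        else:
            rewritten.append(lines[i])
            i += 1
    return rewritten
```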
src/dlm/store/lock.py (modified, 17 lines changed)

@@ -179,9 +179,14 @@ def exclusive(

         existing = _read_lock(lock_path)
         if existing is None:
-            # Malformed lockfile, or a race between stat and read.
-            # Treat as stale to avoid infinite contention.
-            raise StaleLockError(lock_path, holder_pid=None)
+            # Malformed lockfile, or a race between create and payload
+            # write. If we still have timeout budget left, treat this as
+            # transient and retry; callers with timeout=0 still get the
+            # old immediate stale-lock signal.
+            if deadline is None or time.monotonic() >= deadline:
+                raise StaleLockError(lock_path, holder_pid=None)
+            time.sleep(poll_interval)
+            continue

         if not _is_alive(existing.pid):
             raise StaleLockError(lock_path, holder_pid=existing.pid)
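The retry semantics introduced above can be illustrated with a self-contained sketch (the helper name `read_with_retry` and its signature are hypothetical; only `StaleLockError`, `deadline`, and `poll_interval` come from the diff). With no deadline the unreadable lockfile is reported stale immediately, mirroring the `timeout=0` path; with budget left, empty reads are retried:

```python
import time


class StaleLockError(RuntimeError):
    """Stand-in for the store's stale-lock error."""


def read_with_retry(read_lock, deadline, poll_interval=0.01):
    # deadline=None models timeout=0: an unreadable lockfile raises
    # immediately. With a future deadline, empty reads are treated as
    # transient and polled until the budget runs out.
    while True:
        existing = read_lock()
        if existing is not None:
            return existing
        if deadline is None or time.monotonic() >= deadline:
            raise StaleLockError("lockfile unreadable")
        time.sleep(poll_interval)
```

This shape also explains why the original behavior caused flaky contention: a writer that had created the lockfile but not yet flushed its payload was indistinguishable from a stale lock.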
src/dlm/synth/run.py (modified, 8 lines changed)

@@ -119,8 +119,6 @@ def build_synth_plan(
         for concrete_strategy, count in _strategy_counts(strategy, per_section):
             if count == 0:
                 continue
-            if max_pairs is not None and len(additions) >= max_pairs:
-                return SynthRunPlan(additions=tuple(additions), skipped=tuple(skipped))

             template = get_prompt_template(concrete_strategy)
             rendered = teacher.generate(
src/dlm/train/cpt/schedule.py (modified, 8 lines changed)

@@ -57,8 +57,6 @@ def cosine_with_floor_lr(
         raise ValueError(f"step must be non-negative, got {step}")

     if step < warmup_steps:
-        if warmup_steps == 0:
-            return 1.0
         return step / warmup_steps

     if step >= total_steps:
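The deleted guard was dead code: `step` is validated non-negative, so `step < warmup_steps` can never be true when `warmup_steps == 0`. A self-contained sketch of the schedule shape (the floor value and the cosine-decay branch below the hunk are assumptions; only the validation and warmup lines appear in the diff):

```python
import math


def cosine_with_floor_lr(step, *, warmup_steps, total_steps, floor=0.1):
    """Linear warmup, then cosine decay toward a floor multiplier."""
    if step < 0:
        raise ValueError(f"step must be non-negative, got {step}")
    if step < warmup_steps:
        # Unreachable when warmup_steps == 0 (step is non-negative),
        # which is why the dead `warmup_steps == 0` guard was removed.
        return step / warmup_steps
    if step >= total_steps:
        return floor
    # Assumed decay form: cosine from 1.0 down to the floor.
    progress = (step - warmup_steps) / (total_steps - warmup_steps)
    return floor + (1.0 - floor) * 0.5 * (1.0 + math.cos(math.pi * progress))
```

With `warmup_steps=0` the first returned multiplier is the cosine branch at `progress=0`, i.e. exactly 1.0, so removing the special case does not change behavior.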
tests/integration/share/test_peer_roundtrip.py (modified, 32 lines changed)

@@ -21,8 +21,12 @@ from pathlib import Path

 import pytest

+from dlm.share import ServeHandle

-def _start_server_in_thread(tmp_path: Path, *, ttl: int = 600):
+
+def _start_server_in_thread(
+    tmp_path: Path, *, ttl: int = 600
+) -> tuple[ServeHandle, threading.Thread, bytes]:
     """Helper: pack a trivial file + start the peer server in a thread.

     Returns `(handle, thread, pack_bytes)`. Caller stops via
@@ -36,7 +40,10 @@ def _start_server_in_thread(tmp_path: Path, *, ttl: int = 600):
     pack.write_bytes(pack_bytes)

     opts = ServeOptions(port=0, token_ttl_seconds=ttl)  # port=0 → OS picks free port
-    handle = serve("01HZTESTID", pack, opts)
+    try:
+        handle = serve("01HZTESTID", pack, opts)
+    except PermissionError as exc:
+        pytest.skip(f"loopback bind blocked on this host: {exc}")

     thread = threading.Thread(target=handle._server.serve_forever, daemon=True)
     thread.start()
@@ -46,7 +53,7 @@ def _start_server_in_thread(tmp_path: Path, *, ttl: int = 600):
     return handle, thread, pack_bytes


-def _stop_server(handle, thread: threading.Thread) -> None:
+def _stop_server(handle: ServeHandle, thread: threading.Thread) -> None:
     handle._server.shutdown()
     handle._server.server_close()
     thread.join(timeout=2.0)
tests/unit/base_models/test_probes.py (modified, 28 lines changed)

@@ -152,6 +152,12 @@ class TestProbeChatTemplate:
         ):
             probe_chat_template(_spec())

+    def test_load_error_returns_failed_probe(self) -> None:
+        with patch("transformers.AutoTokenizer.from_pretrained", side_effect=RuntimeError("boom")):
+            result = probe_chat_template(_spec())
+        assert result.passed is False
+        assert "load failed: RuntimeError: boom" in result.detail
+

 class TestProbeGgufArch:
     def test_skips_when_vendor_missing(self, tmp_path: Path) -> None:
@@ -478,6 +484,16 @@ class TestProbeAudioToken:
         ):
             probe_audio_token(_audio_spec())

+    def test_processor_load_generic_error_fails(self) -> None:
+        with patch(
+            "dlm.base_models._typed_shims.load_auto_processor",
+            side_effect=RuntimeError("connection reset"),
+        ):
+            result = probe_audio_token(_audio_spec())
+        assert result.passed is False
+        assert "processor load failed" in result.detail
+        assert "RuntimeError" in result.detail
+
     def test_missing_tokenizer_fails(self) -> None:
         with patch(
             "dlm.base_models._typed_shims.load_auto_processor",
tests/unit/cli/test_app_core.py (added, 91 lines changed)

@@ -0,0 +1,91 @@
+"""Direct coverage for top-level CLI app wiring."""
+
+from __future__ import annotations
+
+import logging
+import runpy
+from unittest.mock import patch
+
+import pytest
+import typer
+
+import dlm.cli.app as cli_app
+
+
+def test_disable_third_party_telemetry_sets_defaults(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.delenv("HF_HUB_DISABLE_TELEMETRY", raising=False)
+    monkeypatch.delenv("DO_NOT_TRACK", raising=False)
+    monkeypatch.delenv("TRANSFORMERS_NO_ADVISORY_WARNINGS", raising=False)
+
+    cli_app._disable_third_party_telemetry()
+
+    assert cli_app.os.environ["HF_HUB_DISABLE_TELEMETRY"] == "1"
+    assert cli_app.os.environ["DO_NOT_TRACK"] == "1"
+    assert cli_app.os.environ["TRANSFORMERS_NO_ADVISORY_WARNINGS"] == "1"
+
+
+def test_version_callback_exits_when_requested(capsys: pytest.CaptureFixture[str]) -> None:
+    with pytest.raises(typer.Exit) as excinfo:
+        cli_app._version_callback(True)
+
+    assert excinfo.value.exit_code == 0
+    assert "dlm " in capsys.readouterr().out
+
+
+def test_version_callback_is_noop_when_flag_is_false(capsys: pytest.CaptureFixture[str]) -> None:
+    cli_app._version_callback(False)
+    assert capsys.readouterr().out == ""
+
+
+def test_root_sets_home_and_debug_logging(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.delenv("DLM_HOME", raising=False)
+
+    with patch("logging.basicConfig") as basic_config:
+        cli_app._root(version=False, home="/tmp/dlm-home", verbose=True, quiet=False)
+
+    assert cli_app.os.environ["DLM_HOME"] == "/tmp/dlm-home"
+    basic_config.assert_called_once_with(
+        level=logging.DEBUG,
+        format="%(asctime)s %(name)s %(levelname)s: %(message)s",
+        force=True,
+    )
+
+
+def test_root_sets_warning_logging_for_quiet_mode() -> None:
+    with patch("logging.basicConfig") as basic_config:
+        cli_app._root(version=False, home=None, verbose=False, quiet=True)
+
+    basic_config.assert_called_once_with(
+        level=logging.WARNING,
+        format="%(asctime)s %(name)s %(levelname)s: %(message)s",
+        force=True,
+    )
+
+
+def test_root_rejects_verbose_and_quiet_together() -> None:
+    with pytest.raises(typer.BadParameter, match="mutually exclusive"):
+        cli_app._root(version=False, home=None, verbose=True, quiet=True)
+
+
+def test_main_routes_through_reporter_and_exits() -> None:
+    with (
+        patch("dlm.cli.reporter.run_with_reporter", return_value=7) as run_with_reporter,
+        patch("sys.exit", side_effect=SystemExit(7)) as sys_exit,
+        pytest.raises(SystemExit) as excinfo,
+    ):
+        cli_app.main()
+
+    assert excinfo.value.code == 7
+    run_with_reporter.assert_called_once_with(cli_app.app)
+    sys_exit.assert_called_once_with(7)
+
+
+def test_module_main_guard_invokes_main() -> None:
+    with (
+        patch("dlm.cli.reporter.run_with_reporter", return_value=3),
+        patch("sys.exit", side_effect=SystemExit(3)),
+        pytest.raises(SystemExit) as excinfo,
+    ):
+        runpy.run_module("dlm.cli.app", run_name="__main__")
+
+    assert excinfo.value.code == 3
tests/unit/cli/test_export_edge_paths.py (added, 258 lines changed)

@@ -0,0 +1,258 @@
+"""Focused early-branch coverage for `dlm export`."""
+
+from __future__ import annotations
+
+from pathlib import Path
+from types import SimpleNamespace
+
+import pytest
+from typer.testing import CliRunner
+
+from dlm.base_models import BaseModelSpec
+from dlm.base_models.errors import GatedModelError
+from dlm.cli.app import app
+from dlm.export.errors import ExportError
+
+
+def _joined_output(result: object) -> str:
+    text = getattr(result, "output", "") + getattr(result, "stderr", "")
+    return " ".join(text.split())
+
+
+def _scaffold_doc(tmp_path: Path) -> Path:
+    doc = tmp_path / "doc.dlm"
+    runner = CliRunner()
+    result = runner.invoke(
+        app,
+        [
+            "--home",
+            str(tmp_path / "home"),
+            "init",
+            str(doc),
+            "--base",
+            "smollm2-135m",
+        ],
+    )
+    assert result.exit_code == 0, result.output
+    return doc
+
+
+def _spec(*, key: str = "demo-1b", modality: str = "text") -> BaseModelSpec:
+    payload: dict[str, object] = {
+        "key": key,
+        "hf_id": f"org/{key}",
+        "revision": "0123456789abcdef0123456789abcdef01234567",
+        "architecture": "DemoForCausalLM",
+        "params": 1_000_000_000,
+        "target_modules": ["q_proj", "v_proj"],
+        "template": "chatml",
+        "gguf_arch": "demo",
+        "tokenizer_pre": "demo",
+        "license_spdx": "Apache-2.0",
+        "license_url": None,
+        "requires_acceptance": False,
+        "redistributable": True,
+        "size_gb_fp16": 2.0,
+        "context_length": 4096,
+        "recommended_seq_len": 2048,
+        "modality": modality,
+    }
+    if modality == "vision-language":
+        payload["vl_preprocessor_plan"] = {
+            "target_size": [224, 224],
+            "image_token": "<image>",
+            "num_image_tokens": 256,
+        }
+    elif modality == "audio-language":
+        payload["audio_preprocessor_plan"] = {
+            "sample_rate": 16000,
+            "audio_token": "<audio>",
+            "num_audio_tokens": 64,
+            "max_length_seconds": 30.0,
+        }
+    return BaseModelSpec.model_validate(payload)
+
+
+def _patch_export_runtime(
+    monkeypatch: pytest.MonkeyPatch,
+    *,
+    spec: BaseModelSpec | None = None,
+    dispatch: object | None = None,
+) -> None:
+    monkeypatch.setattr(
+        "dlm.base_models.resolve",
+        lambda *args, **kwargs: spec or _spec(),
+    )
+    monkeypatch.setattr(
+        "dlm.modality.modality_for",
+        lambda model_spec: (
+            dispatch
+            or SimpleNamespace(
+                accepts_images=model_spec.modality == "vision-language",
+                accepts_audio=model_spec.modality == "audio-language",
+            )
+        ),
+    )
+
+
+class TestExportEdgePaths:
+    def test_gate_fallback_banner_prints_before_gated_base_refusal(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+
+        monkeypatch.setattr(
+            "dlm.export.gate_fallback.resolve_and_announce",
+            lambda store, parsed: SimpleNamespace(
+                entries=[("knowledge", 0.7), ("tone", 0.3)],
+                banner_lines=["[yellow]gate:[/yellow] using learned adapter prior"],
+            ),
+        )
+        monkeypatch.setattr(
+            "dlm.base_models.resolve",
+            lambda *args, **kwargs: (_ for _ in ()).throw(
+                GatedModelError("org/gated-base", "https://example.test/license")
+            ),
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc)],
+        )
+
+        assert result.exit_code == 1, result.output
+        text = _joined_output(result)
+        assert "using learned adapter prior" in text
+        assert "review the license at: https://example.test/license" in text
+        assert "accept via `dlm train --i-accept-license` before exporting." in text
+
+    @pytest.mark.parametrize(
+        ("target", "modality", "needle"),
+        [
+            (
+                "vllm",
+                "audio-language",
+                "--target vllm is not wired for audio-language documents yet",
+            ),
+            (
+                "mlx-serve",
+                "audio-language",
+                "--target mlx-serve is not wired for audio-language documents yet",
+            ),
+            (
+                "vllm",
+                "vision-language",
+                "--target vllm is not wired for vision-language documents yet",
+            ),
+            (
+                "mlx-serve",
+                "vision-language",
+                "--target mlx-serve is not wired for vision-language documents yet",
+            ),
+        ],
+    )
+    def test_runtime_targets_refuse_unsupported_modalities(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+        target: str,
+        modality: str,
+        needle: str,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+
+        _patch_export_runtime(
+            monkeypatch, spec=_spec(key=f"{target}-{modality}", modality=modality)
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc), "--target", target],
+        )
+
+        assert result.exit_code == 2, result.output
+        assert needle in _joined_output(result)
+
+    def test_audio_dispatch_export_error_maps_to_exit_1(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+
+        class _AudioDispatch:
+            accepts_images = False
+            accepts_audio = True
+
+            def dispatch_export(self, **kwargs: object) -> object:
+                raise ExportError("audio snapshot failed")
+
+        _patch_export_runtime(
+            monkeypatch,
+            spec=_spec(key="audio-demo", modality="audio-language"),
+            dispatch=_AudioDispatch(),
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc)],
+        )
+
+        assert result.exit_code == 1, result.output
+        assert "audio snapshot failed" in _joined_output(result)
+
+    def test_vl_dispatch_export_error_maps_to_exit_1(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+
+        class _VlDispatch:
+            accepts_images = True
+            accepts_audio = False
+
+            def dispatch_export(self, **kwargs: object) -> object:
+                raise ExportError("vl snapshot failed")
+
+        _patch_export_runtime(
+            monkeypatch,
+            spec=_spec(key="vl-demo", modality="vision-language"),
+            dispatch=_VlDispatch(),
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc)],
+        )
+
+        assert result.exit_code == 1, result.output
+        assert "vl snapshot failed" in _joined_output(result)
+
+    def test_invalid_export_plan_value_exits_2(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+
+        _patch_export_runtime(monkeypatch)
+        monkeypatch.setattr(
+            "dlm.export.resolve_export_plan",
+            lambda **kwargs: (_ for _ in ()).throw(ValueError("bad export plan")),
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc)],
+        )
+
+        assert result.exit_code == 2, result.output
+        assert "bad export plan" in _joined_output(result)
tests/unit/cli/test_export_run_errors.py (added, 191 lines)
@@ -0,0 +1,191 @@
+"""CLI coverage for generic `run_export(...)` branches."""
+
+from __future__ import annotations
+
+from pathlib import Path
+from types import SimpleNamespace
+from typing import Any
+
+import pytest
+from typer.testing import CliRunner
+
+from dlm.base_models import BaseModelSpec
+from dlm.cli.app import app
+from dlm.export.errors import ExportError, PreflightError, SubprocessError, UnsafeMergeError
+from dlm.export.ollama.errors import (
+    OllamaCreateError,
+    OllamaError,
+    OllamaSmokeError,
+    OllamaVersionError,
+)
+
+
+def _joined_output(result: object) -> str:
+    text = getattr(result, "output", "") + getattr(result, "stderr", "")
+    return " ".join(text.split())
+
+
+def _scaffold_doc(tmp_path: Path) -> Path:
+    doc = tmp_path / "doc.dlm"
+    runner = CliRunner()
+    result = runner.invoke(
+        app,
+        [
+            "--home",
+            str(tmp_path / "home"),
+            "init",
+            str(doc),
+            "--base",
+            "smollm2-135m",
+        ],
+    )
+    assert result.exit_code == 0, result.output
+    return doc
+
+
+def _spec() -> BaseModelSpec:
+    return BaseModelSpec.model_validate(
+        {
+            "key": "demo-1b",
+            "hf_id": "org/demo-1b",
+            "revision": "0123456789abcdef0123456789abcdef01234567",
+            "architecture": "DemoForCausalLM",
+            "params": 1_000_000_000,
+            "target_modules": ["q_proj", "v_proj"],
+            "template": "chatml",
+            "gguf_arch": "demo",
+            "tokenizer_pre": "demo",
+            "license_spdx": "Apache-2.0",
+            "license_url": None,
+            "requires_acceptance": False,
+            "redistributable": True,
+            "size_gb_fp16": 2.0,
+            "context_length": 4096,
+            "recommended_seq_len": 2048,
+        }
+    )
+
+
+def _patch_export_runtime(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr("dlm.base_models.resolve", lambda *args, **kwargs: _spec())
+    monkeypatch.setattr(
+        "dlm.base_models.download_spec",
+        lambda *args, **kwargs: SimpleNamespace(path=Path("/tmp/base-cache")),
+    )
+    monkeypatch.setattr(
+        "dlm.modality.modality_for",
+        lambda spec: SimpleNamespace(accepts_images=False, accepts_audio=False),
+    )
+    monkeypatch.setattr(
+        "dlm.export.gate_fallback.resolve_and_announce",
+        lambda store, parsed: SimpleNamespace(entries=None, banner_lines=[]),
+    )
+    monkeypatch.setattr(
+        "dlm.export.targets.resolve_target",
+        lambda name: SimpleNamespace(name="ollama"),
+    )
+
+
+class TestExportRunErrors:
+    def test_verbose_success_prints_shell_command_and_cached_tag(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+        captured: dict[str, Any] = {}
+
+        _patch_export_runtime(monkeypatch)
+
+        def _run_export(
+            store: object,
+            spec: object,
+            plan: object,
+            **kwargs: object,
+        ) -> object:
+            captured.update(kwargs)
+            subprocess_runner = kwargs["subprocess_runner"]
+            assert callable(subprocess_runner)
+            subprocess_runner(["llama-quantize", "--version"])
+            return SimpleNamespace(
+                cached=True,
+                export_dir=tmp_path / "exports" / "Q4_K_M",
+                artifacts=[SimpleNamespace(name="base.gguf"), SimpleNamespace(name="adapter.gguf")],
+                target="ollama",
+                ollama_name="demo-model",
+                ollama_version=1,
+                smoke_output_first_line="hello smoke",
+            )
+
+        monkeypatch.setattr("dlm.export.run_export", _run_export)
+        monkeypatch.setattr(
+            "dlm.export.quantize.run_checked", lambda cmd: SimpleNamespace(returncode=0)
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc), "--verbose"],
+        )
+
+        assert result.exit_code == 0, result.output
+        text = _joined_output(result)
+        assert "$ llama-quantize --version" in text
+        assert "(cached base)" in text
+        assert "ollama: demo-model (v1)" in text
+        assert "smoke: hello smoke" in text
+        assert captured["cached_base_dir"] == Path("/tmp/base-cache")
+        assert captured["target"] == "ollama"
+
+    @pytest.mark.parametrize(
+        ("error", "needle"),
+        [
+            (UnsafeMergeError("needs --dequantize"), "merge:"),
+            (
+                PreflightError(probe="template", detail="template mismatch"),
+                "preflight: template mismatch",
+            ),
+            (
+                SubprocessError(
+                    cmd=["llama-quantize"],
+                    returncode=3,
+                    stderr_tail="quantize failed",
+                ),
+                "subprocess:",
+            ),
+            (
+                OllamaVersionError(detected=(0, 1, 0), required=(0, 6, 0)),
+                "ollama:",
+            ),
+            (OllamaCreateError(stdout="", stderr="create failed"), "ollama create:"),
+            (OllamaSmokeError(stdout="", stderr="smoke failed"), "smoke:"),
+            (OllamaError("generic ollama error"), "ollama:"),
+            (ExportError("plain export failure"), "export:"),
+        ],
+    )
+    def test_run_export_error_mappings_exit_1(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+        error: Exception,
+        needle: str,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+
+        _patch_export_runtime(monkeypatch)
+        monkeypatch.setattr(
+            "dlm.export.run_export",
+            lambda *args, **kwargs: (_ for _ in ()).throw(error),
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc)],
+        )
+
+        assert result.exit_code == 1, result.output
+        text = _joined_output(result)
+        assert needle in text
+        if isinstance(error, OllamaSmokeError):
+            assert "re-run with `--no-smoke`" in text
tests/unit/cli/test_export_target_runtime_paths.py (added, 352 lines)
@@ -0,0 +1,352 @@
+"""CLI coverage for vLLM / MLX runtime-target success and smoke paths."""
+
+from __future__ import annotations
+
+from pathlib import Path
+from types import SimpleNamespace
+from typing import Any
+
+import pytest
+from typer.testing import CliRunner
+
+from dlm.base_models import BaseModelSpec
+from dlm.cli.app import app
+from dlm.export.errors import ExportError
+
+
+def _joined_output(result: object) -> str:
+    text = getattr(result, "output", "") + getattr(result, "stderr", "")
+    return " ".join(text.split())
+
+
+def _scaffold_doc(tmp_path: Path) -> Path:
+    doc = tmp_path / "doc.dlm"
+    runner = CliRunner()
+    result = runner.invoke(
+        app,
+        [
+            "--home",
+            str(tmp_path / "home"),
+            "init",
+            str(doc),
+            "--base",
+            "smollm2-135m",
+        ],
+    )
+    assert result.exit_code == 0, result.output
+    return doc
+
+
+def _spec() -> BaseModelSpec:
+    return BaseModelSpec.model_validate(
+        {
+            "key": "demo-1b",
+            "hf_id": "org/demo-1b",
+            "revision": "0123456789abcdef0123456789abcdef01234567",
+            "architecture": "DemoForCausalLM",
+            "params": 1_000_000_000,
+            "target_modules": ["q_proj", "v_proj"],
+            "template": "chatml",
+            "gguf_arch": "demo",
+            "tokenizer_pre": "demo",
+            "license_spdx": "Apache-2.0",
+            "license_url": None,
+            "requires_acceptance": False,
+            "redistributable": True,
+            "size_gb_fp16": 2.0,
+            "context_length": 4096,
+            "recommended_seq_len": 2048,
+        }
+    )
+
+
+def _patch_text_export_runtime(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr("dlm.base_models.resolve", lambda *args, **kwargs: _spec())
+    monkeypatch.setattr(
+        "dlm.base_models.download_spec",
+        lambda *args, **kwargs: SimpleNamespace(path=Path("/tmp/base-cache")),
+    )
+    monkeypatch.setattr(
+        "dlm.modality.modality_for",
+        lambda spec: SimpleNamespace(accepts_images=False, accepts_audio=False),
+    )
+    monkeypatch.setattr(
+        "dlm.export.gate_fallback.resolve_and_announce",
+        lambda store, parsed: SimpleNamespace(entries=None, banner_lines=[]),
+    )
+
+
+class _FakeTarget:
+    def __init__(self, name: str, smoke_result: object | None) -> None:
+        self.name = name
+        self._smoke_result = smoke_result
+        self.calls: list[object] = []
+
+    def smoke_test(self, prepared: object) -> object | None:
+        self.calls.append(prepared)
+        return self._smoke_result
+
+
+class TestExportRuntimeTargetPaths:
+    def test_vllm_target_success_prints_launch_config_and_smoke(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+        captured: dict[str, Any] = {}
+        smoke = SimpleNamespace(ok=True, detail="vllm smoke ok")
+        fake_target = _FakeTarget("vllm", smoke)
+
+        _patch_text_export_runtime(monkeypatch)
+        monkeypatch.setattr("dlm.export.targets.resolve_target", lambda name: fake_target)
+
+        def _prepare(**kwargs: object) -> object:
+            captured.update(kwargs)
+            export_dir = tmp_path / "exports" / "vllm"
+            launch = export_dir / "vllm_launch.sh"
+            config = export_dir / "vllm_config.json"
+            return SimpleNamespace(
+                export_dir=export_dir,
+                launch_script_path=launch,
+                config_path=config,
+            )
+
+        monkeypatch.setattr("dlm.export.targets.prepare_vllm_export", _prepare)
+        monkeypatch.setattr(
+            "dlm.export.targets.finalize_vllm_export",
+            lambda **kwargs: tmp_path / "exports" / "vllm" / "export_manifest.json",
+        )
+
+        result = runner.invoke(
+            app,
+            [
+                "--home",
+                str(tmp_path / "home"),
+                "export",
+                str(doc),
+                "--target",
+                "vllm",
+                "--name",
+                "served-demo",
+                "--quant",
+                "Q4_K_M",
+                "--merged",
+                "--dequantize",
+                "--no-template",
+                "--skip-ollama",
+                "--no-imatrix",
+                "--draft",
+                "qwen2.5:0.5b",
+            ],
+        )
+
+        assert result.exit_code == 0, result.output
+        text = _joined_output(result)
+        assert "ignoring flags not applicable to `--target vllm`" in text
+        assert "--quant" in text
+        assert "--merged" in text
+        assert "--dequantize" in text
+        assert "--no-template" in text
+        assert "--skip-ollama" in text
+        assert "--no-imatrix" in text
+        assert "--draft" in text
+        assert "target: vllm" in text
+        assert "launch: vllm_launch.sh" in text
+        assert "config: vllm_config.json" in text
+        assert "manifest: export_manifest.json" in text
+        assert "smoke: vllm smoke ok" in text
+        assert captured["served_model_name"] == "served-demo"
+        assert captured["training_sequence_len"] == 2048
+        assert fake_target.calls
+
+    def test_vllm_target_prepare_error_exits_1(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+
+        _patch_text_export_runtime(monkeypatch)
+        monkeypatch.setattr(
+            "dlm.export.targets.resolve_target",
+            lambda name: _FakeTarget("vllm", None),
+        )
+        monkeypatch.setattr(
+            "dlm.export.targets.prepare_vllm_export",
+            lambda **kwargs: (_ for _ in ()).throw(ExportError("vllm prepare failed")),
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc), "--target", "vllm"],
+        )
+
+        assert result.exit_code == 1, result.output
+        assert "vllm prepare failed" in _joined_output(result)
+
+    def test_vllm_target_smoke_failure_exits_1(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+        fake_target = _FakeTarget("vllm", SimpleNamespace(ok=False, detail="vllm smoke failed"))
+
+        _patch_text_export_runtime(monkeypatch)
+        monkeypatch.setattr("dlm.export.targets.resolve_target", lambda name: fake_target)
+        monkeypatch.setattr(
+            "dlm.export.targets.prepare_vllm_export",
+            lambda **kwargs: SimpleNamespace(
+                export_dir=tmp_path / "exports" / "vllm",
+                launch_script_path=tmp_path / "exports" / "vllm" / "vllm_launch.sh",
+                config_path=tmp_path / "exports" / "vllm" / "vllm_config.json",
+            ),
+        )
+        monkeypatch.setattr(
+            "dlm.export.targets.finalize_vllm_export",
+            lambda **kwargs: tmp_path / "exports" / "vllm" / "export_manifest.json",
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc), "--target", "vllm"],
+        )
+
+        assert result.exit_code == 1, result.output
+        text = _joined_output(result)
+        assert "vllm smoke failed" in text
+        assert "re-run with `--no-smoke`" in text
+
+    def test_mlx_target_success_prints_launch_manifest_and_smoke(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+        captured: dict[str, Any] = {}
+        smoke = SimpleNamespace(ok=True, detail="mlx smoke ok")
+        fake_target = _FakeTarget("mlx-serve", smoke)
+
+        _patch_text_export_runtime(monkeypatch)
+        monkeypatch.setattr("dlm.export.targets.resolve_target", lambda name: fake_target)
+
+        def _prepare(**kwargs: object) -> object:
+            captured.update(kwargs)
+            export_dir = tmp_path / "exports" / "mlx-serve"
+            launch = export_dir / "mlx_serve_launch.sh"
+            return SimpleNamespace(
+                export_dir=export_dir,
+                launch_script_path=launch,
+            )
+
+        monkeypatch.setattr("dlm.export.targets.prepare_mlx_serve_export", _prepare)
+        monkeypatch.setattr(
+            "dlm.export.targets.finalize_mlx_serve_export",
+            lambda **kwargs: tmp_path / "exports" / "mlx-serve" / "export_manifest.json",
+        )
+
+        result = runner.invoke(
+            app,
+            [
+                "--home",
+                str(tmp_path / "home"),
+                "export",
+                str(doc),
+                "--target",
+                "mlx-serve",
+                "--name",
+                "ignored-name",
+                "--quant",
+                "Q4_K_M",
+                "--merged",
+                "--dequantize",
+                "--no-template",
+                "--skip-ollama",
+                "--no-imatrix",
+                "--draft",
+                "qwen2.5:0.5b",
+            ],
+        )
+
+        assert result.exit_code == 0, result.output
+        text = _joined_output(result)
+        assert "ignoring flags not applicable to `--target mlx-serve`" in text
+        assert "--name" in text
+        assert "--quant" in text
+        assert "--merged" in text
+        assert "--dequantize" in text
+        assert "--no-template" in text
+        assert "--skip-ollama" in text
+        assert "--no-imatrix" in text
+        assert "--draft" in text
+        assert "target: mlx-serve" in text
+        assert "launch: mlx_serve_launch.sh" in text
+        assert "manifest: export_manifest.json" in text
+        assert "smoke: mlx smoke ok" in text
+        assert captured["adapter_name"] is None
+        assert captured["adapter_path_override"] is None
+        assert fake_target.calls
+
+    def test_mlx_target_prepare_error_exits_1(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+
+        _patch_text_export_runtime(monkeypatch)
+        monkeypatch.setattr(
+            "dlm.export.targets.resolve_target",
+            lambda name: _FakeTarget("mlx-serve", None),
+        )
+        monkeypatch.setattr(
+            "dlm.export.targets.prepare_mlx_serve_export",
+            lambda **kwargs: (_ for _ in ()).throw(ExportError("mlx prepare failed")),
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc), "--target", "mlx-serve"],
+        )
+
+        assert result.exit_code == 1, result.output
+        assert "mlx prepare failed" in _joined_output(result)
+
+    def test_mlx_target_smoke_failure_exits_1(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = _scaffold_doc(tmp_path)
+        runner = CliRunner()
+        fake_target = _FakeTarget("mlx-serve", SimpleNamespace(ok=False, detail="mlx smoke failed"))
+
+        _patch_text_export_runtime(monkeypatch)
+        monkeypatch.setattr("dlm.export.targets.resolve_target", lambda name: fake_target)
+        monkeypatch.setattr(
+            "dlm.export.targets.prepare_mlx_serve_export",
+            lambda **kwargs: SimpleNamespace(
+                export_dir=tmp_path / "exports" / "mlx-serve",
+                launch_script_path=tmp_path / "exports" / "mlx-serve" / "mlx_serve_launch.sh",
+            ),
+        )
+        monkeypatch.setattr(
+            "dlm.export.targets.finalize_mlx_serve_export",
+            lambda **kwargs: tmp_path / "exports" / "mlx-serve" / "export_manifest.json",
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "export", str(doc), "--target", "mlx-serve"],
+        )
+
+        assert result.exit_code == 1, result.output
+        text = _joined_output(result)
+        assert "mlx smoke failed" in text
+        assert "re-run with `--no-smoke`" in text
tests/unit/cli/test_init_edges.py (added, 157 lines)
@@ -0,0 +1,157 @@
+"""Edge coverage for `dlm init` helper paths near the top of cli/commands."""
+
+from __future__ import annotations
+
+from pathlib import Path
+from types import SimpleNamespace
+
+import pytest
+from rich.console import Console
+from typer.testing import CliRunner
+
+import dlm.base_models as base_models
+import dlm.templates as templates
+from dlm.base_models.errors import GatedModelError
+from dlm.cli import commands
+from dlm.cli.app import app
+from dlm.templates.errors import TemplateError
+
+
+def test_stub_mentions_sprint_and_subject() -> None:
+    with pytest.raises(NotImplementedError, match="owned by Sprint 43"):
+        commands._stub("43", "dlm synth")
+
+
+class TestPromptAcceptLicense:
+    def test_non_tty_returns_false(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        console = Console(record=True)
+        monkeypatch.setattr("sys.stdin.isatty", lambda: False)
+
+        assert commands._prompt_accept_license(console, "llama-3.2-1b", None) is False
+
+    def test_yes_accepts_and_prints_license_url(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        console = Console(record=True)
+        monkeypatch.setattr("sys.stdin.isatty", lambda: True)
+        monkeypatch.setattr("builtins.input", lambda: "Yes")
+
+        assert (
+            commands._prompt_accept_license(
+                console,
+                "llama-3.2-1b",
+                "https://example.test/license",
+            )
+            is True
+        )
+        text = console.export_text()
+        assert "requires accepting the upstream license" in text
+        assert "https://example.test/license" in text
+
+    def test_eof_returns_false(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        console = Console(record=True)
+        monkeypatch.setattr("sys.stdin.isatty", lambda: True)
+
+        def _raise_eof() -> str:
+            raise EOFError
+
+        monkeypatch.setattr("builtins.input", _raise_eof)
+
+        assert commands._prompt_accept_license(console, "llama-3.2-1b", None) is False
+
+
+class TestInitTemplateEdges:
+    def test_explicit_base_warning_when_template_overrides(self, tmp_path: Path) -> None:
+        runner = CliRunner()
+        out = tmp_path / "doc.dlm"
+        home = tmp_path / "home"
+
+        result = runner.invoke(
+            app,
+            [
+                "--home",
+                str(home),
+                "init",
+                str(out),
+                "--base",
+                "smollm2-135m",
+                "--template",
+                "changelog",
+            ],
+        )
+
+        assert result.exit_code == 0, result.output
+        joined = " ".join((result.output + result.stderr).split())
+        assert "--base smollm2-135m ignored" in joined
+        assert "uses smollm2-360m" in joined
+
+    def test_interactive_acceptance_retries_resolution(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        runner = CliRunner()
+        out = tmp_path / "doc.dlm"
+        home = tmp_path / "home"
+        calls: list[tuple[str, bool, bool]] = []
+        spec = SimpleNamespace(key="llama-3.2-1b", revision="rev-1", modality="text")
+
+        def _fake_resolve(
+            base: str,
+            *,
+            accept_license: bool = False,
+            skip_export_probes: bool = False,
+        ) -> object:
+            calls.append((base, accept_license, skip_export_probes))
+            if len(calls) == 1:
+                raise GatedModelError(base, "https://example.test/license")
+            return spec
+
+        monkeypatch.setattr(base_models, "resolve", _fake_resolve)
+        monkeypatch.setattr(base_models, "is_gated", lambda spec: False)
+        monkeypatch.setattr(commands, "_prompt_accept_license", lambda console, base, url: True)
+
+        result = runner.invoke(
+            app,
+            ["--home", str(home), "init", str(out), "--base", "llama-3.2-1b"],
+        )
+
+        assert result.exit_code == 0, result.output
+        assert calls == [
+            ("llama-3.2-1b", False, False),
+            ("llama-3.2-1b", True, False),
+        ]
+        assert out.exists()
+
+    def test_template_apply_error_exits_cleanly(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        runner = CliRunner()
+        out = tmp_path / "doc.dlm"
+        home = tmp_path / "home"
+
+        monkeypatch.setattr(
+            templates,
+            "load_template",
+            lambda name: SimpleNamespace(meta=SimpleNamespace(recommended_base="smollm2-135m")),
+        )
+
+        def _fake_apply_template(
+            name: str,
+            target: Path,
+            *,
+            force: bool = False,
+            accept_license: bool = False,
+        ) -> object:
+            raise TemplateError("template exploded")
+
+        monkeypatch.setattr(templates, "apply_template", _fake_apply_template)
+
+        result = runner.invoke(
+            app,
+            ["--home", str(home), "init", str(out), "--template", "custom"],
+        )
+
+        assert result.exit_code == 1
+        assert "template exploded" in result.output
+        assert not out.exists()
tests/unit/cli/test_prompt_edges.py (added, 291 lines)
@@ -0,0 +1,291 @@
+"""Focused `dlm prompt` edge coverage for the remaining text/VL/audio branches."""
+
+from __future__ import annotations
+
+from pathlib import Path
+from types import SimpleNamespace
+from typing import Any
+
+import pytest
+from typer.testing import CliRunner
+
+from dlm.base_models import BaseModelSpec
+from dlm.cli.app import app
+
+
+def _write_doc(path: Path, *, base_model: str = "demo-1b") -> None:
+    path.write_text(
+        f"---\ndlm_id: 01HZ4X7TGZM3J1A2B3C4D5E6F7\nbase_model: {base_model}\n---\nbody\n",
+        encoding="utf-8",
+    )
+
+
+def _joined_output(result: object) -> str:
+    text = getattr(result, "output", "") + getattr(result, "stderr", "")
+    return " ".join(text.split())
+
+
+def _spec(*, key: str = "demo-1b", modality: str = "text") -> BaseModelSpec:
+    payload: dict[str, object] = {
+        "key": key,
+        "hf_id": f"org/{key}",
+        "revision": "0123456789abcdef0123456789abcdef01234567",
+        "architecture": "DemoForCausalLM",
+        "params": 1_000_000_000,
+        "target_modules": ["q_proj", "v_proj"],
+        "template": "chatml",
+        "gguf_arch": "demo",
+        "tokenizer_pre": "demo",
+        "license_spdx": "Apache-2.0",
+        "license_url": None,
+        "requires_acceptance": False,
+        "redistributable": True,
+        "size_gb_fp16": 2.0,
+        "context_length": 4096,
+        "recommended_seq_len": 2048,
+        "modality": modality,
+    }
+    if modality == "vision-language":
+        payload["vl_preprocessor_plan"] = {
+            "target_size": [224, 224],
+            "image_token": "<image>",
+            "num_image_tokens": 256,
+        }
+    elif modality == "audio-language":
+        payload["audio_preprocessor_plan"] = {
+            "sample_rate": 16000,
+            "audio_token": "<audio>",
+            "num_audio_tokens": 64,
+            "max_length_seconds": 30.0,
+        }
+    return BaseModelSpec.model_validate(payload)
+
+
+def _patch_prompt_runtime(
+    monkeypatch: pytest.MonkeyPatch,
+    *,
+    spec: BaseModelSpec | None = None,
+    dispatch: object | None = None,
+) -> None:
+    monkeypatch.setattr(
+        "dlm.base_models.resolve",
+        lambda *args, **kwargs: spec or _spec(),
+    )
+    monkeypatch.setattr(
+        "dlm.hardware.doctor",
+        lambda: SimpleNamespace(capabilities=object()),
+    )
+    monkeypatch.setattr(
+        "dlm.modality.modality_for",
+        lambda model_spec: (
+            dispatch
+            or SimpleNamespace(
+                accepts_images=model_spec.modality == "vision-language",
+                accepts_audio=model_spec.modality == "audio-language",
+            )
+        ),
+    )
+
+
+class TestPromptEdgeBranches:
+    def test_invalid_backend_value_exits_2(self, tmp_path: Path) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_doc(doc)
+        runner = CliRunner()
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "prompt", str(doc), "hello", "--backend", "bogus"],
+        )
+
+        assert result.exit_code == 2, result.output
+        assert "--backend must be" in _joined_output(result)
+
+    def test_gated_base_without_recorded_acceptance_exits_1(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        from dlm.base_models.errors import GatedModelError
+
+        doc = tmp_path / "doc.dlm"
+        _write_doc(doc, base_model="gated-base")
+        runner = CliRunner()
+
+        monkeypatch.setattr(
+            "dlm.base_models.resolve",
+            lambda *args, **kwargs: (_ for _ in ()).throw(
+                GatedModelError("org/gated-base", "https://license.example")
+            ),
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "prompt", str(doc), "hello"],
+        )
+
+        assert result.exit_code == 1, result.output
+        assert "run `dlm train --i-accept-license` first" in _joined_output(result)
+
+    def test_unsupported_backend_error_exits_2(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        from dlm.inference.backends.select import UnsupportedBackendError
+
+        doc = tmp_path / "doc.dlm"
+        _write_doc(doc)
+        runner = CliRunner()
+
+        _patch_prompt_runtime(monkeypatch)
+        monkeypatch.setattr(
+            "dlm.inference.backends.select_backend",
+            lambda *args, **kwargs: (_ for _ in ()).throw(
+                UnsupportedBackendError("mlx backend unavailable")
+            ),
+        )
+
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path / "home"), "prompt", str(doc), "hello", "--backend", "mlx"],
+        )
+
+        assert result.exit_code == 2, result.output
+        assert "mlx backend unavailable" in _joined_output(result)
+
+    def test_verbose_text_prompt_logs_backend_and_generates(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_doc(doc)
+        runner = CliRunner()
+        captured: dict[str, Any] = {}
+
+        class _FakeBackend:
+            def load(self, spec: object, store: object, adapter_name: str | None = None) -> None:
+                captured["adapter_name"] = adapter_name
170
+
171
+            def generate(self, query: str, **kwargs: object) -> str:
172
+                captured["query"] = query
173
+                captured["kwargs"] = kwargs
174
+                return "ok"
175
+
176
+        _patch_prompt_runtime(monkeypatch)
177
+        monkeypatch.setattr(
178
+            "dlm.inference.backends.select_backend",
179
+            lambda *args, **kwargs: "pytorch",
180
+        )
181
+        monkeypatch.setattr(
182
+            "dlm.inference.backends.build_backend",
183
+            lambda *args, **kwargs: _FakeBackend(),
184
+        )
185
+
186
+        result = runner.invoke(
187
+            app,
188
+            ["--home", str(tmp_path / "home"), "prompt", str(doc), "hello", "--verbose"],
189
+        )
190
+
191
+        assert result.exit_code == 0, result.output
192
+        assert captured["query"] == "hello"
193
+        assert "backend: pytorch" in _joined_output(result)
194
+        kwargs = captured["kwargs"]
195
+        assert isinstance(kwargs, dict)
196
+        assert kwargs["top_p"] is None
197
+
198
+    def test_missing_adapter_maps_to_exit_1(
199
+        self,
200
+        tmp_path: Path,
201
+        monkeypatch: pytest.MonkeyPatch,
202
+    ) -> None:
203
+        from dlm.inference import AdapterNotFoundError
204
+
205
+        doc = tmp_path / "doc.dlm"
206
+        _write_doc(doc)
207
+        runner = CliRunner()
208
+
209
+        class _MissingAdapterBackend:
210
+            def load(self, spec: object, store: object, adapter_name: str | None = None) -> None:
211
+                raise AdapterNotFoundError("missing adapter")
212
+
213
+        _patch_prompt_runtime(monkeypatch)
214
+        monkeypatch.setattr(
215
+            "dlm.inference.backends.select_backend",
216
+            lambda *args, **kwargs: "pytorch",
217
+        )
218
+        monkeypatch.setattr(
219
+            "dlm.inference.backends.build_backend",
220
+            lambda *args, **kwargs: _MissingAdapterBackend(),
221
+        )
222
+
223
+        result = runner.invoke(
224
+            app,
225
+            ["--home", str(tmp_path / "home"), "prompt", str(doc), "hello"],
226
+        )
227
+
228
+        assert result.exit_code == 1, result.output
229
+        assert "missing adapter" in _joined_output(result)
230
+
231
+    def test_vision_language_dispatch_branch_invokes_helper(
232
+        self,
233
+        tmp_path: Path,
234
+        monkeypatch: pytest.MonkeyPatch,
235
+    ) -> None:
236
+        doc = tmp_path / "doc.dlm"
237
+        _write_doc(doc, base_model="vl-demo")
238
+        image = tmp_path / "frame.png"
239
+        image.write_bytes(b"\x89PNG fake")
240
+        runner = CliRunner()
241
+        captured: dict[str, Any] = {}
242
+
243
+        _patch_prompt_runtime(
244
+            monkeypatch,
245
+            spec=_spec(key="vl-demo", modality="vision-language"),
246
+        )
247
+        monkeypatch.setattr(
248
+            "dlm.cli.commands._dispatch_vl_prompt",
249
+            lambda **kwargs: captured.update(kwargs),
250
+        )
251
+
252
+        result = runner.invoke(
253
+            app,
254
+            ["--home", str(tmp_path / "home"), "prompt", str(doc), "hello", "--image", str(image)],
255
+        )
256
+
257
+        assert result.exit_code == 0, result.output
258
+        assert captured["query"] == "hello"
259
+        assert captured["image_paths"] == [image]
260
+        assert captured["spec"].key == "vl-demo"
261
+
262
+    def test_audio_dispatch_branch_invokes_helper(
263
+        self,
264
+        tmp_path: Path,
265
+        monkeypatch: pytest.MonkeyPatch,
266
+    ) -> None:
267
+        doc = tmp_path / "doc.dlm"
268
+        _write_doc(doc, base_model="audio-demo")
269
+        audio = tmp_path / "clip.wav"
270
+        audio.write_bytes(b"fake wav bytes")
271
+        runner = CliRunner()
272
+        captured: dict[str, Any] = {}
273
+
274
+        _patch_prompt_runtime(
275
+            monkeypatch,
276
+            spec=_spec(key="audio-demo", modality="audio-language"),
277
+        )
278
+        monkeypatch.setattr(
279
+            "dlm.cli.commands._dispatch_audio_prompt",
280
+            lambda **kwargs: captured.update(kwargs),
281
+        )
282
+
283
+        result = runner.invoke(
284
+            app,
285
+            ["--home", str(tmp_path / "home"), "prompt", str(doc), "hello", "--audio", str(audio)],
286
+        )
287
+
288
+        assert result.exit_code == 0, result.output
289
+        assert captured["query"] == "hello"
290
+        assert captured["audio_paths"] == [audio]
291
+        assert captured["spec"].key == "audio-demo"
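The monkeypatched stand-ins above raise exceptions from a `lambda` via `(_ for _ in ()).throw(...)`. The trick works because a lambda body cannot contain a `raise` statement, while calling `.throw()` on a fresh generator re-raises the given exception at the call site. A standalone sketch of the idiom (not from the dlm codebase):

```python
# A lambda body cannot contain `raise`, so the tests build a fresh
# generator expression and call .throw() on it, which propagates the
# exception to the caller immediately.
raiser = lambda *args, **kwargs: (_ for _ in ()).throw(ValueError("boom"))

try:
    raiser("any", key="args")
except ValueError as exc:
    message = str(exc)
```

Because the generator is empty and never started, `.throw()` cannot be absorbed by the generator body, so the exception always escapes.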
tests/unit/cli/test_reporter.py (modified)
46 lines changed
@@ -4,7 +4,7 @@ from __future__ import annotations
 
 import pytest
 
-from dlm.cli.reporter import report_exception, run_with_reporter
+from dlm.cli.reporter import _prefix_for, report_exception, run_with_reporter
 
 
 class TestTier1ParseError:
@@ -44,6 +44,22 @@ class TestTier2DomainError:
         err = capsys.readouterr().err
         assert "export:" in err
 
+    def test_typed_error_verbose_env_surfaces_traceback(
+        self,
+        capsys: pytest.CaptureFixture[str],
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        from dlm.export.errors import UnsafeMergeError
+
+        monkeypatch.setenv("DLM_VERBOSE", "1")
+        exc = UnsafeMergeError("needs --dequantize")
+        code = report_exception(exc)
+
+        assert code == 1
+        err = capsys.readouterr().err
+        assert "export:" in err
+        assert "UnsafeMergeError" in err
+
 
 class TestPrefixMapping:
     """Each known module prefix gets a distinct colored label."""
@@ -91,6 +107,16 @@ class TestPrefixMapping:
         err = capsys.readouterr().err
         assert "base_model:" in err
 
+    def test_doc_prefix_branch_is_mapped(self) -> None:
+        doc_error = type("DocError", (Exception,), {"__module__": "dlm.doc.custom"})("boom")
+
+        assert _prefix_for(doc_error) == "doc"
+
+    def test_hardware_prefix_branch_is_mapped(self) -> None:
+        from dlm.hardware.refusals import ResolutionError
+
+        assert _prefix_for(ResolutionError("no plan")) == "doctor"
+
 
 class TestTier3Uncaught:
     def test_unknown_exception_gets_verbose_hint(self, capsys: pytest.CaptureFixture[str]) -> None:
tests/unit/cli/test_scaffold.py (modified)
22 lines changed
@@ -121,6 +121,22 @@ def test_second_run_reuses_existing(tmp_path: Path) -> None:
     assert second.dlm_id == first.dlm_id
 
 
+def test_second_run_reuses_lone_existing_file_when_default_name_is_unmatched(
+    tmp_path: Path,
+) -> None:
+    kwargs = _default_kwargs()
+    kwargs["name"] = "notes"
+    first = scaffold_train_target(tmp_path, **kwargs)  # type: ignore[arg-type]
+
+    resume = _default_kwargs()
+    resume["base"] = None
+    resolved = scaffold_train_target(tmp_path, **resume)  # type: ignore[arg-type]
+
+    assert resolved.scaffolded is False
+    assert resolved.dlm_path == first.dlm_path
+    assert resolved.dlm_id == first.dlm_id
+
+
 # ---- Multi-file disambiguation ---------------------------------------------
 
 
tests/unit/cli/test_train_prompt_repl_coverage.py (modified)
16 lines changed
@@ -284,6 +284,16 @@ class TestTrainCommandCoverage:
         )
         assert _maybe_dispatch_multi_gpu("bogus", ["dlm", "train"], console) == 2
 
+        class _BadResolveGpuSpec:
+            def resolve(self, device_count: int) -> tuple[int, ...]:
+                raise UnsupportedGpuSpecError("gpu index 7 is unavailable")
+
+        monkeypatch.setattr(
+            "dlm.train.distributed.parse_gpus",
+            lambda raw: _BadResolveGpuSpec(),
+        )
+        assert _maybe_dispatch_multi_gpu("7", ["dlm", "train"], console) == 2
+
         monkeypatch.setattr("dlm.train.distributed.parse_gpus", lambda raw: _GpuSpec((0,)))
         import torch
 
tests/unit/cli/test_train_validation_edges.py (added)
217 lines changed
@@ -0,0 +1,217 @@
+"""Extra edge coverage for the early validation block in `dlm train`."""
+
+from __future__ import annotations
+
+from pathlib import Path
+from types import SimpleNamespace
+from typing import Any
+
+import pytest
+from typer.testing import CliRunner
+
+import dlm.base_models as base_models
+from dlm.base_models.errors import GatedModelError
+from dlm.cli.app import app
+from dlm.cli.scaffold import ScaffoldError
+from dlm.doc.errors import DlmParseError
+
+
+def _write_minimal_dlm(path: Path) -> None:
+    path.write_text(
+        "---\n"
+        "dlm_id: 01TRAINEDGE0000000000000000\n"
+        "base_model: smollm2-135m\n"
+        "training:\n"
+        "  seed: 42\n"
+        "---\n"
+        "body\n",
+        encoding="utf-8",
+    )
+
+
+def _parsed_doc(base_model: str = "smollm2-135m") -> object:
+    return SimpleNamespace(
+        frontmatter=SimpleNamespace(
+            base_model=base_model,
+            dlm_id="01TRAINEDGE0000000000000000",
+            training=SimpleNamespace(sequence_len=2048),
+        )
+    )
+
+
+def _resolved_spec(**overrides: Any) -> object:
+    defaults: dict[str, Any] = {
+        "key": "smollm2-135m",
+        "revision": "0123456789abcdef0123456789abcdef01234567",
+        "modality": "text",
+        "params": 135_000_000,
+        "effective_context_length": 2048,
+    }
+    defaults.update(overrides)
+    return SimpleNamespace(**defaults)
+
+
+class TestTrainValidationEdges:
+    def test_invalid_phase_refused(self, tmp_path: Path) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+
+        runner = CliRunner()
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path), "train", str(doc), "--phase", "bogus"],
+        )
+
+        assert result.exit_code == 2, result.output
+        assert "--phase must be one of sft|preference|all" in result.output
+
+    def test_resume_and_fresh_refused_together(self, tmp_path: Path) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+
+        runner = CliRunner()
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path), "train", str(doc), "--resume", "--fresh"],
+        )
+
+        assert result.exit_code == 2, result.output
+        assert "--resume and --fresh are mutually exclusive" in result.output
+
+    def test_invalid_policy_refused(self, tmp_path: Path) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+
+        runner = CliRunner()
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path), "train", str(doc), "--policy", "bogus"],
+        )
+
+        assert result.exit_code == 2, result.output
+        assert "--policy must be 'permissive' or 'strict'" in result.output
+
+    def test_multi_gpu_exit_code_propagates(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+        seen: dict[str, object] = {}
+
+        monkeypatch.setattr(
+            "dlm.hardware.capabilities.probe",
+            lambda: SimpleNamespace(supports_bf16=False),
+        )
+
+        def _fake_dispatch(
+            gpus: str,
+            argv: list[str],
+            console: object,
+            *,
+            mixed_precision: str = "bf16",
+        ) -> int | None:
+            seen["gpus"] = gpus
+            seen["argv"] = argv
+            seen["mixed_precision"] = mixed_precision
+            return 17
+
+        monkeypatch.setattr("dlm.cli.commands._maybe_dispatch_multi_gpu", _fake_dispatch)
+
+        runner = CliRunner()
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path), "train", str(doc), "--gpus", "0,1"],
+        )
+
+        assert result.exit_code == 17, result.output
+        assert seen["gpus"] == "0,1"
+        assert seen["mixed_precision"] == "fp16"
+
+    def test_scaffold_error_exits_cleanly(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        target = tmp_path / "corpus"
+        target.mkdir()
+
+        def _fake_scaffold(*args: object, **kwargs: object) -> object:
+            raise ScaffoldError("bad scaffold", path=target)
+
+        monkeypatch.setattr("dlm.cli.scaffold.scaffold_train_target", _fake_scaffold)
+
+        runner = CliRunner()
+        result = runner.invoke(
+            app,
+            ["--home", str(tmp_path), "train", str(target), "--base", "smollm2-135m"],
+        )
+
+        assert result.exit_code == 1, result.output
+        assert "bad scaffold" in result.output
+
+    def test_parse_error_exits_cleanly(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+        monkeypatch.setattr(
+            "dlm.doc.parser.parse_file",
+            lambda path: (_ for _ in ()).throw(
+                DlmParseError("broken frontmatter", path=doc, line=2, col=1)
+            ),
+        )
+
+        runner = CliRunner()
+        result = runner.invoke(app, ["--home", str(tmp_path), "train", str(doc)])
+
+        assert result.exit_code == 1, result.output
+        assert "broken frontmatter" in result.output
+
+    def test_gated_base_refusal_surfaces_license_pointer(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+
+        monkeypatch.setattr("dlm.doc.parser.parse_file", lambda path: _parsed_doc("llama-3.2-1b"))
+
+        def _fake_resolve(
+            base: str,
+            *,
+            accept_license: bool = False,
+            skip_export_probes: bool = False,
+        ) -> object:
+            raise GatedModelError(base, "https://example.test/license")
+
+        monkeypatch.setattr(base_models, "resolve", _fake_resolve)
+
+        runner = CliRunner()
+        result = runner.invoke(app, ["--home", str(tmp_path), "train", str(doc)])
+
+        assert result.exit_code == 1, result.output
+        text = " ".join(result.output.split())
+        assert "base model 'llama-3.2-1b' is gated" in text
+        assert "https://example.test/license" in text
+        assert "--i-accept-license" in text
+
+    def test_doctor_no_plan_refused(self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+
+        monkeypatch.setattr("dlm.doc.parser.parse_file", lambda path: _parsed_doc())
+        monkeypatch.setattr(base_models, "resolve", lambda *args, **kwargs: _resolved_spec())
+        monkeypatch.setattr("dlm.train.distributed.detect_world_size", lambda: 1)
+        monkeypatch.setattr(
+            "dlm.hardware.doctor",
+            lambda **kwargs: SimpleNamespace(plan=None, capabilities=object()),
+        )
+
+        runner = CliRunner()
+        result = runner.invoke(app, ["--home", str(tmp_path), "train", str(doc)])
+
+        assert result.exit_code == 1, result.output
+        assert "no viable training plan for this host" in result.output
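Helpers like `_parsed_doc` and `_resolved_spec` above fake out rich domain objects with nothing but `types.SimpleNamespace`, which gives plain attribute access without defining a class. A dependency-free sketch of the pattern (shapes mirror the test stubs, not the real dlm types):

```python
from types import SimpleNamespace

# Hypothetical stand-ins: a parsed doc exposes nested .frontmatter
# attributes, a resolved spec exposes flat fields. SimpleNamespace
# nests freely, so deep attribute chains work like the real objects.
doc = SimpleNamespace(
    frontmatter=SimpleNamespace(
        base_model="smollm2-135m",
        training=SimpleNamespace(sequence_len=2048),
    )
)
spec = SimpleNamespace(key="smollm2-135m", modality="text", params=135_000_000)

# Attribute access is all the code under test needs, so no class
# definitions or mocking library are required.
assert doc.frontmatter.training.sequence_len == 2048
```

The trade-off is that SimpleNamespace enforces no schema, so a stub can silently drift from the real type; these tests accept that in exchange for brevity.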
tests/unit/cli/test_train_watch_edges.py (added)
260 lines changed
@@ -0,0 +1,260 @@
+"""Additional `dlm train` coverage for lock-mode and watch-loop tails."""
+
+from __future__ import annotations
+
+from pathlib import Path
+from types import SimpleNamespace
+
+import pytest
+from typer.testing import CliRunner
+
+import dlm.base_models as base_models
+from dlm.cli.app import app
+from dlm.modality.errors import ModalityError
+from dlm.watch.loop import CycleResult
+
+
+def _write_minimal_dlm(path: Path) -> None:
+    path.write_text(
+        "---\n"
+        "dlm_id: 01TRAINWATCH00000000000000\n"
+        "base_model: smollm2-135m\n"
+        "training:\n"
+        "  seed: 42\n"
+        "---\n"
+        "body\n",
+        encoding="utf-8",
+    )
+
+
+def _parsed_doc() -> object:
+    return SimpleNamespace(
+        frontmatter=SimpleNamespace(
+            base_model="smollm2-135m",
+            dlm_id="01TRAINWATCH00000000000000",
+            training=SimpleNamespace(sequence_len=2048),
+        ),
+        sections=[SimpleNamespace(content="body")],
+    )
+
+
+def _resolved_spec() -> object:
+    return SimpleNamespace(
+        key="smollm2-135m",
+        revision="0123456789abcdef0123456789abcdef01234567",
+        modality="text",
+        params=135_000_000,
+        effective_context_length=2048,
+    )
+
+
+def _fake_phase_result(tmp_path: Path) -> object:
+    result = SimpleNamespace(
+        adapter_version=1,
+        steps=3,
+        seed=42,
+        determinism=SimpleNamespace(class_="strict"),
+        adapter_path=tmp_path / "adapter",
+        log_path=tmp_path / "train.jsonl",
+        final_train_loss=0.25,
+        final_val_loss=0.1,
+    )
+    return SimpleNamespace(phase="sft", result=result)
+
+
+def _install_train_basics(monkeypatch: pytest.MonkeyPatch) -> None:
+    monkeypatch.setattr("dlm.doc.parser.parse_file", lambda path: _parsed_doc())
+    monkeypatch.setattr(base_models, "resolve", lambda *args, **kwargs: _resolved_spec())
+    monkeypatch.setattr("dlm.train.distributed.detect_world_size", lambda: 1)
+    monkeypatch.setattr(
+        "dlm.hardware.doctor",
+        lambda **kwargs: SimpleNamespace(plan=object(), capabilities=object()),
+    )
+
+
+class TestTrainLockModeEdges:
+    @pytest.mark.parametrize(
+        ("flag", "expected"),
+        [
+            ("--strict-lock", "strict"),
+            ("--update-lock", "update"),
+            ("--ignore-lock", "ignore"),
+        ],
+    )
+    def test_single_lock_flags_propagate_to_run_phases(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+        flag: str,
+        expected: str,
+    ) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+        _install_train_basics(monkeypatch)
+        captured: dict[str, object] = {}
+
+        def _fake_run_phases(*args: object, **kwargs: object) -> list[object]:
+            captured["lock_mode"] = kwargs["lock_mode"]
+            return []
+
+        monkeypatch.setattr("dlm.train.preference.phase_orchestrator.run_phases", _fake_run_phases)
+
+        result = CliRunner().invoke(
+            app,
+            ["--home", str(tmp_path), "train", str(doc), flag],
+        )
+
+        assert result.exit_code == 0, result.output
+        assert captured["lock_mode"] == expected
+
+
+class TestTrainWatchEdges:
+    def test_modality_error_maps_to_training_prefix(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+        _install_train_basics(monkeypatch)
+        monkeypatch.setattr(
+            "dlm.train.preference.phase_orchestrator.run_phases",
+            lambda *args, **kwargs: (_ for _ in ()).throw(
+                ModalityError("processor contract failed")
+            ),
+        )
+
+        result = CliRunner().invoke(app, ["--home", str(tmp_path), "train", str(doc)])
+
+        assert result.exit_code == 1, result.output
+        assert "training:" in result.output
+        assert "processor contract failed" in result.output
+
+    def test_watch_rpc_logs_cycle_and_skip_messages(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+        _install_train_basics(monkeypatch)
+        monkeypatch.setenv("DLM_PROBE_TOKEN", "secret")
+        fake_phase = _fake_phase_result(tmp_path)
+
+        class _FakeQueue:
+            capacity = 5
+
+            def drain(self) -> list[object]:
+                return []
+
+        class _FakeServer:
+            def __init__(self, *, host: str, port: int, token: str, queue: object) -> None:
+                self.address = (host, port)
+                self.start_calls = 0
+                self.stop_calls = 0
+
+            def start(self) -> None:
+                self.start_calls += 1
+
+            def stop(self) -> None:
+                self.stop_calls += 1
+
+        def _fake_watch(**kwargs: object) -> int:
+            on_cycle = kwargs["on_cycle"]
+            on_cycle(
+                CycleResult(
+                    ran=True,
+                    new_sections=1,
+                    removed_sections=0,
+                    run_result=SimpleNamespace(final_train_loss=0.2, final_val_loss=0.1, steps=4),
+                )
+            )
+            on_cycle(CycleResult(ran=False, new_sections=0, removed_sections=0))
+            return 23
+
+        monkeypatch.setattr(
+            "dlm.train.preference.phase_orchestrator.run_phases",
+            lambda *args, **kwargs: [fake_phase],
+        )
+        monkeypatch.setattr("dlm.train.inject.InjectedProbeQueue", _FakeQueue)
+        monkeypatch.setattr("dlm.train.rpc.ProbeRpcServer", _FakeServer)
+        monkeypatch.setattr("dlm.watch.loop.run_watch", _fake_watch)
+
+        result = CliRunner().invoke(
+            app,
+            [
+                "--home",
+                str(tmp_path),
+                "train",
+                str(doc),
+                "--watch",
+                "--listen-rpc",
+                "127.0.0.1:7777",
+            ],
+        )
+
+        assert result.exit_code == 23, result.output
+        normalized = " ".join(result.output.split())
+        assert "rpc:" in normalized
+        assert "watch:" in normalized
+        assert "no new content, skipping retrain" in normalized
+
+    def test_watch_keyboard_interrupt_stops_server_and_exits_zero(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        doc = tmp_path / "doc.dlm"
+        _write_minimal_dlm(doc)
+        _install_train_basics(monkeypatch)
+        monkeypatch.setenv("DLM_PROBE_TOKEN", "secret")
+        fake_phase = _fake_phase_result(tmp_path)
+        holder: dict[str, object] = {}
+
+        class _FakeQueue:
+            capacity = 3
+
+            def drain(self) -> list[object]:
+                return []
+
+        class _FakeServer:
+            def __init__(self, *, host: str, port: int, token: str, queue: object) -> None:
+                self.address = (host, port)
+                self.stop_calls = 0
+                holder["server"] = self
+
+            def start(self) -> None:
+                return None
+
+            def stop(self) -> None:
+                self.stop_calls += 1
+
+        monkeypatch.setattr(
+            "dlm.train.preference.phase_orchestrator.run_phases",
+            lambda *args, **kwargs: [fake_phase],
+        )
+        monkeypatch.setattr("dlm.train.inject.InjectedProbeQueue", _FakeQueue)
+        monkeypatch.setattr("dlm.train.rpc.ProbeRpcServer", _FakeServer)
+        monkeypatch.setattr(
+            "dlm.watch.loop.run_watch",
+            lambda **kwargs: (_ for _ in ()).throw(KeyboardInterrupt),
+        )
+
+        result = CliRunner().invoke(
+            app,
+            [
+                "--home",
+                str(tmp_path),
+                "train",
+                str(doc),
+                "--watch",
+                "--listen-rpc",
+                "127.0.0.1:7777",
+            ],
+        )
+
+        assert result.exit_code == 0, result.output
+        assert "Ctrl-C received, exiting" in result.output
+        server = holder["server"]
+        assert isinstance(server, _FakeServer)
+        assert server.stop_calls == 2
tests/unit/control/test_apply.py (modified)
49 lines changed
@@ -8,6 +8,7 @@ import torch
 from torch import nn
 
 from dlm.control import ControlApplyError, apply_control
+from dlm.control.apply import _make_hook
 
 
 class _ToyLayer(nn.Module):
@@ -43,6 +44,12 @@ def _run_through_layer(model: _ToyModel, layer_index: int, hidden: torch.Tensor)
 
 
 class TestHookArithmetic:
+    def test_hook_with_no_args_returns_original_tuple(self) -> None:
+        hook = _make_hook(torch.ones(4), 1.0)
+        empty: tuple[object, ...] = ()
+
+        assert hook(None, empty) == empty
+
     def test_adds_scaled_vector_to_hidden(self) -> None:
         model = _ToyModel(n_layers=4, hidden_dim=8)
         vector = np.ones(8, dtype=np.float32)
@@ -177,3 +184,30 @@ class TestValidation:
         with apply_control(wrapped, vector, layer_index=2, strength=1.0):
             out = _run_through_layer(inner, 2, hidden)
         assert torch.allclose(out, torch.ones_like(out))
+
+    def test_falls_through_sparse_projection_paths(self) -> None:
+        class _SparseProjLayer(nn.Module):
+            def __init__(self, hidden_dim: int) -> None:
+                super().__init__()
+                self.self_attn = nn.Module()
+                self.self_attn.q_proj = nn.Module()
+                self.attn = nn.Module()
+                self.attn.qkv_proj = nn.Linear(hidden_dim, hidden_dim, bias=False)
+
+            def forward(self, hidden: torch.Tensor) -> torch.Tensor:
+                return hidden
+
+        class _SparseProjModel(nn.Module):
+            def __init__(self, hidden_dim: int) -> None:
+                super().__init__()
+                self.model = nn.Module()
+                self.model.layers = nn.ModuleList([_SparseProjLayer(hidden_dim)])
+
+        model = _SparseProjModel(hidden_dim=4)
+        vector = np.array([1.0, 0.0, 0.0, 0.0], dtype=np.float32)
+        hidden = torch.zeros(1, 1, 4)
+
+        with apply_control(model, vector, layer_index=0, strength=1.0):
+            out = model.model.layers[0](hidden)
+
+        assert out[0, 0, 0].item() == 1.0
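The `_make_hook` tests above exercise a hook of the usual forward-pre-hook shape: it receives `(module, args)` and returns an args tuple with the steering vector added to the hidden state, passing empty args through untouched. A dependency-free sketch of that contract (names and list-based arithmetic are illustrative, not the dlm implementation, which operates on tensors):

```python
def make_hook(vector, strength):
    # Forward-pre-hook shape: (module, args) -> args. With no
    # positional args there is no hidden state to steer, so the
    # original (empty) tuple is returned unchanged.
    def hook(module, args):
        if not args:
            return args
        hidden, *rest = args
        # Add the scaled steering vector element-wise to the hidden state.
        steered = [h + strength * v for h, v in zip(hidden, vector)]
        return (steered, *rest)

    return hook

hook = make_hook([1.0, 0.0], strength=2.0)
assert hook(None, ()) == ()
assert hook(None, ([0.0, 0.0],)) == ([2.0, 0.0],)
```

Returning the empty tuple unchanged is the edge branch `test_hook_with_no_args_returns_original_tuple` pins down: a hook must never invent arguments the wrapped module was not called with.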
tests/unit/data/test_audio_cache.py (modified)
36 lines changed
@@ -183,6 +183,36 @@ class TestProcessorSha256:
         proc_b = SimpleNamespace(feature_extractor=FeB())
         assert processor_sha256(proc_a) != processor_sha256(proc_b)
 
+    def test_nested_feature_extractor_fields_are_readable(self) -> None:
+        proc = SimpleNamespace(
+            feature_extractor=SimpleNamespace(
+                sampling_rate=16_000,
+                feature_size=(80, 2),
+                n_fft=400,
+                hop_length=160,
+                chunk_length={"seconds": 30},
+                padding_value=0.0,
+                return_attention_mask=True,
+            )
+        )
+        sha = processor_sha256(proc)
+        assert len(sha) == 64
+
+    def test_exotic_feature_field_stringifies_stably(self) -> None:
+        proc = SimpleNamespace(
+            feature_extractor=SimpleNamespace(
+                sampling_rate=16_000,
+                feature_size=80,
+                n_fft=400,
+                hop_length=160,
+                chunk_length=object(),
+                padding_value=0.0,
+                return_attention_mask=True,
+            )
+        )
+        sha = processor_sha256(proc)
+        assert len(sha) == 64
+
 
 # --- WaveformCache (35.2 deferred-item follow-up) ---------------------------
 
tests/unit/data/test_audio_resample.py (modified)
121 lines changed
@@ -10,8 +10,9 @@ Covers:
 
 from __future__ import annotations
 
+import builtins
 import sys
-from types import SimpleNamespace
+from types import ModuleType, SimpleNamespace
 
 import numpy as np
 import pytest
@@ -42,24 +43,17 @@ class TestBackendPickFailure:
     def test_no_backend_raises(self, monkeypatch: pytest.MonkeyPatch) -> None:
         """Force both imports to fail and confirm the error names both paths."""
 
-        real_import = (
-            __builtins__["__import__"]
-            if isinstance(__builtins__, dict)
-            else __builtins__.__import__
-        )
+        real_import = builtins.__import__
 
         def fake_import(name: str, *args: object, **kwargs: object) -> object:
             if name in ("soxr", "scipy", "scipy.signal"):
                 raise ImportError(f"forced: {name}")
-            return real_import(name, *args, **kwargs)  # type: ignore[operator]
+            return real_import(name, *args, **kwargs)
 
-        monkeypatch.setitem(sys.modules, "soxr", None)
-        # Monkey-patch the _pick_backend helper's import probes so both
-        # attempts fail regardless of what's installed in the env.
-        monkeypatch.setattr(audio_resample, "_pick_backend", _no_backend)
+        monkeypatch.setattr(builtins, "__import__", fake_import)
 
         with pytest.raises(AudioResampleUnavailable, match="soxr or scipy"):
-            resample(np.zeros(8, dtype=np.float32), src_sr=48_000, dst_sr=16_000)
+            audio_resample._pick_backend()
 
 
 def _no_backend() -> None:
@@ -71,21 +65,73 @@ def _no_backend() -> None:
 
 
 class TestScipyBackend:
-    def test_scipy_fallback_resamples(self, monkeypatch: pytest.MonkeyPatch) -> None:
-        """With soxr disabled, scipy fallback produces expected length."""
-        # Pretend soxr isn't importable so the pick falls through to scipy.
-        monkeypatch.setitem(sys.modules, "soxr", None)
+    def test_resample_routes_through_selected_backend(
+        self, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        called: dict[str, object] = {}
 
-        pytest.importorskip("scipy.signal")
+        def fake_backend(waveform: np.ndarray, *, src_sr: int, dst_sr: int) -> np.ndarray:
74
+            called["waveform"] = waveform
75
+            called["src_sr"] = src_sr
76
+            called["dst_sr"] = dst_sr
77
+            return np.ones(4, dtype=np.float32)
8078
 
81
-        # 1 second of 8 kHz silence → resample to 16 kHz = 2 s of samples.
82
-        wave = np.zeros(8_000, dtype=np.float32)
79
+        wave = np.zeros(8, dtype=np.float32)
80
+        monkeypatch.setattr(audio_resample, "_pick_backend", lambda: fake_backend)
8381
         out = resample(wave, src_sr=8_000, dst_sr=16_000)
8482
 
83
+        assert out.tolist() == [1.0, 1.0, 1.0, 1.0]
84
+        assert called == {"waveform": wave, "src_sr": 8_000, "dst_sr": 16_000}
85
+
86
+    def test_scipy_fallback_uses_fake_module(self, monkeypatch: pytest.MonkeyPatch) -> None:
87
+        """With soxr disabled, _pick_backend falls through to scipy."""
88
+        monkeypatch.setitem(sys.modules, "soxr", None)
89
+        fake_signal = ModuleType("scipy.signal")
90
+        fake_signal.resample_poly = lambda waveform, *, up, down: np.repeat(waveform, up)[
91
+            : len(waveform) * up // down
92
+        ]
93
+        fake_scipy = ModuleType("scipy")
94
+        fake_scipy.signal = fake_signal
95
+        monkeypatch.setitem(sys.modules, "scipy", fake_scipy)
96
+        monkeypatch.setitem(sys.modules, "scipy.signal", fake_signal)
97
+
98
+        backend = audio_resample._pick_backend()
99
+        assert backend is audio_resample._scipy_resample
100
+
101
+    def test_soxr_backend_coerces_float32_contiguous(self, monkeypatch: pytest.MonkeyPatch) -> None:
102
+        fake_soxr = ModuleType("soxr")
103
+        fake_soxr.resample = lambda waveform, src_sr, dst_sr, quality="HQ": np.asarray(
104
+            waveform * 2, dtype=np.float64
105
+        )
106
+        monkeypatch.setitem(sys.modules, "soxr", fake_soxr)
107
+
108
+        wave = np.arange(6, dtype=np.float32)[::2]
109
+        out = audio_resample._soxr_resample(wave, src_sr=8_000, dst_sr=16_000)
110
+
111
+        assert out.dtype == np.float32
112
+        assert out.flags.c_contiguous
113
+        assert out.tolist() == [0.0, 4.0, 8.0]
114
+
115
+    def test_scipy_backend_reduces_ratio_before_call(self, monkeypatch: pytest.MonkeyPatch) -> None:
116
+        calls: dict[str, object] = {}
117
+
118
+        def fake_resample_poly(waveform: np.ndarray, *, up: int, down: int) -> np.ndarray:
119
+            calls["up"] = up
120
+            calls["down"] = down
121
+            return np.asarray(waveform + 1, dtype=np.float64)
122
+
123
+        fake_signal = ModuleType("scipy.signal")
124
+        fake_signal.resample_poly = fake_resample_poly
125
+        fake_scipy = ModuleType("scipy")
126
+        fake_scipy.signal = fake_signal
127
+        monkeypatch.setitem(sys.modules, "scipy", fake_scipy)
128
+        monkeypatch.setitem(sys.modules, "scipy.signal", fake_signal)
129
+
130
+        wave = np.arange(5, dtype=np.float32)
131
+        out = audio_resample._scipy_resample(wave, src_sr=48_000, dst_sr=16_000)
132
+
133
+        assert calls == {"up": 1, "down": 3}
85134
         assert out.dtype == np.float32
86
-        # resample_poly produces len(x) * up // down on integer ratios.
87
-        # scipy rounds up-or-down depending on filter length; accept ±1.
88
-        assert abs(out.shape[0] - 16_000) <= 1
89135
         assert out.flags.c_contiguous
90136
 
91137
 
tests/unit/data/test_dataset_builder.py (modified, 20 lines changed)
@@ -55,3 +55,20 @@ class TestBuildDataset:
         sections = [_s(SectionType.PROSE, "   ")]
         with pytest.raises(ValueError, match="no trainable rows"):
             build_dataset(sections, seed=0, val_frac=0.1)
+
+    def test_weights_dropping_every_row_raises(self) -> None:
+        replay = [
+            {
+                "text": "replay-only",
+                "_dlm_section_id": "replay-v1",
+                "_dlm_row_tags": {"lang": "en"},
+            },
+        ]
+        with pytest.raises(ValueError, match="weights dropped every row"):
+            build_dataset(
+                [],
+                seed=0,
+                val_frac=0.1,
+                replay_rows=replay,
+                weights={"lang": {"en": 0.0}},
+            )
tests/unit/data/test_sections_to_rows.py (modified, 20 lines changed)
@@ -50,6 +50,20 @@ class TestInstructionShape:
         with pytest.raises(InstructionParseError):
             sections_to_rows([s])
 
+    def test_probe_markers_normalized_before_parse(self) -> None:
+        s = _s(SectionType.INSTRUCTION, "### Q !probe\nq1\n### A\na1")
+        rows = sections_to_rows([s])
+        assert rows == [
+            {
+                "messages": [
+                    {"role": "user", "content": "q1"},
+                    {"role": "assistant", "content": "a1"},
+                ],
+                "_dlm_section_id": s.section_id,
+                "_dlm_row_tags": {},
+            },
+        ]
+
 
 class TestPreferenceShape:
     def test_each_triple_becomes_preference_row(self) -> None:
tests/unit/data/test_vl_cache.py (modified, 33 lines changed)
@@ -146,3 +146,33 @@ class TestProcessorSha256:
             image_std = [0.5] * 3
 
         assert processor_sha256(ProcA()) != processor_sha256(ProcB())
+
+    def test_nested_dict_and_tuple_fields_are_readable(self) -> None:
+        proc = SimpleNamespace(
+            image_processor=SimpleNamespace(
+                size={"shortest_edge": 224, "crop": (224, 224)},
+                image_mean=(0.5, 0.5, 0.5),
+                image_std=[0.2, 0.2, 0.2],
+                do_normalize=True,
+                do_rescale=True,
+                rescale_factor=1 / 255,
+                resample="bicubic",
+            )
+        )
+        sha = processor_sha256(proc)
+        assert len(sha) == 64
+
+    def test_exotic_resample_value_stringifies_stably(self) -> None:
+        proc = SimpleNamespace(
+            image_processor=SimpleNamespace(
+                size={"shortest_edge": 224},
+                image_mean=[0.5] * 3,
+                image_std=[0.5] * 3,
+                do_normalize=True,
+                do_rescale=True,
+                rescale_factor=1 / 255,
+                resample=object(),
+            )
+        )
+        sha = processor_sha256(proc)
+        assert len(sha) == 64
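Both cache test files (audio and VL) drive a processor fingerprint that must digest nested dicts and tuples and still produce a stable 64-char hex digest when a field holds an exotic value like `object()`. A hedged sketch of that hashing idea — the field handling and helper name here are illustrative, not the project's actual `processor_sha256`:

```python
import hashlib


def fingerprint_fields(fields: dict[str, object]) -> str:
    """Hash a processor's config fields into a stable 64-char hex digest."""

    def stringify(value: object) -> str:
        # Primitive leaves (and nested dicts/lists/tuples of them) repr
        # deterministically; anything exotic collapses to its type name so
        # the digest never depends on a memory address.
        if isinstance(value, (dict, list, tuple, str, int, float, bool)) or value is None:
            return repr(value)
        return f"<{type(value).__name__}>"

    payload = "|".join(f"{k}={stringify(v)}" for k, v in sorted(fields.items()))
    return hashlib.sha256(payload.encode("utf-8")).hexdigest()
```

The key property the tests assert: the digest is always well-formed (64 hex chars) and two processors differing only by an `object()` sentinel hash identically run to run.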
tests/unit/data/test_weighted_rows.py (modified, 41 lines changed)
@@ -3,7 +3,9 @@
 from __future__ import annotations
 
 from dlm.data.weighted_rows import (
+    _keep_fraction,
     expand_rows_by_weight,
+    merge_weights_maps,
     resolve_row_weight,
     weight_distribution,
 )
@@ -105,6 +107,32 @@ class TestExpandRowsByWeight:
         assert len(out) == 6
 
 
+class TestMergeWeightsMaps:
+    def test_empty_sequence_returns_empty_map(self) -> None:
+        assert merge_weights_maps([]) == {}
+
+    def test_deeper_entries_override_shallower_ones(self) -> None:
+        merged = merge_weights_maps(
+            [
+                {"lang": {"py": 2.0, "rs": 1.5}, "gen": {"true": 0.5}},
+                {"lang": {"py": 3.0}, "new": {"x": 4.0}},
+            ]
+        )
+        assert merged == {
+            "lang": {"py": 3.0, "rs": 1.5},
+            "gen": {"true": 0.5},
+            "new": {"x": 4.0},
+        }
+
+
+class TestKeepFraction:
+    def test_non_positive_fraction_never_keeps(self) -> None:
+        assert _keep_fraction("sid", seed=42, fractional=0.0) is False
+
+    def test_fraction_at_or_above_one_always_keeps(self) -> None:
+        assert _keep_fraction("sid", seed=42, fractional=1.0) is True
+
+
 class TestWeightDistribution:
     def test_empty_rows_empty_dist(self) -> None:
         assert weight_distribution([]) == {}
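The new `TestMergeWeightsMaps` cases pin down the merge semantics: later maps win at the leaf level while sibling keys from earlier maps survive. A minimal sketch consistent with those assertions, assuming the two-level `str -> str -> float` shape the tests use (the project's real `merge_weights_maps` may differ):

```python
from collections.abc import Iterable


def merge_weights_maps(
    maps: Iterable[dict[str, dict[str, float]]],
) -> dict[str, dict[str, float]]:
    """Merge weight maps left to right; later leaf values override earlier ones."""
    merged: dict[str, dict[str, float]] = {}
    for weights in maps:
        for tag, values in weights.items():
            # Update per-tag so untouched leaves under the same tag survive.
            merged.setdefault(tag, {}).update(values)
    return merged
```

The `setdefault(...).update(...)` step is what distinguishes this from a shallow `dict.update`, which would have clobbered `{"rs": 1.5}` when the second map redefined `"lang"`.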
tests/unit/directives/test_cache.py (modified, 206 lines changed)
@@ -31,6 +31,7 @@ class TestOpen:
 
     def test_empty_cache(self, tmp_path: Path) -> None:
         cache = TokenizedCache.open(tmp_path / "c")
+        assert cache.root == tmp_path / "c"
         assert cache.entry_count == 0
         assert cache.total_bytes == 0
 
@@ -47,6 +48,94 @@ class TestOpen:
         assert cache.entry_count == 0
         assert any("unreadable" in rec.message for rec in caplog.records)
 
+    def test_manifest_version_mismatch_starts_fresh(
+        self,
+        tmp_path: Path,
+        caplog: pytest.LogCaptureFixture,
+    ) -> None:
+        import json
+        import logging
+
+        root = tmp_path / "c"
+        root.mkdir()
+        (root / "manifest.json").write_text(
+            json.dumps({"version": 999, "entries": {}}),
+            encoding="utf-8",
+        )
+        caplog.set_level(logging.WARNING, logger="dlm.directives.cache")
+        cache = TokenizedCache.open(root)
+        assert cache.entry_count == 0
+        assert "version mismatch" in caplog.text
+
+    def test_non_mapping_entries_starts_fresh(self, tmp_path: Path) -> None:
+        import json
+
+        root = tmp_path / "c"
+        root.mkdir()
+        (root / "manifest.json").write_text(
+            json.dumps({"version": 1, "entries": []}),
+            encoding="utf-8",
+        )
+        cache = TokenizedCache.open(root)
+        assert cache.entry_count == 0
+
+    def test_malformed_manifest_entry_is_skipped(
+        self,
+        tmp_path: Path,
+        caplog: pytest.LogCaptureFixture,
+    ) -> None:
+        import json
+        import logging
+
+        root = tmp_path / "c"
+        root.mkdir()
+        (root / "manifest.json").write_text(
+            json.dumps(
+                {
+                    "version": 1,
+                    "entries": {
+                        "good": {
+                            "size": 4,
+                            "last_access_ts": 1.0,
+                            "shard": "aa",
+                            "filename": "good.npz",
+                            "tokenizer_sha": "a" * 64,
+                        },
+                        "bad": {
+                            "size": "not-an-int",
+                            "last_access_ts": 1.0,
+                            "shard": "bb",
+                            "filename": "bad.npz",
+                        },
+                    },
+                }
+            ),
+            encoding="utf-8",
+        )
+        caplog.set_level(logging.WARNING, logger="dlm.directives.cache")
+        cache = TokenizedCache.open(root)
+        assert cache.entry_count == 1
+        assert "skipping malformed entry" in caplog.text
+
+    def test_non_mapping_manifest_entry_is_ignored(self, tmp_path: Path) -> None:
+        import json
+
+        root = tmp_path / "c"
+        root.mkdir()
+        (root / "manifest.json").write_text(
+            json.dumps(
+                {
+                    "version": 1,
+                    "entries": {
+                        "bad": "not-a-dict",
+                    },
+                }
+            ),
+            encoding="utf-8",
+        )
+        cache = TokenizedCache.open(root)
+        assert cache.entry_count == 0
+
 
 class TestGetPut:
     def test_miss_then_hit(self, tmp_path: Path) -> None:
@@ -81,6 +170,68 @@ class TestGetPut:
         assert cache2.entry_count == 1
         assert cache2.get(key) is not None
 
+    def test_hit_rate_zero_when_no_lookups(self, tmp_path: Path) -> None:
+        cache = TokenizedCache.open(tmp_path / "c")
+        assert cache.hit_rate == 0.0
+
+    def test_corrupt_entry_recovers(
+        self,
+        tmp_path: Path,
+        caplog: pytest.LogCaptureFixture,
+    ) -> None:
+        import logging
+
+        cache = TokenizedCache.open(tmp_path / "c")
+        key = _key()
+        cache.put(key, _tokens(4))
+        entry_file = next((tmp_path / "c" / "entries").rglob("*.npz"))
+        entry_file.write_bytes(b"not a real npz")
+
+        caplog.set_level(logging.WARNING, logger="dlm.directives.cache")
+        assert cache.get(key) is None
+        assert cache.entry_count == 0
+        assert "corrupt entry" in caplog.text
+
+    def test_put_write_failure_drops_entry(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+        caplog: pytest.LogCaptureFixture,
+    ) -> None:
+        import logging
+
+        cache = TokenizedCache.open(tmp_path / "c")
+
+        def _boom(*_args: object, **_kwargs: object) -> None:
+            raise OSError("disk full")
+
+        monkeypatch.setattr("numpy.savez_compressed", _boom)
+        caplog.set_level(logging.WARNING, logger="dlm.directives.cache")
+        cache.put(_key(), _tokens(4))
+
+        assert cache.entry_count == 0
+        assert list((tmp_path / "c" / "entries").rglob("*.tmp")) == []
+        assert "write failed" in caplog.text
+
+    def test_put_stat_failure_records_zero_sized_entry(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        cache = TokenizedCache.open(tmp_path / "c")
+        real_stat = Path.stat
+
+        def _patched_stat(path: Path, *, follow_symlinks: bool = True) -> object:
+            if path.suffix == ".tmp":
+                raise OSError("no stat")
+            return real_stat(path, follow_symlinks=follow_symlinks)
+
+        monkeypatch.setattr(Path, "stat", _patched_stat)
+        cache.put(_key(), _tokens(4))
+
+        assert cache.entry_count == 1
+        assert cache.total_bytes == 0
+
 
 class TestInvalidation:
     def test_different_tokenizer_sha_misses(self, tmp_path: Path) -> None:
@@ -150,6 +301,37 @@ class TestLRUEviction:
         assert cache.get(key_a) is not None
         assert cache.get(key_b) is not None
 
+    def test_eviction_stops_once_under_budget(self, tmp_path: Path) -> None:
+        import time
+
+        cache = TokenizedCache.open(tmp_path / "c", max_bytes=10_000_000)
+        key_a = _key("aa" * 8)
+        key_b = _key("bb" * 8)
+        key_c = _key("cc" * 8)
+
+        cache.put(key_a, _tokens(20))
+        size_a = next(
+            entry.size
+            for entry in cache._manifest.values()
+            if entry.filename == key_a.as_filename()
+        )
+        cache._touched_this_run.clear()
+        time.sleep(0.01)
+        cache.put(key_b, _tokens(20))
+        size_b = next(
+            entry.size
+            for entry in cache._manifest.values()
+            if entry.filename == key_b.as_filename()
+        )
+        cache._touched_this_run.clear()
+
+        cache._max_bytes = size_a + size_b
+        cache.put(key_c, _tokens(20))
+
+        assert cache.get(key_a) is None
+        assert cache.get(key_b) is not None
+        assert cache.get(key_c) is not None
+
 
 class TestPruneClear:
     def test_prune_removes_old_entries(self, tmp_path: Path) -> None:
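`test_eviction_stops_once_under_budget` checks the LRU loop's stopping condition: oldest-accessed entries are dropped one at a time, and eviction halts the moment total size fits the budget (so `key_b` survives even though `key_a` goes). A sketch of that loop under an assumed entry shape of `{"size": int, "last_access_ts": float}` — the cache's real manifest entries are richer:

```python
def evict_until_under_budget(entries: dict[str, dict], max_bytes: int) -> list[str]:
    """Drop least-recently-accessed entries until total size <= max_bytes."""
    evicted: list[str] = []
    total = sum(e["size"] for e in entries.values())
    # Oldest access timestamp first == least recently used.
    for key in sorted(entries, key=lambda k: entries[k]["last_access_ts"]):
        if total <= max_bytes:
            break  # stop as soon as we are back under budget
        total -= entries[key]["size"]
        del entries[key]
        evicted.append(key)
    return evicted
```

Setting the budget to exactly `size_a + size_b` before inserting `key_c`, as the test does, is what forces precisely one eviction and proves the loop does not over-evict.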
tests/unit/directives/test_cache_key.py (modified, 28 lines changed)
@@ -54,11 +54,18 @@ class _FakeBackendTokenizer:
         return self._canonical
 
 
+class _BrokenBackendTokenizer:
+    def to_str(self) -> str:
+        raise RuntimeError("boom")
+
+
 class _FakeTokenizer:
     """Minimal shape for tokenizer_sha256 — just enough attrs."""
 
     def __init__(self, *, canonical: str | None = None, vocab_size: int = 32000) -> None:
-        self.backend_tokenizer = _FakeBackendTokenizer(canonical) if canonical else None
+        self.backend_tokenizer: object | None = (
+            _FakeBackendTokenizer(canonical) if canonical else None
+        )
         self.vocab_size = vocab_size
         self.model_max_length = 2048
         self.pad_token = "<pad>"
@@ -101,3 +108,9 @@ class TestTokenizerSha256:
         tok.backend_tokenizer = _FakeBackendTokenizer('{"v": 2}')
         sha2 = tokenizer_sha256(tok)
         assert sha1 == sha2
+
+    def test_backend_to_str_failure_falls_back_to_legacy(self) -> None:
+        tok = _FakeTokenizer()
+        tok.backend_tokenizer = _BrokenBackendTokenizer()
+        sha = tokenizer_sha256(tok)
+        assert len(sha) == 64
tests/unit/directives/test_discovery.py (modified, 58 lines changed)
@@ -27,6 +27,11 @@ def test_no_dlm_dirs_yields_empty(tmp_path: Path) -> None:
     assert discover_configs(tmp_path) == ()
 
 
+def test_non_directory_dot_dlm_is_ignored(tmp_path: Path) -> None:
+    (tmp_path / ".dlm").write_text("not a directory", encoding="utf-8")
+    assert discover_configs(tmp_path) == ()
+
+
 def test_single_dlm_at_root_with_both_files(tmp_path: Path) -> None:
     (tmp_path / ".dlm").mkdir()
     (tmp_path / ".dlm" / "training.yaml").write_text(
@@ -75,6 +80,18 @@ def test_malformed_yaml_logs_and_continues(
     assert any("invalid YAML" in rec.message for rec in caplog.records)
 
 
+def test_invalid_utf8_training_yaml_logs_and_continues(
+    tmp_path: Path,
+    caplog: pytest.LogCaptureFixture,
+) -> None:
+    (tmp_path / ".dlm").mkdir()
+    (tmp_path / ".dlm" / "training.yaml").write_bytes(b"caf\xe9\n")
+    caplog.set_level(logging.WARNING, logger="dlm.directives.discovery")
+    configs = discover_configs(tmp_path)
+    assert configs[0].config is None
+    assert any("not UTF-8" in rec.message for rec in caplog.records)
+
+
 def test_schema_violation_logs_and_continues(
     tmp_path: Path, caplog: pytest.LogCaptureFixture
 ) -> None:
@@ -97,6 +114,14 @@ def test_training_yaml_non_mapping_top_level(
     assert any("must be a mapping" in rec.message for rec in caplog.records)
 
 
+def test_training_yaml_null_top_level_coerces_to_empty_config(tmp_path: Path) -> None:
+    (tmp_path / ".dlm").mkdir()
+    (tmp_path / ".dlm" / "training.yaml").write_text("null\n", encoding="utf-8")
+    configs = discover_configs(tmp_path)
+    assert configs[0].config is not None
+    assert configs[0].config.dlm_training_version == 1
+
+
 def test_both_files_coexist(tmp_path: Path) -> None:
     (tmp_path / ".dlm").mkdir()
     (tmp_path / ".dlm" / "training.yaml").write_text("dlm_training_version: 1\nexclude: ['a']\n")
@@ -105,3 +130,15 @@ def test_both_files_coexist(tmp_path: Path) -> None:
     assert c.config is not None
     assert c.config.exclude == ("a",)
     assert len(c.ignore_rules) == 1
+
+
+def test_invalid_utf8_ignore_logs_and_continues(
+    tmp_path: Path,
+    caplog: pytest.LogCaptureFixture,
+) -> None:
+    (tmp_path / ".dlm").mkdir()
+    (tmp_path / ".dlm" / "ignore").write_bytes(b"bad-\xff\n")
+    caplog.set_level(logging.WARNING, logger="dlm.directives.discovery")
+    configs = discover_configs(tmp_path)
+    assert configs[0].ignore_rules == ()
+    assert any("not UTF-8" in rec.message for rec in caplog.records)
tests/unit/directives/test_expand.py (modified, 81 lines changed)
@@ -7,14 +7,17 @@ directives fast-path.
 
 from __future__ import annotations
 
+import os
 from pathlib import Path
 
 import pytest
 
 from dlm.directives import expand_sources
 from dlm.directives.errors import DirectivePathError, DirectivePolicyError
+from dlm.directives.expand import _iter_candidates
 from dlm.doc.parser import parse_text
 from dlm.doc.sections import SectionType
+from dlm.store.blobs import BlobStore
 
 _VALID_ULID = "01ABCDEFGHJKMNPQRSTVWXYZ00"
 
@@ -180,3 +183,64 @@ def test_single_file_directive(tmp_path: Path) -> None:
     result = expand_sources(parsed, base_path=tmp_path)  # type: ignore[arg-type]
     assert len(result.sections) == 1
     assert result.sections[0].content.startswith("# source: notes.md")
+
+
+def test_stat_failure_skips_file(tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> None:
+    src = tmp_path / "src"
+    src.mkdir()
+    target = src / "a.py"
+    target.write_text("print(1)\n", encoding="utf-8")
+    body = "  sources:\n    - path: src\n      include: ['**/*.py']\n"
+    parsed, _ = _make_parsed(body, tmp_path)
+    real_stat = Path.stat
+    seen_target = 0
+
+    def _patched_stat(path: Path, *, follow_symlinks: bool = True) -> os.stat_result:
+        nonlocal seen_target
+        if path == target:
+            seen_target += 1
+            if seen_target >= 2:
+                raise OSError("no stat")
+        return real_stat(path, follow_symlinks=follow_symlinks)
+
+    monkeypatch.setattr(Path, "stat", _patched_stat)
+    result = expand_sources(parsed, base_path=tmp_path)  # type: ignore[arg-type]
+    assert result.sections == ()
+
+
+def test_read_bytes_failure_skips_file(tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> None:
+    src = tmp_path / "src"
+    src.mkdir()
+    target = src / "a.py"
+    target.write_text("print(1)\n", encoding="utf-8")
+    body = "  sources:\n    - path: src\n      include: ['**/*.py']\n"
+    parsed, _ = _make_parsed(body, tmp_path)
+    real_read_bytes = Path.read_bytes
+
+    def _patched_read_bytes(path: Path, *args: object, **kwargs: object) -> bytes:
+        if path == target:
+            raise OSError("no read")
+        return real_read_bytes(path, *args, **kwargs)
+
+    monkeypatch.setattr(Path, "read_bytes", _patched_read_bytes)
+    result = expand_sources(parsed, base_path=tmp_path)  # type: ignore[arg-type]
+    assert result.sections == ()
+
+
+def test_audio_transcript_unreadable_skips_audio(tmp_path: Path) -> None:
+    corpus = tmp_path / "corpus"
+    corpus.mkdir()
+    (corpus / "clip.wav").write_bytes(b"RIFF....fake wav")
+    (corpus / "clip.txt").write_bytes(b"bad-\xff\n")
+    parsed, _ = _make_parsed(
+        '  sources:\n    - path: corpus\n      include: ["**/*.wav"]\n',
+        tmp_path,
+    )
+    blob_store = BlobStore(tmp_path / "blobs")
+    result = expand_sources(parsed, base_path=tmp_path, blob_store=blob_store)  # type: ignore[arg-type]
+    assert result.sections == ()
+    assert result.provenance[0].skipped_audio_no_transcript == 1
+
+
+def test_iter_candidates_non_file_non_dir_yields_nothing(tmp_path: Path) -> None:
+    assert list(_iter_candidates(tmp_path / "missing")) == []
tests/unit/directives/test_ignore_parser.py (modified, 13 lines changed)
@@ -68,6 +68,13 @@ def test_parse_bare_slash_skipped(caplog: pytest.LogCaptureFixture) -> None:
     assert any("bare '/'" in rec.message for rec in caplog.records)
 
 
+def test_parse_pattern_reduced_to_empty_skipped(caplog: pytest.LogCaptureFixture) -> None:
+    caplog.set_level(logging.WARNING, logger="dlm.directives.ignore_parser")
+    rules = parse_ignore_file("//\n")
+    assert rules == ()
+    assert any("pattern reduced to empty" in rec.message for rec in caplog.records)
+
+
 # ---- matches ---------------------------------------------------------------
 
 
tests/unit/directives/test_merge.py (modified, 32 lines changed)
@@ -119,6 +119,19 @@ def test_training_yaml_exclude_blocks_file(tmp_path: Path) -> None:
     )
 
 
+def test_parent_directive_exclude_blocks_file(tmp_path: Path) -> None:
+    _write(tmp_path / "src" / "main.py", "x")
+    directive = _directive(tmp_path, exclude=("**/*.py",))
+    configs = discover_configs(tmp_path)
+    eff = effective_config_for(
+        tmp_path / "src" / "main.py",
+        source_root=tmp_path,
+        discovered=configs,
+        parent_directive=directive,
+    )
+    assert eff.included is False
+
+
 # ---- .dlm/ignore negation --------------------------------------------------
 
 
@@ -266,3 +279,13 @@ def test_metadata_empty_when_no_training_yaml(tmp_path: Path) -> None:
         parent_directive=directive,
     )
     assert dict(eff.tags) == {}
+
+
+def test_relpath_falls_back_to_filename_for_non_ancestor_anchor(tmp_path: Path) -> None:
+    from dlm.directives.merge import _relpath
+
+    file_path = tmp_path / "src" / "main.py"
+    _write(file_path, "x")
+    other_anchor = tmp_path / "elsewhere"
+    other_anchor.mkdir()
+    assert _relpath(file_path, other_anchor) == "main.py"
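The final merge test asserts that `_relpath` degrades to the bare filename when the anchor directory is not an ancestor of the file. The standard-library way to get exactly that behavior is to catch the `ValueError` that `Path.relative_to` raises for non-subpaths — a sketch with an illustrative name, since the project's `_relpath` is private:

```python
from pathlib import Path


def relpath_or_name(file_path: Path, anchor: Path) -> str:
    """Path relative to anchor; fall back to the filename if anchor is not an ancestor."""
    try:
        return file_path.relative_to(anchor).as_posix()
    except ValueError:  # anchor is not an ancestor of file_path
        return file_path.name
```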
tests/unit/doc/test_parser_roundtrip.py (modified, 35 lines changed)
@@ -197,6 +197,35 @@ class TestFenceGrammar:
             SectionType.PREFERENCE,
         ]
 
+    def test_whitespace_only_trailing_prose_is_elided(self) -> None:
+        text = (
+            f"---\ndlm_id: {VALID_ULID}\nbase_model: smollm2-135m\n---\n\n"
+            "::instruction::\n"
+            "### Q\n"
+            "q\n"
+            "### A\n"
+            "a\n"
+            "\n"
+            "   \n"
+            "\t\n"
+        )
+        parsed = parse_text(text)
+        assert [section.type for section in parsed.sections] == [SectionType.INSTRUCTION]
+
+    def test_whitespace_only_prose_before_first_fence_is_elided(self) -> None:
+        text = (
+            f"---\ndlm_id: {VALID_ULID}\nbase_model: smollm2-135m\n---\n\n"
+            "   \n"
+            "\t\n"
+            "::instruction::\n"
+            "### Q\n"
+            "q\n"
+            "### A\n"
+            "a\n"
+        )
+        parsed = parse_text(text)
+        assert [section.type for section in parsed.sections] == [SectionType.INSTRUCTION]
+
     def test_unknown_attribute_fence_raises(self) -> None:
         text = (
             f"---\ndlm_id: {VALID_ULID}\nbase_model: smollm2-135m\n---\n\n"
tests/unit/doc/test_serializer_edges.py (modified, 18 lines changed)
@@ -173,6 +173,18 @@ class TestSerializeTrailingNewline:
         assert out.endswith("\n")
         assert not out.endswith("\n\n")
 
+    def test_serializer_adds_newline_when_section_render_omits_it(
+        self, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        fm = DlmFrontmatter(dlm_id=VALID_ULID, base_model="smollm2-135m")
+        parsed = ParsedDlm(
+            frontmatter=fm,
+            sections=(Section(SectionType.PROSE, "content"),),
+        )
+        monkeypatch.setattr("dlm.doc.serializer._serialize_frontmatter", lambda _fm: "---\n---")
+        monkeypatch.setattr("dlm.doc.serializer._serialize_section", lambda _section: "body")
+        assert serialize(parsed).endswith("\n")
+
 
 class TestFrontmatterExplicitTargetModulesList:
     """Ensures the list branch in the nested-mapping emitter is exercised."""
tests/unit/eval/test_mode_split.py (modified, 59 lines changed)
@@ -8,7 +8,7 @@ from unittest.mock import MagicMock
 
 import pytest
 
-from dlm.eval.mode_split import compute_val_loss_by_mode
+from dlm.eval.mode_split import _safe_eval_loss, compute_val_loss_by_mode
 
 
 class _FakeDataset:
@@ -68,6 +68,14 @@ class TestEmptyOrMissing:
         assert compute_val_loss_by_mode(trainer, _FakeDataset([])) == (None, None)
         trainer.evaluate.assert_not_called()
 
+    def test_non_sized_dataset_returns_both_none(self) -> None:
+        trainer = MagicMock()
+        assert compute_val_loss_by_mode(trainer, _NonSizedDataset([{"text": "prose"}])) == (
+            None,
+            None,
+        )
+        trainer.evaluate.assert_not_called()
+
 
 class TestModeClassification:
     def test_only_cpt_rows(self) -> None:
@@ -149,6 +157,14 @@ class TestEvalFailures:
         assert cpt is None
         assert sft is None
 
+    def test_non_numeric_eval_loss_yields_none(self) -> None:
+        trainer = MagicMock()
+        trainer.evaluate.return_value = {"eval_loss": object()}
+        val = _FakeDataset([{"text": "a"}])
+        cpt, sft = compute_val_loss_by_mode(trainer, val)
+        assert cpt is None
+        assert sft is None
+
     def test_select_failure_yields_none(
         self,
         caplog: pytest.LogCaptureFixture,
@@ -174,3 +190,23 @@ class _NoSelectDataset:
 
     def __iter__(self):  # type: ignore[no-untyped-def]
         return iter(self._rows)
+
+
+class _NonSizedDataset:
+    def __init__(self, rows: list[dict[str, Any]]) -> None:
+        self._rows = rows
+
+    def __iter__(self):  # type: ignore[no-untyped-def]
+        return iter(self._rows)
+
+
+def test_safe_eval_loss_value_error_yields_none(
+    caplog: pytest.LogCaptureFixture,
+) -> None:
+    caplog.set_level(logging.WARNING, logger="dlm.eval.mode_split")
+    trainer = MagicMock()
+    trainer.evaluate.side_effect = ValueError("bad eval")
+    val = _FakeDataset([{"text": "a"}])
+
+    assert _safe_eval_loss(trainer, val, [0], mode="cpt") is None
+    assert "val-loss split skipped cpt evaluation" in caplog.text
tests/unit/eval/test_probes.py (modified, 56 lines changed)
@@ -7,8 +7,9 @@ import logging
 
 import pytest
 
+from dlm.data.instruction_parser import QAPair
 from dlm.doc.sections import Section, SectionType
-from dlm.eval.probes import Probe, extract_probes
+from dlm.eval.probes import Probe, _auto_sample_probes, _normalize_probe_markers, extract_probes
 
 
 class TestExplicitProbes:
@@ -42,6 +43,15 @@ class TestExplicitProbes:
         # Auto-sampled fills the remainder.
         assert any(p.prompt == "not-probe" for p in probes)
 
+    def test_probe_header_preserves_blank_lines_before_prompt(self) -> None:
+        body = "### Q !probe\n\n\nWhat is Paris?\n### A\nCapital of France."
+        s = Section(type=SectionType.INSTRUCTION, content=body)
+
+        probes = extract_probes([s], k=1)
+
+        assert len(probes) == 1
+        assert probes[0].prompt == "What is Paris?"
+
 
 class TestAutoSample:
     def test_auto_sample_when_no_explicit(self) -> None:
@@ -74,6 +84,22 @@ class TestAutoSample:
         s = Section(type=SectionType.INSTRUCTION, content=body)
         assert extract_probes([s], k=0) == []
 
+    def test_auto_sample_internal_k_zero_returns_empty(self) -> None:
+        assert _auto_sample_probes([], k=0, seed=0, exclude=set(), parsed_pairs={}) == []
+
+    def test_auto_sample_exclude_skips_seen_prompts(self) -> None:
+        section = Section(type=SectionType.INSTRUCTION, content="### Q\nQ1?\n### A\nA1")
+
+        probes = _auto_sample_probes(
+            [section],
+            k=1,
+            seed=0,
+            exclude={"Q1?"},
+            parsed_pairs={section.section_id: [QAPair(question="Q1?", answer="A1")]},
+        )
+
+        assert probes == []
+
     def test_malformed_instruction_logs_warning_once(
         self,
         caplog: pytest.LogCaptureFixture,
@@ -91,3 +117,9 @@ class TestProbeDataclass:
         p = Probe(prompt="hi", reference="hello")
         with pytest.raises(dataclasses.FrozenInstanceError):
             p.prompt = "other"  # type: ignore[misc]
+
+
+def test_normalize_probe_markers_keeps_non_probe_body() -> None:
+    body = "### Q\nplain\n### A\nanswer"
+
+    assert _normalize_probe_markers(body) == body
tests/unit/export/ollama/test_modelfile.py (modified, 11 lines changed)
@@ -135,6 +135,11 @@ class TestShape:
         text = render_modelfile(_ctx(tmp_path))
         assert 'LICENSE "Apache-2.0"' in text
 
+    def test_license_line_omitted_when_spec_has_no_spdx(self, tmp_path: Path) -> None:
+        spec = _SPEC.model_copy(update={"license_spdx": ""})
+        text = render_modelfile(_ctx(tmp_path, spec=spec))
+        assert "LICENSE " not in text
+
     def test_trailing_newline(self, tmp_path: Path) -> None:
         assert render_modelfile(_ctx(tmp_path)).endswith("\n")
 
tests/unit/export/targets/test_llama_server_argv.py (modified, 140 lines changed)
@@ -6,9 +6,27 @@ import json
 from datetime import datetime
 from pathlib import Path
 
+import pytest
+
 from dlm.base_models import BASE_MODELS
+from dlm.export.dispatch import DispatchResult
+from dlm.export.errors import ExportError
 from dlm.export.manifest import ExportManifest, load_export_manifest
-from dlm.export.targets.llama_server import prepare_llama_server_export
+from dlm.export.targets.base import TargetResult
+from dlm.export.targets.llama_server import (
+    LLAMA_SERVER_TARGET,
+    _find_artifact,
+    _optional_int_extra,
+    _optional_path_extra,
+    _optional_prepared_path,
+    _read_chat_template,
+    _require_path_extra,
+    _require_prepared_int,
+    _require_prepared_path,
+    _require_spec_extra,
+    _script_dir_arg,
+    prepare_llama_server_export,
+)
 
 
 def _vendor_tree(tmp_path: Path) -> Path:
@@ -117,3 +135,112 @@ class TestPrepareLlamaServerExport:
         script = prepared.launch_script_path.read_text(encoding="utf-8")
         assert "--lora " not in script
         assert "--ctx-size 512" in script
+
+
+class TestLlamaServerHelpers:
+    def test_read_chat_template_rejects_invalid_json(self, tmp_path: Path) -> None:
+        adapter_dir = tmp_path / "adapter"
+        adapter_dir.mkdir()
+        (adapter_dir / "tokenizer_config.json").write_text("not json {{{", encoding="utf-8")
+
+        with pytest.raises(ExportError, match="cannot load chat template"):
+            _read_chat_template(adapter_dir)
+
+    def test_read_chat_template_rejects_blank_template(self, tmp_path: Path) -> None:
+        adapter_dir = tmp_path / "adapter"
+        adapter_dir.mkdir()
+        (adapter_dir / "tokenizer_config.json").write_text(
+            json.dumps({"chat_template": "   "}),
+            encoding="utf-8",
+        )
+
+        with pytest.raises(ExportError, match="has no non-empty chat_template"):
+            _read_chat_template(adapter_dir)
+
+    def test_find_artifact_missing_prefix_raises(self, tmp_path: Path) -> None:
+        with pytest.raises(ExportError, match="missing export artifact with prefix"):
+            _find_artifact([tmp_path / "adapter.gguf"], prefix="base.")
+
+    def test_script_dir_arg_requires_path(self) -> None:
+        with pytest.raises(ExportError, match="missing a required path"):
+            _script_dir_arg(None)
+
+    def test_dispatch_extra_validators_raise_on_wrong_types(self, tmp_path: Path) -> None:
+        ctx = DispatchResult(
+            export_dir=tmp_path,
+            manifest_path=tmp_path / "export_manifest.json",
+            artifacts=[],
+            banner_lines=[],
+            extras={
+                "adapter_dir": "bad",
+                "training_sequence_len": "bad",
+                "spec": "bad",
+                "vendor_override": "bad",
+            },
+        )
+
+        with pytest.raises(ExportError, match="missing Path extra 'adapter_dir'"):
+            _require_path_extra(ctx, "adapter_dir")
+        with pytest.raises(ExportError, match="must be an int"):
+            _optional_int_extra(ctx, "training_sequence_len")
+        with pytest.raises(ExportError, match="missing BaseModelSpec extra 'spec'"):
+            _require_spec_extra(ctx, "spec")
+        with pytest.raises(ExportError, match="must be a Path"):
+            _optional_path_extra(ctx, "vendor_override")
+
+        empty_ctx = DispatchResult(
+            export_dir=tmp_path,
+            manifest_path=tmp_path / "export_manifest.json",
+            artifacts=[],
+            banner_lines=[],
+            extras={},
+        )
+        assert _optional_path_extra(empty_ctx, "vendor_override") is None
+        assert _optional_int_extra(empty_ctx, "training_sequence_len") is None
+
+    def test_prepared_extra_validators_raise_on_wrong_types(self, tmp_path: Path) -> None:
+        prepared = TargetResult(
+            name="llama-server",
+            export_dir=tmp_path,
+            manifest_path=tmp_path / "export_manifest.json",
+            config_path=tmp_path / "chat-template.jinja",
+            extras={
+                "model_path": tmp_path / "base.gguf",
+                "adapter_gguf_path": "bad",
+                "context_length": 512,
+            },
+        )
+
+        assert _require_prepared_path(prepared, "model_path") == tmp_path / "base.gguf"
+        with pytest.raises(ExportError, match="must be a Path"):
+            _optional_prepared_path(prepared, "adapter_gguf_path")
+        with pytest.raises(ExportError, match="must be a Path"):
+            LLAMA_SERVER_TARGET.launch_command(prepared)
+
+        bad_int = TargetResult(
+            name="llama-server",
+            export_dir=tmp_path,
+            manifest_path=tmp_path / "export_manifest.json",
+            config_path=tmp_path / "chat-template.jinja",
+            extras={
+                "model_path": tmp_path / "base.gguf",
+                "context_length": "bad",
+            },
+        )
+        with pytest.raises(ExportError, match="missing int extra 'context_length'"):
+            _require_prepared_int(bad_int, "context_length")
+
+    def test_smoke_failure_from_runtime_command_is_reported(self, tmp_path: Path) -> None:
+        prepared = TargetResult(
+            name="llama-server",
+            export_dir=tmp_path,
+            manifest_path=tmp_path / "export_manifest.json",
+            extras={"model_path": "bad"},
+            config_path=tmp_path / "chat-template.jinja",
+        )
+
+        result = LLAMA_SERVER_TARGET.smoke_test(prepared)
+
+        assert result.attempted is True
+        assert result.ok is False
+        assert "missing Path extra 'model_path'" in result.detail
tests/unit/export/targets/test_mlx_serve_argv.py (modified, 116 lines changed)
@@ -15,6 +15,9 @@ from dlm.export.targets.mlx_serve import (
     MLX_SERVE_TARGET,
     _quote_script_arg,
     _require_prepared_int,
+    _require_prepared_path,
+    _require_prepared_str,
+    _version_from_dir_name,
     finalize_mlx_serve_export,
     prepare_mlx_serve_export,
 )
@@ -115,6 +118,30 @@ class TestPrepareMlxServeExport:
         assert store_manifest.exports[-1].quant == "hf"
         assert store_manifest.exports[-1].smoke_output_first_line == "hello from mlx"
 
+    def test_prepare_replaces_stale_staged_adapter_dir(
+        self, tmp_path: Path, monkeypatch: object
+    ) -> None:
+        store = _setup_flat_store(tmp_path)
+        export_dir = store.exports / "mlx-serve"
+        stale_dir = export_dir / "adapter"
+        stale_dir.mkdir(parents=True)
+        (stale_dir / "stale.txt").write_text("stale", encoding="utf-8")
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.is_apple_silicon", lambda: True)
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.mlx_available", lambda: True)
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.stage_mlx_adapter_dir", _fake_stage_mlx)
+
+        prepared = prepare_mlx_serve_export(
+            store=store,
+            spec=_SPEC,
+            adapter_name=None,
+            adapter_path_override=None,
+            declared_adapter_names=None,
+        )
+
+        assert prepared.launch_script_path is not None
+        assert not (prepared.export_dir / "adapter" / "stale.txt").exists()
+        assert (prepared.export_dir / "adapter" / "adapters.safetensors").exists()
+
     def test_multi_adapter_export_requires_explicit_selection(
         self, tmp_path: Path, monkeypatch: object
     ) -> None:
@@ -174,6 +201,58 @@ class TestPrepareMlxServeExport:
                 declared_adapter_names=None,
             )
 
+    def test_named_adapter_export_uses_named_dir(self, tmp_path: Path, monkeypatch: object) -> None:
+        store = _setup_named_store(tmp_path)
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.is_apple_silicon", lambda: True)
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.mlx_available", lambda: True)
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.stage_mlx_adapter_dir", _fake_stage_mlx)
+
+        prepared = prepare_mlx_serve_export(
+            store=store,
+            spec=_SPEC,
+            adapter_name="knowledge",
+            adapter_path_override=None,
+            declared_adapter_names=None,
+        )
+
+        assert str(prepared.extras["adapter_dir"]).endswith("knowledge")
+        assert prepared.extras["adapter_version"] == 2
+
+    def test_missing_adapter_override_raises(self, tmp_path: Path, monkeypatch: object) -> None:
+        store = _setup_flat_store(tmp_path)
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.is_apple_silicon", lambda: True)
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.mlx_available", lambda: True)
+
+        with pytest.raises(ExportError, match="adapter_path_override .* does not exist"):
+            prepare_mlx_serve_export(
+                store=store,
+                spec=_SPEC,
+                adapter_name=None,
+                adapter_path_override=tmp_path / "missing",
+                declared_adapter_names=None,
+            )
+
+    def test_existing_adapter_override_uses_mixed_dir(
+        self, tmp_path: Path, monkeypatch: object
+    ) -> None:
+        store = _setup_flat_store(tmp_path)
+        override = tmp_path / "custom-adapter"
+        _write_adapter(override)
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.is_apple_silicon", lambda: True)
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.mlx_available", lambda: True)
+        monkeypatch.setattr("dlm.export.targets.mlx_serve.stage_mlx_adapter_dir", _fake_stage_mlx)
+
+        prepared = prepare_mlx_serve_export(
+            store=store,
+            spec=_SPEC,
+            adapter_name=None,
+            adapter_path_override=override,
+            declared_adapter_names=None,
+        )
+
+        assert str(prepared.extras["adapter_dir"]).endswith("mixed")
+        assert prepared.extras["adapter_version"] == 1
+
     def test_missing_default_adapter_raises(self, tmp_path: Path, monkeypatch: object) -> None:
        store = for_dlm("01EMPTYMLX", home=tmp_path)
        store.ensure_layout()
@@ -262,3 +341,19 @@ class TestMlxServeHelpers:
         )
         with pytest.raises(ExportError, match="missing int extra"):
             _require_prepared_int(prepared, "adapter_version")
+
+    def test_string_and_path_validation(self) -> None:
+        prepared = TargetResult(
+            name="mlx-serve",
+            export_dir=Path("/tmp/export"),
+            manifest_path=Path("/tmp/export/export_manifest.json"),
+            extras={"model": "", "adapter_dir": "bad"},
+        )
+
+        with pytest.raises(ExportError, match="missing string extra"):
+            _require_prepared_str(prepared, "model")
+        with pytest.raises(ExportError, match="missing Path extra"):
+            _require_prepared_path(prepared, "adapter_dir")
+
+    def test_version_from_dir_name_defaults_for_non_version_dirs(self) -> None:
+        assert _version_from_dir_name(Path("custom-adapter")) == 1
tests/unit/export/targets/test_vllm_argv.py (modified, 77 lines changed)
@@ -16,12 +16,14 @@ from dlm.export.targets.vllm import (
     VLLM_TARGET,
     LoraModule,
     _default_runtime_env,
+    _machine,
     _optional_prepared_int,
     _render_launch_script,
     _require_module_specs,
     _require_prepared_int,
     _require_prepared_str,
     _runtime_env,
+    _sys_platform,
     finalize_vllm_export,
     prepare_vllm_export,
 )
@@ -128,6 +130,27 @@ class TestPrepareVllmExport:
         assert store_manifest.exports[-1].quant == "hf"
         assert store_manifest.exports[-1].smoke_output_first_line == "hello from vllm"
 
+    def test_prepare_replaces_stale_adapters_dir(self, tmp_path: Path) -> None:
+        store = _setup_flat_store(tmp_path)
+        export_dir = store.exports / "vllm"
+        stale_dir = export_dir / "adapters"
+        stale_dir.mkdir(parents=True)
+        (stale_dir / "stale.txt").write_text("stale", encoding="utf-8")
+
+        prepared = prepare_vllm_export(
+            store=store,
+            spec=_SPEC,
+            served_model_name="dlm-flat",
+            training_sequence_len=2048,
+            adapter_name=None,
+            adapter_path_override=None,
+            declared_adapter_names=None,
+        )
+
+        assert prepared.launch_script_path is not None
+        assert not (prepared.export_dir / "adapters" / "stale.txt").exists()
+        assert (prepared.export_dir / "adapters" / "adapter" / "adapter_model.safetensors").exists()
+
     def test_multi_adapter_export_includes_all_named_modules(self, tmp_path: Path) -> None:
         store = _setup_named_store(tmp_path)
 
@@ -244,6 +267,26 @@ class TestPrepareVllmExport:
                 declared_adapter_names=None,
             )
 
+    def test_named_adapter_export_stages_only_named_module(self, tmp_path: Path) -> None:
+        store = _setup_named_store(tmp_path)
+
+        prepared = prepare_vllm_export(
+            store=store,
+            spec=_SPEC,
+            served_model_name="dlm-knowledge",
+            training_sequence_len=2048,
+            adapter_name="knowledge",
+            adapter_path_override=None,
+            declared_adapter_names=None,
+        )
+
+        config = json.loads(
+            (prepared.export_dir / VLLM_CONFIG_FILENAME).read_text(encoding="utf-8")
+        )
+        assert config["lora_modules"] == [
+            {"adapter_version": 2, "name": "knowledge", "path": "adapters/knowledge"}
+        ]
+
     def test_missing_default_adapter_raises(self, tmp_path: Path) -> None:
         store = for_dlm("01EMPTYVLLM", home=tmp_path)
         store.ensure_layout()
@@ -355,6 +398,10 @@ class TestVllmSmoke:
 
 
 class TestVllmHelpers:
+    def test_platform_helpers_return_strings(self) -> None:
+        assert isinstance(_sys_platform(), str)
+        assert isinstance(_machine(), str)
+
     def test_default_runtime_env_is_empty_off_apple_silicon(
         self, monkeypatch: pytest.MonkeyPatch
     ) -> None:
tests/unit/export/test_arch_probe.py (modified, 29 lines changed)
@@ -19,6 +19,7 @@ from pathlib import Path
 
 import pytest
 
+import dlm.export.arch_probe as arch_probe
 from dlm.export.arch_probe import (
     ArchProbeResult,
     SupportLevel,
@@ -173,6 +174,22 @@ class TestGrammarEdgeCases:
         # "GemmaForCausalLM" (without the 3) isn't registered.
         assert result.support is SupportLevel.UNSUPPORTED
 
+    def test_decorator_without_following_class_is_ignored(self, tmp_path: Path) -> None:
+        root = _fixture_llama_cpp(
+            tmp_path,
+            '@ModelBase.register("FooForCausalLM")\n# no class follows\n',
+        )
+        result = probe_gguf_arch("FooForCausalLM", llama_cpp_root=root)
+        assert result.support is SupportLevel.UNSUPPORTED
+
+    def test_unextractable_class_name_is_ignored(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        text = '@ModelBase.register("FooForCausalLM")\nclass FooModel(TextModel):\n    pass\n'
+        monkeypatch.setattr(arch_probe, "_extract_class_name", lambda _text, _start: None)
+        assert arch_probe._find_arch_bindings(text, "FooForCausalLM") == []
+
+    def test_extract_class_name_returns_none_without_open_paren(self) -> None:
+        assert arch_probe._extract_class_name("class FooModel:\n    pass\n", 0) is None
+
 
class TestMemoization:
    def test_repeat_calls_hit_cache(self, tmp_path: Path) -> None:
tests/unit/export/test_audio_snapshot.py (modified, 105 lines changed)
@@ -12,6 +12,7 @@ Mirrors `test_vl_snapshot.py`. Covers:
 
 from __future__ import annotations
 
+import json
 from pathlib import Path
 
 import pytest
@@ -97,6 +98,12 @@ class TestRefusals:
         with pytest.raises(ExportError, match="only audio-language bases"):
             run_audio_snapshot_export(populated_store, _text_spec())
 
+    def test_missing_audio_preprocessor_plan_refused(self, populated_store) -> None:
+        spec = _audio_spec()
+        object.__setattr__(spec, "audio_preprocessor_plan", None)
+        with pytest.raises(ExportError, match="no audio_preprocessor_plan"):
+            run_audio_snapshot_export(populated_store, spec)
+
     def test_missing_adapter_refused(self, tmp_path: Path) -> None:
         store = for_dlm(_VALID_ULID, home=tmp_path)
         store.ensure_layout()
@@ -142,6 +149,72 @@ class TestSnapshotLayout:
         assert result.export_dir.name != "hf-snapshot"
         assert result.export_dir.name == AUDIO_SNAPSHOT_SUBDIR
 
+    def test_named_adapter_export_uses_named_current_pointer(self, populated_store) -> None:
+        named = populated_store.adapter_version_for("podcast", 5)
+        named.mkdir(parents=True, exist_ok=True)
+        (named / "adapter_config.json").write_text('{"r": 32}', encoding="utf-8")
+        (named / "adapter_model.safetensors").write_bytes(b"named audio bytes")
+        populated_store.set_current_adapter_for("podcast", named)
+
+        result = run_audio_snapshot_export(
+            populated_store,
+            _audio_spec(),
+            adapter_name="podcast",
+        )
+
+        assert (
+            result.adapter_dir / "adapter_model.safetensors"
+        ).read_bytes() == b"named audio bytes"
+        manifest = load_audio_snapshot_manifest(result.export_dir)
+        assert manifest.adapter_version == 5
+        assert manifest.adapter_name == "podcast"
+
+    def test_adapter_override_uses_provided_dir(self, populated_store, tmp_path: Path) -> None:
+        override = tmp_path / "merged-adapter"
+        override.mkdir()
+        (override / "adapter_model.safetensors").write_bytes(b"override audio bytes")
+
+        result = run_audio_snapshot_export(
+            populated_store,
+            _audio_spec(),
+            adapter_path_override=override,
+        )
+
+        assert (
+            result.adapter_dir / "adapter_model.safetensors"
+        ).read_bytes() == b"override audio bytes"
+        manifest = load_audio_snapshot_manifest(result.export_dir)
+        assert manifest.adapter_version == 1
+
+    def test_missing_adapter_override_refused(self, populated_store, tmp_path: Path) -> None:
+        with pytest.raises(ExportError, match="adapter_path_override .* does not exist"):
+            run_audio_snapshot_export(
+                populated_store,
+                _audio_spec(),
+                adapter_path_override=tmp_path / "missing",
+            )
+
+    def test_processor_save_pretrained_writes_processor_artifact(self, populated_store) -> None:
+        class _Processor:
+            def save_pretrained(self, out_dir: str) -> None:
+                Path(out_dir, "processor_config.json").write_text("{}", encoding="utf-8")
+
+        result = run_audio_snapshot_export(populated_store, _audio_spec(), processor=_Processor())
+
+        assert (result.processor_dir / "processor_config.json").exists()
+        manifest = load_audio_snapshot_manifest(result.export_dir)
+        paths = {entry.path for entry in manifest.artifacts}
+        assert "processor/processor_config.json" in paths
+
+    def test_noncallable_processor_save_is_ignored(self, populated_store) -> None:
+        class _Processor:
+            save_pretrained = "not-callable"
+
+        result = run_audio_snapshot_export(populated_store, _audio_spec(), processor=_Processor())
+
+        assert result.processor_dir.exists()
+        assert not any(result.processor_dir.iterdir())
+
 
class TestManifestContent:
    def test_export_target_is_hf_snapshot(self, populated_store) -> None:
@@ -213,6 +286,14 @@ class TestManifestLoadFailures:
         with pytest.raises(ExportManifestError, match="cannot parse"):
             load_audio_snapshot_manifest(tmp_path)
 
+    def test_invalid_shape_raises(self, tmp_path: Path) -> None:
+        (tmp_path / SNAPSHOT_MANIFEST_FILENAME).write_text(
+            json.dumps({"created_by": "dlm-test"}),
+            encoding="utf-8",
+        )
+        with pytest.raises(ExportManifestError, match="invalid shape"):
+            load_audio_snapshot_manifest(tmp_path)
+
 
class TestManifestModelDirect:
    def test_frozen(self) -> None:
tests/unit/export/test_draft_registry.py (modified, 20 lines changed)
@@ -79,6 +79,20 @@ class TestValidatorRejectsMismatches:
         with pytest.raises(ValueError, match="target_key 'qwen2.5-3b' not in BASE_MODELS"):
             validate_registry(registry)
 
+    def test_missing_draft_registry_key_raises(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        import dlm.export.draft_registry as mod
+
+        bad_pair = DraftPair(
+            target_key="a",
+            draft_registry_key="missing",
+            upstream_ollama_tag="a:tiny",
+            notes="missing draft key",
+        )
+        monkeypatch.setattr(mod, "DRAFT_PAIRS", (bad_pair,))
+        registry = {"a": self._fake_spec()}
+        with pytest.raises(ValueError, match="draft_registry_key 'missing' not in BASE_MODELS"):
+            validate_registry(registry)
+
     def test_mismatched_template_raises(self, monkeypatch: pytest.MonkeyPatch) -> None:
         import dlm.export.draft_registry as mod
 
tests/unit/export/test_embedding_sync.py (modified, 51 lines changed)
@@ -3,11 +3,14 @@
 from __future__ import annotations
 
 import json
+import sys
 from pathlib import Path
+from types import SimpleNamespace
 
 import numpy as np
 import pytest
 
+import dlm.export.embedding_sync as embedding_sync
 from dlm.export.embedding_sync import assert_embedding_rows_match
 from dlm.export.errors import PreflightError
 from dlm.export.gguf_tensors import GGML_TYPE_F16
@@ -435,6 +438,37 @@ class TestRobustSkips:
 
         assert _added_special_token_ids(adapter) == [3]
 
+    def test_non_dict_added_tokens_decoder_returns_empty(self, tmp_path: Path) -> None:
+        adapter = tmp_path / "adapter"
+        adapter.mkdir()
+        (adapter / "tokenizer_config.json").write_text(
+            json.dumps(
+                {
+                    "vocab_size": 5,
+                    "chat_template": "x",
+                    "added_tokens_decoder": ["not", "a", "dict"],
+                }
+            )
+        )
+        assert embedding_sync._added_special_token_ids(adapter) == []
+
+    def test_safe_open_oserror_raises_preflight(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        adapter = tmp_path / "adapter"
+        adapter.mkdir()
+        (adapter / "adapter_model.safetensors").write_bytes(b"placeholder")
+
+        def _boom(*_args: object, **_kwargs: object) -> object:
+            raise OSError("broken safetensors")
+
+        monkeypatch.setitem(sys.modules, "safetensors", SimpleNamespace(safe_open=_boom))
+        with pytest.raises(PreflightError, match="cannot read adapter safetensors"):
+            embedding_sync._load_adapter_safetensors(adapter)
+
+    def test_row_list_returns_empty_for_rank1_tensor(self) -> None:
+        assert embedding_sync._as_row_list(np.asarray([1.0, 2.0], dtype=np.float16)) == []
+
 
class TestBoundsChecks:
    def test_added_token_id_out_of_range_raises(self, tmp_path: Path) -> None:
tests/unit/export/test_gate_fallback_resolve.py (modified, 72 lines changed)
@@ -3,13 +3,14 @@
 from __future__ import annotations
 
 import json
+from dataclasses import replace
 from pathlib import Path
 from types import MappingProxyType
 
 from dlm.doc.parser import ParsedDlm
 from dlm.doc.schema import AdapterConfig, DlmFrontmatter, GateConfig, TrainingConfig
 from dlm.doc.sections import Section, SectionType
-from dlm.export.gate_fallback import resolve_gate_mix
+from dlm.export.gate_fallback import resolve_and_announce, resolve_gate_mix
 from dlm.metrics.events import GateEvent, RunStart
 from dlm.metrics.recorder import MetricsRecorder
 from dlm.store.paths import StorePath
@@ -73,6 +74,23 @@ def test_no_gate_config_returns_none(tmp_path: Path) -> None:
     assert resolve_gate_mix(store, _parsed()) is None
 
 
+def test_single_adapter_returns_none(tmp_path: Path) -> None:
+    store = StorePath(root=tmp_path)
+    store.ensure_layout()
+    parsed = _parsed(gate_enabled=False, adapters=("solo",))
+    single_adapter_training = parsed.frontmatter.training.model_copy(
+        update={"gate": GateConfig(enabled=True)}
+    )
+    single_adapter_frontmatter = parsed.frontmatter.model_copy(
+        update={"training": single_adapter_training}
+    )
+    assert resolve_gate_mix(store, replace(parsed, frontmatter=single_adapter_frontmatter)) is None
+
+
+def test_non_store_or_non_parsed_returns_none() -> None:
+    assert resolve_gate_mix(object(), object()) is None
+
+
def test_uniform_mode_returns_uniform_mix(tmp_path: Path) -> None:
    store = StorePath(root=tmp_path)
    store.ensure_layout()
@@ -152,3 +170,34 @@ def test_preserves_declared_adapter_order(tmp_path: Path) -> None:
     mix = resolve_gate_mix(store, _parsed(adapters=("zeta", "alpha")))
     # Order must match the config's adapter_names tuple, not alphabetic.
     assert mix == [("zeta", 0.4), ("alpha", 0.6)]
+
+
+def test_resolve_and_announce_no_substitution(tmp_path: Path) -> None:
+    store = StorePath(root=tmp_path)
+    store.ensure_layout()
+
+    resolution = resolve_and_announce(store, _parsed(gate_enabled=False))
+
+    assert resolution.entries is None
+    assert resolution.banner_lines == []
+
+
+def test_resolve_and_announce_substitution_banner(tmp_path: Path) -> None:
+    store = StorePath(root=tmp_path)
+    store.ensure_layout()
+    _write_gate_config(
+        store,
+        GateMetadata(
+            input_dim=576,
+            hidden_proj_dim=64,
+            adapter_names=("a", "b"),
+            mode="uniform",
+        ),
+    )
+
+    resolution = resolve_and_announce(store, _parsed())
+
+    assert resolution.entries == [("a", 0.5), ("b", 0.5)]
+    assert resolution.banner_lines == [
+        "[dim]export: substituting learned gate weights for --adapter-mix (gate_mode=static).[/dim]"
+    ]
tests/unit/export/test_gguf_io.py (added)
33 lines changed
@@ -0,0 +1,33 @@
+"""Private GGUF IO helper coverage."""
+
+from __future__ import annotations
+
+import io
+import struct
+
+import pytest
+
+from dlm.export._gguf_io import _TYPE_ARRAY, _TYPE_STRING, _read_string, _read_u64, _skip_value
+
+
+def test_read_u64_short_read_raises() -> None:
+    with pytest.raises(struct.error, match="short read"):
+        _read_u64(io.BytesIO(b"\x01\x02"))
+
+
+def test_read_string_short_read_raises() -> None:
+    data = io.BytesIO(struct.pack("<Q", 4) + b"ab")
+
+    with pytest.raises(struct.error, match="short read in string"):
+        _read_string(data)
+
+
+def test_skip_value_string_array_huge_length_raises() -> None:
+    data = io.BytesIO(
+        struct.pack("<I", _TYPE_STRING)
+        + struct.pack("<Q", 1)
+        + struct.pack("<Q", (16 * 1024 * 1024) + 1)
+    )
+
+    with pytest.raises(struct.error, match="exceeds bound"):
+        _skip_value(data, _TYPE_ARRAY)
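Outside the diff, the short-read discipline these tests pin down can be sketched as a standalone helper pair. This is a hypothetical reimplementation for illustration only; the real `_read_u64`/`_read_string` live in `dlm.export._gguf_io` and their exact signatures are not shown here.

```python
import io
import struct


def read_u64(stream: io.BufferedIOBase) -> int:
    # Refuse short reads instead of silently unpacking garbage.
    raw = stream.read(8)
    if len(raw) != 8:
        raise struct.error("short read")
    return struct.unpack("<Q", raw)[0]


def read_string(stream: io.BufferedIOBase) -> str:
    # Length-prefixed UTF-8 string; the declared length must be fully present.
    length = read_u64(stream)
    raw = stream.read(length)
    if len(raw) != length:
        raise struct.error("short read in string")
    return raw.decode("utf-8")
```

Raising `struct.error` (rather than returning a partial value) is what lets the tests above assert on a single exception type for every truncated-input path.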
tests/unit/export/test_gguf_tensors.py (modified)
75 lines changed
@@ -239,6 +239,33 @@ class TestLoadTensorIndex:
         with pytest.raises(PreflightError, match="cannot parse GGUF"):
             load_tensor_index(path)

+    def test_short_tensor_name_read_refused(self, tmp_path: Path) -> None:
+        header = bytearray(b"GGUF")
+        header.extend(struct.pack("<I", 3))
+        header.extend(struct.pack("<Q", 1))  # tensor_count
+        header.extend(struct.pack("<Q", 1))  # kv_count
+        _write_kv_u32(header, "general.alignment", 32)
+        header.extend(struct.pack("<Q", 5))  # claims 5 bytes
+        header.extend(b"abc")  # only 3 bytes available
+        path = tmp_path / "short-name.gguf"
+        path.write_bytes(bytes(header))
+        with pytest.raises(PreflightError, match="cannot parse GGUF"):
+            load_tensor_index(path)
+
+    @pytest.mark.parametrize("n_dims", [0, 9])
+    def test_invalid_tensor_rank_refused(self, tmp_path: Path, n_dims: int) -> None:
+        header = bytearray(b"GGUF")
+        header.extend(struct.pack("<I", 3))
+        header.extend(struct.pack("<Q", 1))  # tensor_count
+        header.extend(struct.pack("<Q", 1))  # kv_count
+        _write_kv_u32(header, "general.alignment", 32)
+        _write_string(header, "token_embd.weight")
+        header.extend(struct.pack("<I", n_dims))
+        path = tmp_path / f"ndims-{n_dims}.gguf"
+        path.write_bytes(bytes(header))
+        with pytest.raises(PreflightError, match="cannot parse GGUF"):
+            load_tensor_index(path)
+

 class TestRowBytesErrors:
     def _build_basic(self, tmp_path: Path) -> Path:
@@ -277,6 +304,42 @@ class TestRowBytesErrors:
         with pytest.raises(PreflightError, match="block-quantized"):
             index.row_bytes("token_embd.weight", 0)

+    def test_rank_zero_tensor_refused(self, tmp_path: Path) -> None:
+        index = load_tensor_index(self._build_basic(tmp_path))
+        index = index.__class__(
+            path=index.path,
+            entries=(
+                TensorEntry(name="token_embd.weight", shape=(), dtype=GGML_TYPE_F16, offset=0),
+            ),
+            data_block_start=index.data_block_start,
+            alignment=index.alignment,
+        )
+        with pytest.raises(PreflightError, match="rank 0"):
+            index.row_bytes("token_embd.weight", 0)
+
+    def test_short_row_read_raises(self, tmp_path: Path) -> None:
+        path = self._build_basic(tmp_path)
+        index = load_tensor_index(path)
+        path.write_bytes(path.read_bytes()[:-1])
+        with pytest.raises(PreflightError, match="short read on row 1"):
+            index.row_bytes("token_embd.weight", 1)
+
+    def test_oserror_while_opening_tensor_raises(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        path = self._build_basic(tmp_path)
+        index = load_tensor_index(path)
+        original_open = Path.open
+
+        def _boom(self: Path, *args: object, **kwargs: object) -> object:
+            if self == index.path:
+                raise OSError("nope")
+            return original_open(self, *args, **kwargs)
+
+        monkeypatch.setattr(Path, "open", _boom)
+        with pytest.raises(PreflightError, match="cannot read row 0"):
+            index.row_bytes("token_embd.weight", 0)
+

 class TestFindApi:
     def test_find_returns_entry_or_none(self, tmp_path: Path) -> None:
tests/unit/export/test_imatrix.py (modified)
108 lines changed
@@ -334,6 +334,36 @@ class TestResolveImatrix:
             is None
         )

+    def test_non_string_sha_returns_none(self, tmp_path: Path) -> None:
+        export_dir = self._seed(tmp_path)
+        meta = json.loads((export_dir / "imatrix.meta.json").read_text())
+        meta["sha256"] = 123
+        (export_dir / "imatrix.meta.json").write_text(json.dumps(meta))
+        assert (
+            resolve_imatrix(
+                export_dir,
+                base_revision="r1",
+                corpus_sha256="c1",
+                chunks=DEFAULT_CHUNKS,
+            )
+            is None
+        )
+
+    def test_invalid_built_at_returns_none(self, tmp_path: Path) -> None:
+        export_dir = self._seed(tmp_path)
+        meta = json.loads((export_dir / "imatrix.meta.json").read_text())
+        meta["built_at"] = "not-a-datetime"
+        (export_dir / "imatrix.meta.json").write_text(json.dumps(meta))
+        assert (
+            resolve_imatrix(
+                export_dir,
+                base_revision="r1",
+                corpus_sha256="c1",
+                chunks=DEFAULT_CHUNKS,
+            )
+            is None
+        )
+

 # --- calibration_text_from_replay --------------------------------------------

@@ -417,3 +447,72 @@ class TestCalibrationTextFromReplay:
         # `max_chars` is the pre-joiner content budget; the `\n\n`
         # separator between snapshots adds a small constant overhead.
         assert len(text) <= 8_000 + 2 * 10  # 10 possible joiners
+
+    def test_empty_and_whitespace_snapshots_are_skipped(self, tmp_path: Path) -> None:
+        from datetime import UTC
+        from datetime import datetime as _dt
+
+        from dlm.replay.models import SectionSnapshot
+        from dlm.replay.store import ReplayStore
+
+        corpus = tmp_path / "corpus.zst"
+        idx = tmp_path / "index.json"
+        store = ReplayStore.at(corpus, idx)
+        snaps = [
+            SectionSnapshot(
+                section_id="0000000000000001",
+                section_type="prose",
+                content="",
+                first_seen_at=_dt(2026, 4, 19, tzinfo=UTC).replace(tzinfo=None),
+                last_seen_at=_dt(2026, 4, 19, tzinfo=UTC).replace(tzinfo=None),
+            ),
+            SectionSnapshot(
+                section_id="0000000000000002",
+                section_type="prose",
+                content="   \n\t  ",
+                first_seen_at=_dt(2026, 4, 19, tzinfo=UTC).replace(tzinfo=None),
+                last_seen_at=_dt(2026, 4, 19, tzinfo=UTC).replace(tzinfo=None),
+            ),
+            SectionSnapshot(
+                section_id="0000000000000003",
+                section_type="prose",
+                content="real calibration content",
+                first_seen_at=_dt(2026, 4, 19, tzinfo=UTC).replace(tzinfo=None),
+                last_seen_at=_dt(2026, 4, 19, tzinfo=UTC).replace(tzinfo=None),
+            ),
+        ]
+        store.append_many(snaps)
+
+        text, _sha = calibration_text_from_replay(corpus_path=corpus, index_path=idx)
+        assert text == "real calibration content"
+
+    def test_truncation_can_clip_with_zero_remaining_budget(self, tmp_path: Path) -> None:
+        from datetime import UTC
+        from datetime import datetime as _dt
+
+        from dlm.replay.models import SectionSnapshot
+        from dlm.replay.store import ReplayStore
+
+        corpus = tmp_path / "corpus.zst"
+        idx = tmp_path / "index.json"
+        store = ReplayStore.at(corpus, idx)
+        snaps = [
+            SectionSnapshot(
+                section_id="0000000000000001",
+                section_type="prose",
+                content="abcd",
+                first_seen_at=_dt(2026, 4, 19, tzinfo=UTC).replace(tzinfo=None),
+                last_seen_at=_dt(2026, 4, 19, tzinfo=UTC).replace(tzinfo=None),
+            ),
+            SectionSnapshot(
+                section_id="0000000000000002",
+                section_type="prose",
+                content="efgh",
+                first_seen_at=_dt(2026, 4, 19, tzinfo=UTC).replace(tzinfo=None),
+                last_seen_at=_dt(2026, 4, 19, tzinfo=UTC).replace(tzinfo=None),
+            ),
+        ]
+        store.append_many(snaps)
+
+        text, _sha = calibration_text_from_replay(corpus_path=corpus, index_path=idx, max_chars=4)
+        assert text == "abcd"
tests/unit/export/test_merge.py (added)
21 lines changed
@@ -0,0 +1,21 @@
+"""Pure merge helper coverage."""
+
+from __future__ import annotations
+
+import pytest
+
+from dlm.export.errors import UnsafeMergeError
+from dlm.export.merge import check_merge_safety
+from dlm.export.plan import ExportPlan
+
+
+def test_check_merge_safety_delegates_to_plan() -> None:
+    check_merge_safety(ExportPlan(merged=False), was_qlora=True)
+
+
+def test_check_merge_safety_refuses_unsafe_qlora_merge() -> None:
+    with pytest.raises(UnsafeMergeError, match="QLoRA"):
+        check_merge_safety(
+            ExportPlan(merged=True, dequantize_confirmed=False),
+            was_qlora=True,
+        )
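The safety gate this file exercises can be sketched standalone. This is an illustrative reimplementation of the behavior the two tests pin down, not the `dlm.export.merge` source; the field names mirror the test's imports but are otherwise assumptions.

```python
from dataclasses import dataclass


class UnsafeMergeError(RuntimeError):
    """Raised when a merge would bake quantization error into the export."""


@dataclass(frozen=True)
class ExportPlan:
    merged: bool = False
    dequantize_confirmed: bool = False


def check_merge_safety(plan: ExportPlan, *, was_qlora: bool) -> None:
    # Merging a QLoRA-trained adapter into quantized base weights is lossy,
    # so require an explicit dequantize confirmation before proceeding.
    # Unmerged exports and non-QLoRA adapters pass through unconditionally.
    if plan.merged and was_qlora and not plan.dequantize_confirmed:
        raise UnsafeMergeError("QLoRA merge requires dequantize confirmation")
```

The happy path is a no-op, which is why the first test simply calls the function and relies on the absence of an exception.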
tests/unit/export/test_precision_safety.py (modified)
10 lines changed
@@ -54,6 +54,10 @@ class TestWasTrainedWithQlora:
         with pytest.raises(PreflightError, match="training_run_json"):
             was_trained_with_qlora(tmp_path, strict_training_run=True)

+    def test_malformed_pinned_versions_falls_back_to_false(self, tmp_path: Path) -> None:
+        (tmp_path / "pinned_versions.json").write_text("not json", encoding="utf-8")
+        assert was_trained_with_qlora(tmp_path) is False
+

 class TestResolvePrecisionSafety:
     def test_unmerged_export_is_safe(self, tmp_path: Path) -> None:
tests/unit/export/test_preflight.py (modified)
73 lines changed
@@ -4,6 +4,7 @@ from __future__ import annotations

 import json
 from pathlib import Path
+from types import SimpleNamespace

 import pytest

@@ -12,7 +13,9 @@ from dlm.export.errors import PreflightError
 from dlm.export.preflight import (
     check_adapter_config,
     check_chat_template,
+    check_pretokenizer_fingerprint,
     check_tokenizer_vocab,
+    check_vl_target_modules_lm_only,
     check_was_adapter_qlora,
 )

@@ -90,6 +93,14 @@ class TestTokenizerVocab:
         with pytest.raises(PreflightError, match="cannot determine vocab"):
             check_tokenizer_vocab(tmp_path)

+    def test_malformed_tokenizer_json_raises(self, tmp_path: Path) -> None:
+        (tmp_path / "tokenizer_config.json").write_text(
+            json.dumps({"chat_template": "{{messages}}"})
+        )
+        (tmp_path / "tokenizer.json").write_text("not json {{{")
+        with pytest.raises(PreflightError, match="cannot parse"):
+            check_tokenizer_vocab(tmp_path)
+

 class TestChatTemplate:
     def test_present_ok(self, tmp_path: Path) -> None:
@@ -114,6 +125,11 @@ class TestChatTemplate:
         with pytest.raises(PreflightError, match="missing"):
             check_chat_template(tmp_path, required=True)

+    def test_malformed_config_raises(self, tmp_path: Path) -> None:
+        (tmp_path / "tokenizer_config.json").write_text("not json {{{")
+        with pytest.raises(PreflightError, match="cannot parse"):
+            check_chat_template(tmp_path, required=True)
+

 class TestQloraFlag:
     def test_missing_file_returns_false(self, tmp_path: Path) -> None:
@@ -137,3 +153,32 @@ class TestQloraFlag:
         (tmp_path / "training_run.json").write_text("not json")
         with pytest.raises(PreflightError, match="training_run_json"):
             check_was_adapter_qlora(tmp_path)
+
+
+class TestPretokenizerFingerprint:
+    def test_failed_probe_raises(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        monkeypatch.setattr(
+            "dlm.base_models.probes.probe_pretokenizer_hash",
+            lambda _spec: SimpleNamespace(skipped=False, passed=False, detail="mismatch"),
+        )
+
+        with pytest.raises(PreflightError, match="pre-tokenizer fingerprint mismatch"):
+            check_pretokenizer_fingerprint(_SPEC)
+
+
+class TestVlTargetModulesLmOnly:
+    def test_missing_config_is_noop(self, tmp_path: Path) -> None:
+        check_vl_target_modules_lm_only(tmp_path)
+
+    def test_malformed_config_is_noop(self, tmp_path: Path) -> None:
+        (tmp_path / "adapter_config.json").write_text("not json {{{")
+        check_vl_target_modules_lm_only(tmp_path)
+
+    def test_string_pattern_target_modules_is_noop(self, tmp_path: Path) -> None:
+        _write_adapter_config(tmp_path, target_modules=".*q_proj.*")
+        check_vl_target_modules_lm_only(tmp_path)
+
+    def test_vision_targets_raise(self, tmp_path: Path) -> None:
+        _write_adapter_config(tmp_path, target_modules=["q_proj", "vision_tower.block.0"])
+        with pytest.raises(PreflightError, match="vision-tower modules"):
+            check_vl_target_modules_lm_only(tmp_path)
tests/unit/export/test_runner.py (modified)
301 lines changed
@@ -101,6 +101,21 @@ def _setup_store(tmp_path: Path, *, use_qlora: bool = False) -> tuple[Path, Any,
     return cached_base, store, vendor


+def _setup_named_store(tmp_path: Path) -> tuple[Path, Any, Path]:
+    cached_base, store, vendor = _setup_store(tmp_path)
+    knowledge = store.adapter_version_for("knowledge", 2)
+    knowledge.mkdir(parents=True)
+    (knowledge / "adapter_config.json").write_text(
+        json.dumps({"base_model_name_or_path": _SPEC.hf_id, "peft_type": "LORA"})
+    )
+    (knowledge / "tokenizer_config.json").write_text(
+        json.dumps({"vocab_size": 32000, "chat_template": "{{messages}}"})
+    )
+    (knowledge / "training_run.json").write_text(json.dumps({"use_qlora": False}))
+    store.set_current_adapter_for("knowledge", knowledge)
+    return cached_base, store, vendor
+
+
 def _relative_file_bytes(root: Path) -> dict[str, bytes]:
     return {
         str(path.relative_to(root)): path.read_bytes()
@@ -110,6 +125,11 @@ def _relative_file_bytes(root: Path) -> dict[str, bytes]:


 class TestHappyPath:
+    def test_default_ollama_name_lowercases_dlm_id(self) -> None:
+        from dlm.export.runner import default_ollama_name
+
+        assert default_ollama_name("01ABCDEF", 7) == "dlm-01abcdef:v0007"
+
     def test_unmerged_export_emits_base_and_adapter(self, tmp_path: Path) -> None:
         cached_base, store, vendor = _setup_store(tmp_path)
         plan = ExportPlan(quant="Q4_K_M", merged=False)
@@ -332,6 +352,36 @@ class TestMergeGate:
         # No subprocess should have launched on the safety-gate path.
         assert recorder.commands == []

+    def test_merged_export_delegates_to_merge_path(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        cached_base, store, vendor = _setup_store(tmp_path, use_qlora=False)
+        plan = ExportPlan(merged=True, dequantize_confirmed=True)
+        recorder = _SubprocessRecorder(store.export_quant_dir(plan.quant))
+        seen: list[dict[str, object]] = []
+
+        def _fake_merge_path(**kwargs: object) -> None:
+            seen.append(kwargs)
+
+        monkeypatch.setattr("dlm.export.runner._perform_merge_path", _fake_merge_path)
+
+        result = run_export(
+            store,
+            _SPEC,
+            plan,
+            cached_base_dir=cached_base,
+            subprocess_runner=recorder,
+            vendor_override=vendor,
+            skip_ollama=True,
+            vocab_checker=lambda _a, _g: None,
+            embedding_checker=lambda _a, _g: None,
+        )
+
+        assert result.merged is True
+        assert len(seen) == 1
+        assert seen[0]["adapter_path"] == store.resolve_current_adapter()
+        assert seen[0]["was_qlora"] is False
+

 class TestDefaultVocabCheck:
     """Default path loads the adapter tokenizer-vocab and compares against the base GGUF."""
@@ -691,6 +741,54 @@ class TestMissingAdapter:
                 subprocess_runner=lambda _cmd: None,
             )

+    def test_missing_adapter_override_raises(self, tmp_path: Path) -> None:
+        cached_base, store, vendor = _setup_store(tmp_path)
+
+        with pytest.raises(ExportError, match="adapter_path_override .* does not exist"):
+            run_export(
+                store,
+                _SPEC,
+                ExportPlan(),
+                cached_base_dir=cached_base,
+                subprocess_runner=lambda _cmd: None,
+                vendor_override=vendor,
+                adapter_path_override=tmp_path / "missing",
+            )
+
+    def test_missing_named_adapter_raises(self, tmp_path: Path) -> None:
+        cached_base, store, vendor = _setup_store(tmp_path)
+
+        with pytest.raises(ExportError, match="run `dlm train` before exporting for adapter"):
+            run_export(
+                store,
+                _SPEC,
+                ExportPlan(),
+                cached_base_dir=cached_base,
+                subprocess_runner=lambda _cmd: None,
+                vendor_override=vendor,
+                adapter_name="knowledge",
+            )
+
+    def test_named_adapter_export_uses_named_pointer(self, tmp_path: Path) -> None:
+        cached_base, store, vendor = _setup_named_store(tmp_path)
+        recorder = _SubprocessRecorder(store.export_quant_dir("Q4_K_M"))
+
+        result = run_export(
+            store,
+            _SPEC,
+            ExportPlan(),
+            cached_base_dir=cached_base,
+            subprocess_runner=recorder,
+            vendor_override=vendor,
+            skip_ollama=True,
+            vocab_checker=lambda _a, _g: None,
+            embedding_checker=lambda _a, _g: None,
+            adapter_name="knowledge",
+        )
+
+        assert result.export_dir == store.export_quant_dir("Q4_K_M")
+        assert len(recorder.commands) == 3
+

 class TestManifestAppend:
     def test_exports_list_grows(self, tmp_path: Path) -> None:
@@ -751,3 +849,179 @@ class TestManifestAppend:
         # Peer released → no export summary landed (we errored before save).
         manifest = load_manifest(store.manifest)
         assert len(manifest.exports) == 0
+
+
+class TestRunnerInternals:
+    def test_cached_base_missing_manifest_is_false(self, tmp_path: Path) -> None:
+        from dlm.export.runner import _cached_base_matches
+
+        export_dir = tmp_path / "exports" / "Q4_K_M"
+        export_dir.mkdir(parents=True)
+        base_gguf = export_dir / "base.Q4_K_M.gguf"
+        base_gguf.write_bytes(b"cached bytes")
+
+        assert _cached_base_matches(export_dir, base_gguf, "Q4_K_M") is False
+
+    def test_cached_base_quant_mismatch_is_false(self, tmp_path: Path) -> None:
+        from dlm.export.manifest import ExportManifest
+        from dlm.export.runner import _cached_base_matches
+
+        export_dir = tmp_path / "exports" / "Q4_K_M"
+        export_dir.mkdir(parents=True)
+        base_gguf = export_dir / "base.Q4_K_M.gguf"
+        base_gguf.write_bytes(b"cached bytes")
+        manifest = ExportManifest(
+            target="ollama",
+            quant="Q5_K_M",
+            created_at=datetime(2026, 4, 23, 12, 0, 0),
+            created_by="dlm-test",
+            base_model_hf_id="org/base",
+            base_model_revision="a" * 40,
+            adapter_version=1,
+            artifacts=[],
+        )
+        (export_dir / "export_manifest.json").write_text(
+            manifest.model_dump_json(indent=2) + "\n",
+            encoding="utf-8",
+        )
+
+        assert _cached_base_matches(export_dir, base_gguf, "Q4_K_M") is False
+
+    def test_cached_base_without_recorded_artifact_is_false(self, tmp_path: Path) -> None:
+        from dlm.export.manifest import ExportManifest, build_artifact
+        from dlm.export.runner import _cached_base_matches
+
+        export_dir = tmp_path / "exports" / "Q4_K_M"
+        export_dir.mkdir(parents=True)
+        base_gguf = export_dir / "base.Q4_K_M.gguf"
+        other = export_dir / "other.gguf"
+        base_gguf.write_bytes(b"cached bytes")
+        other.write_bytes(b"other bytes")
+        manifest = ExportManifest(
+            target="ollama",
+            quant="Q4_K_M",
+            created_at=datetime(2026, 4, 23, 12, 0, 0),
+            created_by="dlm-test",
+            base_model_hf_id="org/base",
+            base_model_revision="a" * 40,
+            adapter_version=1,
+            artifacts=[build_artifact(export_dir, other)],
+        )
+        (export_dir / "export_manifest.json").write_text(
+            manifest.model_dump_json(indent=2) + "\n",
+            encoding="utf-8",
+        )
+
+        assert _cached_base_matches(export_dir, base_gguf, "Q4_K_M") is False
+
+    def test_cached_imatrix_without_existing_file_returns_none(self, tmp_path: Path) -> None:
+        from dlm.export.runner import _resolve_or_build_imatrix
+
+        cached_base, store, _vendor = _setup_store(tmp_path)
+        fp16 = tmp_path / "base.fp16.gguf"
+        fp16.write_bytes(b"fp16")
+
+        assert (
+            _resolve_or_build_imatrix(
+                export_dir=tmp_path,
+                fp16_path=fp16,
+                plan=ExportPlan(quant="Q4_K_M", imatrix="cached"),
+                run=lambda _cmd: None,
+                vendor_override=None,
+                spec=_SPEC,
+                store=store,
+            )
+            is None
+        )
+
+    def test_auto_imatrix_cache_hit_logs_and_returns_path(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch, caplog: pytest.LogCaptureFixture
+    ) -> None:
+        from types import SimpleNamespace
+
+        from dlm.export.runner import _resolve_or_build_imatrix
+
+        cached_base, store, _vendor = _setup_store(tmp_path)
+        fp16 = tmp_path / "base.fp16.gguf"
+        fp16.write_bytes(b"fp16")
+        imatrix = tmp_path / "imatrix.gguf"
+        imatrix.write_bytes(b"imatrix")
+
+        monkeypatch.setattr(
+            "dlm.export.imatrix.calibration_text_from_replay",
+            lambda **_kwargs: ("calibration text", "abc123"),
+        )
+        monkeypatch.setattr(
+            "dlm.export.imatrix.resolve_imatrix",
+            lambda *_args, **_kwargs: SimpleNamespace(path=imatrix, sha256="abcdef123456"),
+        )
+        caplog.set_level(logging.INFO, logger="dlm.export.runner")
+
+        resolved = _resolve_or_build_imatrix(
+            export_dir=tmp_path,
+            fp16_path=fp16,
+            plan=ExportPlan(quant="Q4_K_M", imatrix="auto"),
+            run=lambda _cmd: None,
+            vendor_override=None,
+            spec=_SPEC,
+            store=store,
+        )
+
+        assert resolved == imatrix
+        assert "imatrix: cache hit (" in caplog.text
+
+    def test_run_ollama_stage_records_detected_version(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        from dlm.export.runner import _run_ollama_stage
+
+        cached_base, store, _vendor = _setup_store(tmp_path)
+        export_dir = store.export_quant_dir("Q4_K_M")
+        export_dir.mkdir(parents=True, exist_ok=True)
+        base_gguf = export_dir / "base.Q4_K_M.gguf"
+        base_gguf.write_bytes(b"base")
+        adapter = store.resolve_current_adapter()
+        assert adapter is not None
+
+        monkeypatch.setattr("dlm.export.ollama.check_ollama_version", lambda: (1, 2, 3))
+        monkeypatch.setattr("dlm.export.draft_registry.resolve_draft", lambda *args, **kwargs: None)
+        monkeypatch.setattr(
+            "dlm.export.ollama.render_modelfile",
+            lambda _ctx: "FROM ./base.Q4_K_M.gguf\n",
+        )
+
+        seen: list[str] = []
+
+        def _create(*, name: str, modelfile_path: Path, cwd: Path) -> str:
+            seen.append(name)
+            assert modelfile_path.exists()
+            assert cwd == export_dir
+            return "created"
+
+        monkeypatch.setattr("dlm.export.ollama.ollama_create", _create)
+        monkeypatch.setattr("dlm.export.ollama.ollama_run", lambda **_kwargs: "unused")
+
+        modelfile_path, name, ver_str, smoke_first_line = _run_ollama_stage(
+            store=store,
+            spec=_SPEC,
+            plan=ExportPlan(quant="Q4_K_M"),
+            adapter_path=adapter,
+            export_dir=export_dir,
+            base_gguf_path=base_gguf,
+            adapter_version=1,
+            system_prompt=None,
+            source_dlm_path=None,
+            skip_smoke=True,
+            ollama_create_runner=None,
+            ollama_run_runner=None,
+            training_sequence_len=None,
+            override_temperature=None,
+            override_top_p=None,
+            draft_override=None,
+            draft_disabled=False,
+        )
+
+        assert modelfile_path.exists()
+        assert name == seen[0]
+        assert ver_str == "1.2.3"
+        assert smoke_first_line is None
tests/unit/export/test_smoke.py (modified)
33 lines changed
@@ -330,6 +330,26 @@ class TestChatCompletion:


 class TestSmokeHelpers:
+    def test_reserve_local_port_returns_loopback_port(
+        self, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        class _FakeSocket:
+            def __enter__(self) -> _FakeSocket:
+                return self
+
+            def __exit__(self, exc_type: object, exc: object, tb: object) -> None:
+                return None
+
+            def bind(self, address: tuple[str, int]) -> None:
+                assert address == ("127.0.0.1", 0)
+
+            def getsockname(self) -> tuple[str, int]:
+                return ("127.0.0.1", 43123)
+
+        monkeypatch.setattr(smoke_mod.socket, "socket", lambda *_args, **_kwargs: _FakeSocket())
+
+        assert smoke_mod.reserve_local_port() == 43123
+
     def test_normalize_message_content(self) -> None:
         assert smoke_mod._normalize_message_content("  hello  ") == "hello"
         assert (
@@ -338,6 +358,7 @@ class TestSmokeHelpers:
             )
             == "first\nsecond"
         )
+        assert smoke_mod._normalize_message_content([{"text": "first"}, "skip-me"]) == "first"
         assert smoke_mod._normalize_message_content([{"text": "   "}]) is None
         assert smoke_mod._normalize_message_content(3) is None
tests/unit/export/test_vendoring.py (modified)
49 lines changed
@@ -2,6 +2,7 @@

 from __future__ import annotations

+import errno
 from pathlib import Path

 import pytest
@@ -47,6 +48,19 @@ class TestLlamaCppRoot:
         root = _populate_vendor(tmp_path / "llama.cpp")
         assert llama_cpp_root(override=root) == root

+    def test_enumeration_failure_raises(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        root = _populate_vendor(tmp_path / "llama.cpp")
+
+        def _raise_iterdir() -> object:
+            raise OSError(errno.EIO, "boom")
+
+        monkeypatch.setattr(Path, "iterdir", lambda self: _raise_iterdir())
+
+        with pytest.raises(VendoringError, match="cannot enumerate"):
+            llama_cpp_root(override=root)
+

 class TestScriptResolvers:
     def test_convert_hf_resolves(self, tmp_path: Path) -> None:
@@ -100,6 +114,23 @@ class TestLlamaBinaries:
         with pytest.raises(VendoringError, match="llama-server"):
             llama_server_bin(override=root)

+    def test_path_lookup_returns_binary_when_vendor_missing(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        monkeypatch.setenv("PATH", str(tmp_path))
+        fake = tmp_path / "llama-quantize"
+        fake.write_text("#!/bin/sh\n", encoding="utf-8")
+        fake.chmod(0o755)
+        monkeypatch.setattr(
+            "shutil.which", lambda name: str(fake) if name == "llama-quantize" else None
+        )
+
+        path = llama_quantize_bin(
+            override=_populate_vendor(tmp_path / "llama.cpp", with_binary=False)
+        )
+
+        assert path == fake
+
     def test_dlm_llama_cpp_build_env_preferred(
         self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
     ) -> None:
tests/unit/export/test_vl_gguf.py (modified)
131 lines changed
@@ -19,9 +19,10 @@ from typing import Any
 
 import pytest
 
+import dlm.export.vl_gguf as vl_gguf
 from dlm.base_models.schema import BaseModelSpec, VlPreprocessorPlan
 from dlm.export.arch_probe import ArchProbeResult, SupportLevel
-from dlm.export.errors import VlGgufUnsupportedError
+from dlm.export.errors import ExportError, VlGgufUnsupportedError
 from dlm.export.plan import ExportPlan
 from dlm.export.vl_gguf import VlGgufResult, run_vl_gguf_export
 from dlm.store.paths import for_dlm
@@ -132,6 +133,38 @@ def _populate_adapter(store: Any, version: int = 1) -> Path:
     return adapter
 
 
+def _populate_named_adapter(store: Any, name: str, version: int = 1) -> Path:
+    """Write a minimally-valid named adapter checkpoint under `adapter/<name>/`."""
+    store.ensure_layout()
+    adapter: Path = store.adapter_version_for(name, version)
+    adapter.mkdir(parents=True, exist_ok=True)
+    (adapter / "adapter_config.json").write_text(
+        json.dumps(
+            {
+                "base_model_name_or_path": "Qwen/Qwen2-VL-2B-Instruct",
+                "target_modules": ["q_proj", "v_proj"],
+                "r": 16,
+            }
+        ),
+        encoding="utf-8",
+    )
+    (adapter / "tokenizer_config.json").write_text(
+        json.dumps(
+            {
+                "vocab_size": 151643,
+                "chat_template": "{{ 'hi' }}",
+            }
+        ),
+        encoding="utf-8",
+    )
+    (adapter / "training_run.json").write_text(
+        json.dumps({"use_qlora": False}),
+        encoding="utf-8",
+    )
+    store.set_current_adapter_for(name, adapter)
+    return adapter
+
+
 class TestRefusals:
     """Covers `_assert_supported` — the three preconditions + adapter gate."""
 
@@ -302,3 +335,82 @@ class TestHappyPath:
         paths = {a["path"] for a in manifest["artifacts"]}
         assert "base.Q4_K_M.gguf" in paths
         assert "Modelfile" in paths
+
+    def test_named_adapter_export_uses_named_current_pointer(self, tmp_path: Path) -> None:
+        store = for_dlm(_VALID_ULID, home=tmp_path)
+        flat = _populate_adapter(store, version=1)
+        named = _populate_named_adapter(store, "knowledge", version=2)
+        cached_base = tmp_path / "base-cache"
+        cached_base.mkdir()
+        llama_cpp_root = _fixture_llama_cpp_root(tmp_path)
+
+        merge_calls: list[tuple[Path, Path, Path]] = []
+
+        def _recorder(args: Any) -> None:
+            if args and args[0].endswith("llama-quantize"):
+                Path(args[2]).write_bytes(b"stub-gguf-bytes")
+
+        def _merge(adapter: Path, out_dir: Path, *, cached_base_dir: Path) -> None:
+            merge_calls.append((adapter, out_dir, cached_base_dir))
+            out_dir.mkdir(parents=True, exist_ok=True)
+
+        result = run_vl_gguf_export(
+            store,
+            _qwen2vl_spec(),
+            _merged_plan(),
+            verdict=_supported_verdict(),
+            cached_base_dir=cached_base,
+            adapter_name="knowledge",
+            subprocess_runner=_recorder,
+            merge_runner=_merge,
+            llama_cpp_root_override=llama_cpp_root,
+        )
+
+        assert len(merge_calls) == 1
+        assert merge_calls[0][0] == named
+        assert merge_calls[0][0] != flat
+        manifest = json.loads(result.manifest_path.read_text(encoding="utf-8"))
+        assert manifest["adapter_version"] == 2
+
+    def test_missing_quantize_output_raises(self, tmp_path: Path) -> None:
+        store = for_dlm(_VALID_ULID, home=tmp_path)
+        _populate_adapter(store)
+        cached_base = tmp_path / "base-cache"
+        cached_base.mkdir()
+        llama_cpp_root = _fixture_llama_cpp_root(tmp_path)
+
+        def _recorder(_args: Any) -> None:
+            return None
+
+        def _merge(_adapter: Path, out_dir: Path, *, cached_base_dir: Path) -> None:
+            out_dir.mkdir(parents=True, exist_ok=True)
+
+        with pytest.raises(ExportError, match="expected .*base.Q4_K_M.gguf"):
+            run_vl_gguf_export(
+                store,
+                _qwen2vl_spec(),
+                _merged_plan(),
+                verdict=_supported_verdict(),
+                cached_base_dir=cached_base,
+                subprocess_runner=_recorder,
+                merge_runner=_merge,
+                llama_cpp_root_override=llama_cpp_root,
+            )
+
+
+class TestHelpers:
+    def test_version_parser_falls_back_to_one_for_non_version_dir(self, tmp_path: Path) -> None:
+        assert vl_gguf._version_from_dir_name(tmp_path / "merged-adapter") == 1
+
+    def test_default_runner_delegates_to_run_checked(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        recorded: dict[str, object] = {}
+
+        def _fake_run_checked(args: list[str], *, timeout: int) -> object:
+            recorded["args"] = args
+            recorded["timeout"] = timeout
+            return "ok"
+
+        monkeypatch.setattr(vl_gguf, "run_checked", _fake_run_checked)
+        out = vl_gguf._default_runner(("python", "tool.py"))
+        assert out == "ok"
+        assert recorded == {"args": ["python", "tool.py"], "timeout": 60 * 60}
tests/unit/export/test_vl_snapshot.py (modified)
101 lines changed
@@ -12,6 +12,7 @@ Covers:
 
 from __future__ import annotations
 
+import json
 from pathlib import Path
 
 import pytest
@@ -96,6 +97,12 @@ class TestRefusals:
         with pytest.raises(ExportError, match="only vision-language bases"):
             run_vl_snapshot_export(populated_store, _text_spec())
 
+    def test_missing_vl_preprocessor_plan_refused(self, populated_store) -> None:
+        spec = _vl_spec()
+        object.__setattr__(spec, "vl_preprocessor_plan", None)
+        with pytest.raises(ExportError, match="no vl_preprocessor_plan"):
+            run_vl_snapshot_export(populated_store, spec)
+
     def test_missing_adapter_refused(self, tmp_path: Path) -> None:
         store = for_dlm(_VALID_ULID, home=tmp_path)
         store.ensure_layout()
@@ -132,6 +139,68 @@ class TestSnapshotLayout:
         result = run_vl_snapshot_export(populated_store, _vl_spec())
         assert (result.adapter_dir / "adapter_model.safetensors").read_bytes() == b"new bytes"
 
+    def test_named_adapter_export_uses_named_current_pointer(self, populated_store) -> None:
+        named = populated_store.adapter_version_for("knowledge", 7)
+        named.mkdir(parents=True, exist_ok=True)
+        (named / "adapter_config.json").write_text('{"r": 32}', encoding="utf-8")
+        (named / "adapter_model.safetensors").write_bytes(b"named bytes")
+        populated_store.set_current_adapter_for("knowledge", named)
+
+        result = run_vl_snapshot_export(
+            populated_store,
+            _vl_spec(),
+            adapter_name="knowledge",
+        )
+
+        assert (result.adapter_dir / "adapter_model.safetensors").read_bytes() == b"named bytes"
+        manifest = load_vl_snapshot_manifest(result.export_dir)
+        assert manifest.adapter_version == 7
+        assert manifest.adapter_name == "knowledge"
+
+    def test_adapter_override_uses_provided_dir(self, populated_store, tmp_path: Path) -> None:
+        override = tmp_path / "merged-adapter"
+        override.mkdir()
+        (override / "adapter_model.safetensors").write_bytes(b"override bytes")
+
+        result = run_vl_snapshot_export(
+            populated_store,
+            _vl_spec(),
+            adapter_path_override=override,
+        )
+
+        assert (result.adapter_dir / "adapter_model.safetensors").read_bytes() == b"override bytes"
+        manifest = load_vl_snapshot_manifest(result.export_dir)
+        assert manifest.adapter_version == 1
+
+    def test_missing_adapter_override_refused(self, populated_store, tmp_path: Path) -> None:
+        with pytest.raises(ExportError, match="adapter_path_override .* does not exist"):
+            run_vl_snapshot_export(
+                populated_store,
+                _vl_spec(),
+                adapter_path_override=tmp_path / "missing",
+            )
+
+    def test_processor_save_pretrained_writes_processor_artifact(self, populated_store) -> None:
+        class _Processor:
+            def save_pretrained(self, out_dir: str) -> None:
+                Path(out_dir, "processor_config.json").write_text("{}", encoding="utf-8")
+
+        result = run_vl_snapshot_export(populated_store, _vl_spec(), processor=_Processor())
+
+        assert (result.processor_dir / "processor_config.json").exists()
+        manifest = load_vl_snapshot_manifest(result.export_dir)
+        paths = {entry.path for entry in manifest.artifacts}
+        assert "processor/processor_config.json" in paths
+
+    def test_noncallable_processor_save_is_ignored(self, populated_store) -> None:
+        class _Processor:
+            save_pretrained = "not-callable"
+
+        result = run_vl_snapshot_export(populated_store, _vl_spec(), processor=_Processor())
+
+        assert result.processor_dir.exists()
+        assert not any(result.processor_dir.iterdir())
+
 
 class TestManifestContent:
     def test_export_target_is_hf_snapshot(self, populated_store) -> None:
@@ -203,6 +272,14 @@ class TestManifestLoadFailures:
         with pytest.raises(ExportManifestError, match="cannot parse"):
             load_vl_snapshot_manifest(tmp_path)
 
+    def test_invalid_shape_raises(self, tmp_path: Path) -> None:
+        (tmp_path / SNAPSHOT_MANIFEST_FILENAME).write_text(
+            json.dumps({"created_by": "dlm-test"}),
+            encoding="utf-8",
+        )
+        with pytest.raises(ExportManifestError, match="invalid shape"):
+            load_vl_snapshot_manifest(tmp_path)
+
 
 class TestManifestModelDirect:
     def test_frozen(self) -> None:
tests/unit/hardware/test_capabilities.py (modified)
88 lines changed
@@ -2,10 +2,13 @@
 
 from __future__ import annotations
 
+from types import SimpleNamespace
+from unittest.mock import patch
+
 import pytest
 
 from dlm.hardware.backend import Backend
-from dlm.hardware.capabilities import probe
+from dlm.hardware.capabilities import _accelerate_version, _rocm_arch_supports_bf16, probe
 from tests.fixtures.hardware_mocks import force_cpu, force_cuda, force_mps, force_rocm
 
 
@@ -30,6 +33,26 @@ class TestProbeCuda:
         # flash_attn gated on SM>=8.0 regardless of package availability
         assert caps.has_flash_attention is False
 
+    def test_cuda_sm_probe_failure_yields_unknown_sm(self) -> None:
+        with force_cuda():
+            with patch("torch.cuda.get_device_capability", side_effect=RuntimeError("boom")):
+                caps = probe()
+        assert caps.sm is None
+
+    def test_cuda_vram_probe_failure_yields_unknown_vram(self) -> None:
+        with force_cuda():
+            with patch("torch.cuda.mem_get_info", side_effect=RuntimeError("boom")):
+                caps = probe()
+        assert caps.vram_gb is None
+
+    def test_cuda_flash_attention_true_when_package_and_sm_supported(self) -> None:
+        with (
+            patch("dlm.hardware.capabilities._module_available", lambda name: name == "flash_attn"),
+            force_cuda(sm=(8, 0)),
+        ):
+            caps = probe()
+        assert caps.has_flash_attention is True
+
 
 class TestProbeRocm:
     def test_rocm_reports_hip_version(self) -> None:
@@ -41,6 +64,20 @@ class TestProbeRocm:
         assert caps.determinism_class == "best-effort"
         assert caps.has_flash_attention is False
 
+    def test_rocm_arch_probe_failure_yields_unknown_arch(self) -> None:
+        with force_rocm():
+            with patch("torch.cuda.get_device_properties", side_effect=RuntimeError("boom")):
+                caps = probe()
+        assert caps.rocm_arch is None
+
+    def test_rocm_arch_probe_missing_name_yields_unknown_arch(self) -> None:
+        with force_rocm():
+            with patch(
+                "torch.cuda.get_device_properties", return_value=SimpleNamespace(name="AMD")
+            ):
+                caps = probe()
+        assert caps.rocm_arch is None
+
 
 class TestProbeMps:
     def test_mps_caps(self) -> None:
@@ -54,6 +91,14 @@
         assert caps.determinism_class == "best-effort"
         assert caps.has_flash_attention is False
 
+    def test_mps_never_reports_flash_attention(self) -> None:
+        with (
+            patch("dlm.hardware.capabilities._module_available", lambda name: name == "flash_attn"),
+            force_mps(),
+        ):
+            caps = probe()
+        assert caps.has_flash_attention is False
+
 
 class TestMlxAvailability:
     def test_non_mps_never_reports_mlx(self) -> None:
@@ -133,3 +178,14 @@ class TestTelemetryPosture:
             caps = probe()
         assert caps.telemetry_posture["HF_HUB_DISABLE_TELEMETRY"] == "<unset>"
         assert caps.telemetry_posture["DO_NOT_TRACK"] == "<unset>"
+
+
+class TestCoverageEdges:
+    def test_rocm_arch_none_is_not_bf16_capable(self) -> None:
+        assert _rocm_arch_supports_bf16(None) is False
+
+    def test_accelerate_version_missing_returns_none(self) -> None:
+        from importlib.metadata import PackageNotFoundError
+
+        with patch("importlib.metadata.version", side_effect=PackageNotFoundError):
+            assert _accelerate_version() is None
tests/unit/hardware/test_plan.py (modified)
76 lines changed
@@ -2,9 +2,13 @@
 
 from __future__ import annotations
 
+from unittest.mock import patch
+
+import pytest
+
 from dlm.doc.schema import TrainingConfig
 from dlm.hardware.capabilities import probe
-from dlm.hardware.plan import resolve
+from dlm.hardware.plan import _build_reason, resolve
 from tests.fixtures.hardware_mocks import force_cpu, force_cuda, force_mps
 
 
@@ -102,6 +106,15 @@ class TestAttentionPicker:
         plan = resolve(_cfg(), caps, base_params=135_000_000, seq_len=1024)
         assert plan.attn_implementation == "sdpa"
 
+    def test_flash_attention_selected_when_available(self) -> None:
+        with (
+            patch("dlm.hardware.capabilities._module_available", lambda name: name == "flash_attn"),
+            force_cuda(sm=(8, 0)),
+        ):
+            caps = probe()
+        plan = resolve(_cfg(), caps, base_params=1_500_000_000, seq_len=2048)
+        assert plan.attn_implementation == "flash_attention_2"
+
 
 class TestQloraGating:
     def test_qlora_requested_on_cuda_without_bnb_raises(self) -> None:
@@ -170,6 +183,12 @@ class TestBatchAndGradAccumResolution:
         loose_plan = resolve(_cfg(), loose_caps, base_params=1_500_000_000, seq_len=2048)
         assert tight_plan.micro_batch_size <= loose_plan.micro_batch_size
 
+    def test_tiny_budget_breaks_auto_micro_batch_at_one(self) -> None:
+        with force_cuda(sm=(8, 0), vram_gb=2.0):
+            caps = probe()
+        plan = resolve(_cfg(), caps, base_params=3_000_000_000, seq_len=4096)
+        assert plan.micro_batch_size == 1
+
 
 class TestGradientCheckpointing:
     def test_enabled_when_memory_tight(self) -> None:
@@ -248,3 +267,35 @@ class TestPlanSerialization:
         plan = resolve(_cfg(), caps, base_params=1_500_000_000, seq_len=2048)
         assert "precision=bf16" in plan.reason
         assert "attn=" in plan.reason
+
+
+class TestResolverCoverageEdges:
+    def test_world_size_must_be_positive(self) -> None:
+        with force_cuda(sm=(8, 0)):
+            caps = probe()
+        with pytest.raises(ValueError, match="world_size must be >= 1"):
+            resolve(_cfg(), caps, base_params=135_000_000, seq_len=512, world_size=0)
+
+    def test_multi_gpu_refusals_checked_when_world_size_gt_one(self) -> None:
+        with force_cuda(sm=(8, 0)):
+            caps = probe()
+        with (
+            patch("dlm.hardware.plan.check_multi_gpu_refusals") as multi_gpu,
+            patch("dlm.hardware.plan.check_refusals"),
+        ):
+            resolve(_cfg(), caps, base_params=135_000_000, seq_len=512, world_size=2)
+        multi_gpu.assert_called_once_with(caps, 2)
+
+    def test_build_reason_records_dora_and_galore_warning(self) -> None:
+        reason = _build_reason(
+            "bf16",
+            "sdpa",
+            False,
+            True,
+            adapter="dora",
+            optimizer="galore_adamw",
+            base_params=500_000_000,
+        )
+        assert "adapter=dora" in reason
+        assert "optim=galore_adamw" in reason
+        assert "warn=galore-small-base(500M<1B)" in reason
tests/unit/harvest/test_sway_reader.py (modified)
18 lines changed
@@ -119,6 +119,18 @@ class TestHappyPath:
         assert len(candidates) == 1
         assert candidates[0].confidence == 1.0
 
+    def test_invalid_confidence_defaults_to_one(self, tmp_path: Path) -> None:
+        broken_conf = {**_PROBE_FAIL_WITH_REF}
+        broken_conf["evidence"] = {
+            "prompt": "q?",
+            "reference": "a.",
+            "confidence": {"not": "numeric"},
+        }
+        report = _write(tmp_path, _full_report([broken_conf]))
+        candidates = read_sway_report(report)
+        assert len(candidates) == 1
+        assert candidates[0].confidence == 1.0
+
 
 class TestMissingReference:
     def test_strict_raises(self, tmp_path: Path) -> None:
tests/unit/inference/test_mlx_backend.py (modified)
30 lines changed
@@ -10,7 +10,11 @@ from types import ModuleType, SimpleNamespace
 import pytest
 
 from dlm.base_models import BASE_MODELS
-from dlm.inference.backends.mlx_backend import MlxBackend, _resolve_base_num_hidden_layers
+from dlm.inference.backends.mlx_backend import (
+    MlxBackend,
+    _resolve_base_num_hidden_layers,
+    stage_mlx_adapter_dir,
+)
 from dlm.inference.errors import AdapterNotFoundError
 from dlm.inference.mlx_adapter import MlxConversionError
 
@@ -123,3 +127,18 @@
         assert backend._workdir is None
         assert backend._model is None
         assert backend._tokenizer is None
+
+
+class TestStageMlxAdapterDir:
+    def test_unreadable_adapter_config_raises_conversion_error(self, tmp_path: Path) -> None:
+        adapter_dir = tmp_path / "adapter"
+        adapter_dir.mkdir()
+        (adapter_dir / "adapter_model.safetensors").write_bytes(b"fake")
+        (adapter_dir / "adapter_config.json").mkdir()
+
+        with pytest.raises(MlxConversionError, match="cannot read .*adapter_config.json"):
+            stage_mlx_adapter_dir(
+                adapter_dir,
+                tmp_path / "staged",
+                base_hf_id=BASE_MODELS["smollm2-135m"].hf_id,
+            )
tests/unit/lock/test_mismatch_policy.py (modified)
13 lines changed
@@ -272,6 +272,13 @@ class TestLicenseAcceptanceRule:
         msgs = [msg for _s, msg in classify_mismatches(prior, current)]
         assert any("url changed" in m for m in msgs)
 
+    def test_equal_acceptance_is_silent(self) -> None:
+        acceptance = self._acceptance()
+        prior = _lock(license_acceptance=acceptance)
+        current = _lock(license_acceptance=acceptance)
+        msgs = [msg for _s, msg in classify_mismatches(prior, current)]
+        assert not any("license_acceptance" in m for m in msgs)
+
     def test_both_none_is_silent(self) -> None:
         prior = _lock(license_acceptance=None)
         current = _lock(license_acceptance=None)
tests/unit/metrics/test_queries.py (modified)
256 lines changed
@@ -2,15 +2,29 @@
 
 from __future__ import annotations
 
+import sqlite3
 from datetime import UTC, datetime, timedelta
 from pathlib import Path
 
-from dlm.metrics.events import EvalEvent, PreferenceMineEvent, RunEnd, RunStart, StepEvent
+import pytest
+
+from dlm.metrics.events import (
+    EvalEvent,
+    GateEvent,
+    PreferenceMineEvent,
+    RunEnd,
+    RunStart,
+    StepEvent,
+    TokenizationEvent,
+)
 from dlm.metrics.queries import (
     evals_for_run,
     evals_to_dict,
+    gate_events_for_run,
+    latest_gate_events,
     latest_preference_mining,
     latest_run_id,
+    latest_tokenization,
     preference_mining_for_run,
     preference_mining_to_dict,
     preference_mining_totals,
@@ -18,6 +32,7 @@ from dlm.metrics.queries import (
     runs_to_dict,
     steps_for_run,
     steps_to_dict,
+    tokenization_for_run,
 )
 from dlm.metrics.recorder import MetricsRecorder
 
@@ -31,6 +46,34 @@ def _seed(store_root: Path) -> None:
             rec.record_step(StepEvent(run_id=run_id, step=step, loss=2.0 - 0.1 * step))
         rec.record_eval(EvalEvent(run_id=run_id, step=30, val_loss=1.5))
         rec.record_run_end(RunEnd(run_id=run_id, status="ok"))
+    rec.record_tokenization(
+        TokenizationEvent(
+            run_id=3,
+            total_sections=10,
+            cache_hits=7,
+            cache_misses=3,
+            total_tokenize_seconds=0.75,
+            cache_bytes_after=4096,
+        )
+    )
+    rec.record_gate(
+        GateEvent(
+            run_id=2,
+            adapter_name="tone",
+            mean_weight=0.8,
+            sample_count=12,
+            mode="trained",
+        )
+    )
+    rec.record_gate(
+        GateEvent(
+            run_id=2,
+            adapter_name="facts",
+            mean_weight=0.2,
+            sample_count=12,
+            mode="trained",
+        )
+    )
     rec.record_preference_mine(
         PreferenceMineEvent(
             run_id=2,
@@ -124,6 +167,133 @@ class TestLatestRunId:
             pass
         assert latest_run_id(tmp_path) is None
 
+    def test_none_on_sqlite_error(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.metrics.queries as queries_mod
+
+        def _boom(_store_root: Path) -> sqlite3.Connection:
+            raise sqlite3.OperationalError("boom")
+
+        monkeypatch.setattr(queries_mod, "connect", _boom)
+        assert latest_run_id(tmp_path) is None
+
+
+class TestTokenizationQueries:
+    def test_tokenization_for_run_returns_row_with_hit_rate(self, tmp_path: Path) -> None:
+        _seed(tmp_path)
+        row = tokenization_for_run(tmp_path, run_id=3)
+        assert row is not None
+        assert row.cache_hits == 7
+        assert row.hit_rate == 0.7
+
+    def test_tokenization_for_run_none_when_table_has_no_row(self, tmp_path: Path) -> None:
+        from dlm.metrics.db import connect
+
+        with connect(tmp_path) as _conn:
+            pass
+        assert tokenization_for_run(tmp_path, run_id=3) is None
+
+    def test_hit_rate_zero_when_total_lookups_is_zero(self) -> None:
+        from dlm.metrics.queries import TokenizationRow
+
+        row = TokenizationRow(
+            run_id=1,
+            total_sections=0,
+            cache_hits=0,
+            cache_misses=0,
+            total_tokenize_seconds=0.0,
+            cache_bytes_after=0,
+            at="2026-01-01T00:00:00Z",
+        )
+        assert row.hit_rate == 0.0
+
+    def test_tokenization_for_run_none_on_sqlite_error(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.metrics.queries as queries_mod
+
+        def _boom(_store_root: Path) -> sqlite3.Connection:
+            raise sqlite3.OperationalError("boom")
+
+        monkeypatch.setattr(queries_mod, "connect", _boom)
+        assert tokenization_for_run(tmp_path, run_id=1) is None
+
+    def test_latest_tokenization_returns_most_recent_row(self, tmp_path: Path) -> None:
+        _seed(tmp_path)
+        row = latest_tokenization(tmp_path)
+        assert row is not None
+        assert row.run_id == 3
+
+    def test_latest_tokenization_none_when_empty(self, tmp_path: Path) -> None:
+        from dlm.metrics.db import connect
+
+        with connect(tmp_path) as _conn:
+            pass
+        assert latest_tokenization(tmp_path) is None
+
+    def test_latest_tokenization_none_on_sqlite_error(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.metrics.queries as queries_mod
+
+        def _boom(_store_root: Path) -> sqlite3.Connection:
+            raise sqlite3.OperationalError("boom")
+
+        monkeypatch.setattr(queries_mod, "connect", _boom)
+        assert latest_tokenization(tmp_path) is None
+
+
+class TestGateQueries:
+    def test_gate_events_for_run_returns_rows_sorted_by_adapter(self, tmp_path: Path) -> None:
+        _seed(tmp_path)
+        rows = gate_events_for_run(tmp_path, run_id=2)
+        assert [row.adapter_name for row in rows] == ["facts", "tone"]
+
+    def test_gate_events_for_run_returns_empty_on_sqlite_error(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.metrics.queries as queries_mod
+
+        def _boom(_store_root: Path) -> sqlite3.Connection:
+            raise sqlite3.OperationalError("boom")
+
+        monkeypatch.setattr(queries_mod, "connect", _boom)
+        assert gate_events_for_run(tmp_path, run_id=2) == []
+
+    def test_latest_gate_events_returns_latest_run_rows(self, tmp_path: Path) -> None:
+        _seed(tmp_path)
+        rows = latest_gate_events(tmp_path)
+        assert [row.adapter_name for row in rows] == ["facts", "tone"]
+
+    def test_latest_gate_events_empty_when_table_empty(self, tmp_path: Path) -> None:
+        from dlm.metrics.db import connect
+
+        with connect(tmp_path) as _conn:
+            pass
+        assert latest_gate_events(tmp_path) == []
+
+    def test_latest_gate_events_empty_on_sqlite_error(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.metrics.queries as queries_mod
+
+        def _boom(_store_root: Path) -> sqlite3.Connection:
+            raise sqlite3.OperationalError("boom")
+
+        monkeypatch.setattr(queries_mod, "connect", _boom)
+        assert latest_gate_events(tmp_path) == []
+
 
 class TestPreferenceMiningQueries:
     def test_preference_mining_for_run_returns_oldest_first(self, tmp_path: Path) -> None:
@@ -155,6 +325,52 @@ class TestPreferenceMiningQueries:
         assert totals.total_mined_pairs == 3
         assert totals.total_skipped_prompts == 3
 
+    def test_preference_mining_for_run_returns_empty_on_sqlite_error(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.metrics.queries as queries_mod
+
+        def _boom(_store_root: Path) -> sqlite3.Connection:
+            raise sqlite3.OperationalError("boom")
+
+        monkeypatch.setattr(queries_mod, "connect", _boom)
+        assert preference_mining_for_run(tmp_path, run_id=2) == []
+
+    def test_latest_preference_mining_returns_none_on_sqlite_error(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.metrics.queries as queries_mod
+
+        def _boom(_store_root: Path) -> sqlite3.Connection:
+            raise sqlite3.OperationalError("boom")
+
+        monkeypatch.setattr(queries_mod, "connect", _boom)
+        assert latest_preference_mining(tmp_path) is None
+
+    def test_preference_mining_totals_none_when_table_empty(self, tmp_path: Path) -> None:
+        from dlm.metrics.db import connect
+
+        with connect(tmp_path) as _conn:
+            pass
+        assert preference_mining_totals(tmp_path) is None
+
+    def test_preference_mining_totals_none_on_sqlite_error(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.metrics.queries as queries_mod
+
+        def _boom(_store_root: Path) -> sqlite3.Connection:
+            raise sqlite3.OperationalError("boom")
+
+        monkeypatch.setattr(queries_mod, "connect", _boom)
+        assert preference_mining_totals(tmp_path) is None
+
 
 class TestDictSerialization:
     def test_runs_to_dict_shape(self, tmp_path: Path) -> None:
tests/unit/metrics/test_recorder.pymodified
84 lines changed — click to load
@@ -7,6 +7,7 @@ import sqlite3
 from collections.abc import Iterator
 from contextlib import contextmanager
 from pathlib import Path
+from typing import Any
 
 import pytest
 
@@ -14,15 +15,17 @@ from dlm.metrics.db import metrics_db_path
 from dlm.metrics.events import (
     EvalEvent,
     ExportEvent,
+    GateEvent,
     PreferenceMineEvent,
     RunEnd,
     RunStart,
     StepEvent,
+    TokenizationEvent,
 )
-from dlm.metrics.recorder import DlmTrainerCallback, MetricsRecorder
+from dlm.metrics.recorder import DlmTrainerCallback, MetricsRecorder, _maybe_float
 
 
-def _select_all(db_path: Path, table: str) -> list[tuple]:
+def _select_all(db_path: Path, table: str) -> list[tuple[Any, ...]]:
     conn = sqlite3.connect(str(db_path))
     try:
         rows = conn.execute(f"SELECT * FROM {table} ORDER BY 1").fetchall()
@@ -108,6 +111,43 @@ class TestEvals:
         assert rows[0][2] == 1.8  # val_loss
 
 
+class TestTokenization:
+    def test_tokenization_written(self, tmp_path: Path) -> None:
+        rec = MetricsRecorder(tmp_path)
+        rec.record_run_start(RunStart(run_id=1, adapter_version=None, phase="sft", seed=0))
+        rec.record_tokenization(
+            TokenizationEvent(
+                run_id=1,
+                total_sections=4,
+                cache_hits=3,
+                cache_misses=1,
+                total_tokenize_seconds=0.25,
+                cache_bytes_after=1024,
+            )
+        )
+        rows = _select_all(metrics_db_path(tmp_path), "tokenization")
+        assert len(rows) == 1
+        assert rows[0][1:6] == (4, 3, 1, 0.25, 1024)
+
+
+class TestGateRecorder:
+    def test_gate_written(self, tmp_path: Path) -> None:
+        rec = MetricsRecorder(tmp_path)
+        rec.record_run_start(RunStart(run_id=1, adapter_version=None, phase="sft", seed=0))
+        rec.record_gate(
+            GateEvent(
+                run_id=1,
+                adapter_name="tone",
+                mean_weight=0.6,
+                sample_count=8,
+                mode="trained",
+            )
+        )
+        rows = _select_all(metrics_db_path(tmp_path), "gate_events")
+        assert len(rows) == 1
+        assert rows[0][1:5] == ("tone", 0.6, 8, "trained")
+
+
 class TestExports:
     def test_export_written(self, tmp_path: Path) -> None:
         rec = MetricsRecorder(tmp_path)
@@ -236,3 +276,15 @@ class TestTrainerCallbackCompatibility:
 
         with pytest.raises(AttributeError, match="not_a_callback"):
             _ = callback.not_a_callback
+
+
+class TestMaybeFloat:
+    def test_none_returns_none(self) -> None:
+        assert _maybe_float(None) is None
+
+    def test_numeric_values_parse(self) -> None:
+        assert _maybe_float(1.25) == 1.25
+        assert _maybe_float("2.5") == 2.5
+
+    def test_bad_value_returns_none(self) -> None:
+        assert _maybe_float("nope") is None
tests/unit/metrics/test_sinks.py (added)
@@ -0,0 +1,168 @@
+"""Optional observability sinks: TensorBoard + W&B."""
+
+from __future__ import annotations
+
+import sys
+from pathlib import Path
+from types import ModuleType
+from typing import Any
+
+import pytest
+
+from dlm.metrics.events import EvalEvent, StepEvent
+from dlm.metrics.sinks import (
+    TensorBoardSink,
+    WandbSink,
+    tensorboard_available,
+    wandb_available,
+)
+
+
+class _FakeWriter:
+    def __init__(self, *, log_dir: str) -> None:
+        self.log_dir = log_dir
+        self.scalars: list[tuple[str, float, int]] = []
+        self.flushed = False
+        self.closed = False
+
+    def add_scalar(self, name: str, value: float, step: int) -> None:
+        self.scalars.append((name, value, step))
+
+    def flush(self) -> None:
+        self.flushed = True
+
+    def close(self) -> None:
+        self.closed = True
+
+
+class _FakeRun:
+    def __init__(self) -> None:
+        self.logged: list[tuple[dict[str, float], int]] = []
+        self.finished = False
+
+    def log(self, payload: dict[str, float], *, step: int) -> None:
+        self.logged.append((payload, step))
+
+    def finish(self) -> None:
+        self.finished = True
+
+
+class TestAvailabilityProbes:
+    def test_tensorboard_available_true_when_spec_exists(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        monkeypatch.setattr(
+            "importlib.util.find_spec",
+            lambda name: object() if name == "tensorboard" else None,
+        )
+        assert tensorboard_available() is True
+
+    def test_tensorboard_available_false_when_spec_missing(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        monkeypatch.setattr("importlib.util.find_spec", lambda _name: None)
+        assert tensorboard_available() is False
+
+    def test_wandb_available_true_when_spec_exists(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        monkeypatch.setattr(
+            "importlib.util.find_spec",
+            lambda name: object() if name == "wandb" else None,
+        )
+        assert wandb_available() is True
+
+    def test_wandb_available_false_when_spec_missing(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        monkeypatch.setattr("importlib.util.find_spec", lambda _name: None)
+        assert wandb_available() is False
+
+
+class TestTensorBoardSink:
+    def test_constructor_raises_cleanly_when_tensorboard_missing(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        real_import = __import__
+
+        def _fake_import(name: str, *args: Any, **kwargs: Any) -> Any:
+            if name == "torch.utils.tensorboard":
+                raise ImportError("missing tensorboard")
+            return real_import(name, *args, **kwargs)
+
+        monkeypatch.setattr("builtins.__import__", _fake_import)
+        with pytest.raises(RuntimeError, match="requires `tensorboard`"):
+            TensorBoardSink(tmp_path, run_id=7)
+
+    def test_records_step_eval_and_close(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        fake_module = ModuleType("torch.utils.tensorboard")
+        fake_module.SummaryWriter = _FakeWriter  # type: ignore[attr-defined]
+        monkeypatch.setitem(sys.modules, "torch.utils.tensorboard", fake_module)
+
+        sink = TensorBoardSink(tmp_path, run_id=7)
+        sink.record_step(StepEvent(run_id=7, step=10, loss=1.2, lr=0.01, grad_norm=0.5))
+        sink.record_eval(EvalEvent(run_id=7, step=10, val_loss=0.9, perplexity=2.0))
+        sink.close()
+
+        writer = sink._writer
+        assert sink.log_dir == tmp_path / "tensorboard" / "run_0007"
+        assert writer.scalars == [
+            ("train/loss", 1.2, 10),
+            ("train/lr", 0.01, 10),
+            ("train/grad_norm", 0.5, 10),
+            ("eval/val_loss", 0.9, 10),
+            ("eval/perplexity", 2.0, 10),
+        ]
+        assert writer.flushed is True
+        assert writer.closed is True
+
+
+class TestWandbSink:
+    def test_constructor_raises_cleanly_when_wandb_missing(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        real_import = __import__
+
+        def _fake_import(name: str, *args: Any, **kwargs: Any) -> Any:
+            if name == "wandb":
+                raise ImportError("missing wandb")
+            return real_import(name, *args, **kwargs)
+
+        monkeypatch.setattr("builtins.__import__", _fake_import)
+        with pytest.raises(RuntimeError, match="requires `wandb`"):
+            WandbSink(tmp_path, run_id=9, project="dlm")
+
+    def test_records_payloads_and_close(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        fake_run = _FakeRun()
+        fake_wandb = ModuleType("wandb")
+        fake_wandb.init = lambda **_kwargs: fake_run  # type: ignore[attr-defined]
+        monkeypatch.setitem(sys.modules, "wandb", fake_wandb)
+
+        sink = WandbSink(tmp_path, run_id=9, project="dlm")
+        sink.record_step(StepEvent(run_id=9, step=3, loss=1.0, lr=0.02, grad_norm=0.4))
+        sink.record_eval(EvalEvent(run_id=9, step=3, val_loss=0.8, perplexity=1.5))
+        sink.record_step(StepEvent(run_id=9, step=4, loss=None, lr=None, grad_norm=None))
+        sink.record_eval(EvalEvent(run_id=9, step=4, val_loss=None, perplexity=None))
+        sink.close()
+
+        assert fake_run.logged == [
+            ({"train/loss": 1.0, "train/lr": 0.02, "train/grad_norm": 0.4}, 3),
+            ({"eval/val_loss": 0.8, "eval/perplexity": 1.5}, 3),
+        ]
+        assert fake_run.finished is True
tests/unit/modality/test_dispatch_modules.py (added)
@@ -0,0 +1,136 @@
+"""Direct coverage for modality dispatch wrapper modules."""
+
+from __future__ import annotations
+
+from types import SimpleNamespace
+from unittest.mock import patch
+
+import pytest
+
+from dlm.base_models import BaseModelSpec
+from dlm.modality.audio import AudioLanguageModality
+from dlm.modality.errors import UnknownModalityError
+from dlm.modality.registry import TextModality, _unknown, modality_for
+from dlm.modality.text import TextModality as ReexportedTextModality
+from dlm.modality.vl import VisionLanguageModality
+
+
+def _minimal_text_spec(*, modality: str = "text") -> BaseModelSpec:
+    return BaseModelSpec.model_validate(
+        {
+            "key": "demo-1b",
+            "hf_id": "org/demo-1b",
+            "revision": "0123456789abcdef0123456789abcdef01234567",
+            "architecture": "DemoForCausalLM",
+            "params": 1_000_000_000,
+            "target_modules": ["q_proj", "v_proj"],
+            "template": "chatml",
+            "gguf_arch": "demo",
+            "tokenizer_pre": "demo",
+            "license_spdx": "Apache-2.0",
+            "license_url": None,
+            "requires_acceptance": False,
+            "redistributable": True,
+            "size_gb_fp16": 2.0,
+            "context_length": 4096,
+            "recommended_seq_len": 2048,
+            "modality": modality,
+        }
+    )
+
+
+def test_text_module_reexports_text_modality() -> None:
+    assert ReexportedTextModality is TextModality
+
+
+def test_text_dispatch_defaults_are_noops() -> None:
+    dispatch = TextModality()
+
+    assert dispatch.load_processor(_minimal_text_spec()) is None
+    assert (
+        dispatch.dispatch_export(
+            store=object(),
+            spec=_minimal_text_spec(),
+            adapter_name=None,
+            quant=None,
+            merged=False,
+            adapter_mix_raw=None,
+        )
+        is None
+    )
+
+
+def test_unknown_error_contains_registration_hint() -> None:
+    err = _unknown("mystery")
+    assert isinstance(err, UnknownModalityError)
+    assert "Register a ModalityDispatch subclass" in str(err)
+
+
+def test_modality_for_unknown_modality_raises() -> None:
+    with pytest.raises(UnknownModalityError, match="mystery"):
+        modality_for(SimpleNamespace(modality="mystery"))
+
+
+def test_audio_modality_loads_processor_and_dispatches_export() -> None:
+    dispatch = AudioLanguageModality()
+    spec = SimpleNamespace()
+
+    with (
+        patch("dlm.train.loader.load_processor", return_value="processor") as load_processor,
+        patch("dlm.export.dispatch.dispatch_audio_export", return_value="audio-export") as export,
+    ):
+        processor = dispatch.load_processor(spec)
+        result = dispatch.dispatch_export(
+            store="store",
+            spec=spec,
+            adapter_name="adapter",
+            quant="q4_k_m",
+            merged=False,
+            adapter_mix_raw="named",
+        )
+
+    assert processor == "processor"
+    load_processor.assert_called_once_with(spec)
+    assert result == "audio-export"
+    export.assert_called_once_with(
+        store="store",
+        spec=spec,
+        adapter_name="adapter",
+        quant="q4_k_m",
+        merged=False,
+        adapter_mix_raw="named",
+    )
+
+
+def test_vl_modality_loads_processor_and_dispatches_export() -> None:
+    dispatch = VisionLanguageModality()
+    spec = SimpleNamespace()
+    context = {"emit": "gguf"}
+
+    with (
+        patch("dlm.train.loader.load_processor", return_value="processor") as load_processor,
+        patch("dlm.export.dispatch.dispatch_vl_export", return_value="vl-export") as export,
+    ):
+        processor = dispatch.load_processor(spec)
+        result = dispatch.dispatch_export(
+            store="store",
+            spec=spec,
+            adapter_name="adapter",
+            quant="q8_0",
+            merged=True,
+            adapter_mix_raw=None,
+            gguf_emission_context=context,
+        )
+
+    assert processor == "processor"
+    load_processor.assert_called_once_with(spec)
+    assert result == "vl-export"
+    export.assert_called_once_with(
+        store="store",
+        spec=spec,
+        adapter_name="adapter",
+        quant="q8_0",
+        merged=True,
+        adapter_mix_raw=None,
+        gguf_emission_context=context,
+    )
tests/unit/modality/test_vl_contract.py (added)
@@ -0,0 +1,72 @@
+"""Direct coverage for VL runtime contract guardrails."""
+
+from __future__ import annotations
+
+from types import SimpleNamespace
+
+import pytest
+
+from dlm.modality.errors import ProcessorContractError
+from dlm.modality.vl_contract import ensure_supported_vl_runtime, validate_loaded_vl_processor
+
+
+def test_ensure_supported_vl_runtime_is_noop_for_non_vl_specs() -> None:
+    ensure_supported_vl_runtime(
+        SimpleNamespace(modality="text", architecture="Anything", key="demo")
+    )
+
+
+def test_ensure_supported_vl_runtime_is_noop_for_supported_vl_architecture() -> None:
+    ensure_supported_vl_runtime(
+        SimpleNamespace(
+            modality="vision-language", architecture="Qwen2VLForConditionalGeneration", key="demo"
+        )
+    )
+
+
+def test_ensure_supported_vl_runtime_rejects_internvl_family() -> None:
+    with pytest.raises(ProcessorContractError, match="InternVL-family VL model"):
+        ensure_supported_vl_runtime(
+            SimpleNamespace(
+                modality="vision-language", architecture="InternVLChatModel", key="internvl"
+            )
+        )
+
+
+def test_validate_loaded_vl_processor_is_noop_for_non_vl_specs() -> None:
+    processor = object()
+    assert (
+        validate_loaded_vl_processor(
+            SimpleNamespace(modality="text", architecture="Demo", key="demo"), processor
+        )
+        is processor
+    )
+
+
+def test_validate_loaded_vl_processor_accepts_processor_with_image_processor() -> None:
+    processor = SimpleNamespace(image_processor=object())
+    assert (
+        validate_loaded_vl_processor(
+            SimpleNamespace(modality="vision-language", architecture="Demo", key="demo"),
+            processor,
+        )
+        is processor
+    )
+
+
+def test_validate_loaded_vl_processor_delegates_internvl_refusal() -> None:
+    with pytest.raises(ProcessorContractError, match="InternVL-family VL model"):
+        validate_loaded_vl_processor(
+            SimpleNamespace(
+                modality="vision-language", architecture="InternVLChatModel", key="internvl"
+            ),
+            SimpleNamespace(),
+        )
+
+
+def test_validate_loaded_vl_processor_rejects_missing_image_processor() -> None:
+    with pytest.raises(ProcessorContractError, match="without an `image_processor` attribute"):
+        validate_loaded_vl_processor(
+            SimpleNamespace(modality="vision-language", architecture="Demo", key="demo"),
+            SimpleNamespace(),
+        )
tests/unit/preference/test_cli_judge.py (modified)
@@ -2,6 +2,7 @@
 
 from __future__ import annotations
 
+import math
 import subprocess
 from pathlib import Path
 from unittest.mock import patch
@@ -11,11 +12,13 @@ import pytest
 from dlm.preference import (
     CliJudge,
     HfRewardModelJudge,
+    InvalidJudgeSpecError,
     JudgeInvocationError,
     JudgeUnavailableError,
     SwayJudge,
     build_judge,
 )
+from dlm.preference.judge import _combine_reasoning, _parse_cli_candidate_score
 
 
 def _proc(
@@ -33,6 +36,21 @@
 
 
 class TestCliJudge:
+    def test_blank_command_is_rejected(self) -> None:
+        with pytest.raises(InvalidJudgeSpecError, match="include a command"):
+            CliJudge("   ")
+
+    def test_empty_argv_after_split_is_rejected(self) -> None:
+        with (
+            patch("dlm.preference.judge.shlex.split", return_value=[]),
+            pytest.raises(InvalidJudgeSpecError, match="include a command"),
+        ):
+            CliJudge("judge-bin")
+
+    def test_non_positive_timeout_is_rejected(self) -> None:
+        with pytest.raises(ValueError, match="timeout must be > 0"):
+            CliJudge("judge-bin", timeout=0.0)
+
     def test_scores_pair_via_two_json_round_trips(self) -> None:
         seen_payloads: list[str] = []
 
@@ -114,6 +132,54 @@ class TestCliJudge:
         ):
             judge.score_pair("p", "a", "b")
 
+    def test_oserror_raises_unavailable_error(self) -> None:
+        judge = CliJudge("judge-bin")
+        with (
+            patch(
+                "dlm.preference.judge.subprocess.run",
+                side_effect=OSError("permission denied"),
+            ),
+            pytest.raises(JudgeUnavailableError, match="could not start"),
+        ):
+            judge.score_pair("p", "a", "b")
+
+
+class TestCliJudgeHelpers:
+    def test_empty_stdout_is_rejected(self) -> None:
+        with pytest.raises(JudgeInvocationError, match="empty stdout"):
+            _parse_cli_candidate_score("   ")
+
+    def test_json_must_be_object(self) -> None:
+        with pytest.raises(JudgeInvocationError, match="JSON object"):
+            _parse_cli_candidate_score('["not", "an", "object"]')
+
+    @pytest.mark.parametrize("score", [float("nan"), float("inf"), -float("inf")])
+    def test_score_must_be_finite(self, score: float) -> None:
+        rendered = "NaN" if math.isnan(score) else ("Infinity" if score > 0 else "-Infinity")
+        with pytest.raises(JudgeInvocationError, match="must be finite"):
+            _parse_cli_candidate_score(f'{{"score": {rendered}}}')
+
+    def test_reasoning_must_be_string_when_present(self) -> None:
+        with pytest.raises(JudgeInvocationError, match="must be a string"):
+            _parse_cli_candidate_score('{"score": 1.0, "reasoning": 7}')
+
+    @pytest.mark.parametrize(
+        ("left", "right", "expected"),
+        [
+            ("why a", None, "a: why a"),
+            (None, "why b", "b: why b"),
+            ("why a", "why b", "a: why a | b: why b"),
+            (None, None, None),
+        ],
+    )
+    def test_combine_reasoning_formats_present_parts(
+        self,
+        left: str | None,
+        right: str | None,
+        expected: str | None,
+    ) -> None:
+        assert _combine_reasoning(left, right) == expected
+
 
 class TestBuildJudge:
     def test_cli_ref_builds_concrete_cli_judge(self) -> None:
tests/unit/preference/test_hf_reward_judge.py (modified)
@@ -2,11 +2,26 @@
 
 from __future__ import annotations
 
+import builtins
 from collections import deque
+from types import SimpleNamespace
+from unittest.mock import patch
 
 import pytest
 
-from dlm.preference import HfRewardModelJudge, JudgeInvocationError
+from dlm.preference import (
+    HfRewardModelJudge,
+    InvalidJudgeSpecError,
+    JudgeInvocationError,
+    JudgeUnavailableError,
+)
+from dlm.preference.judge import (
+    _default_reward_loader,
+    _encode_reward_input,
+    _extract_reward_scalar,
+    _move_to_device,
+    _resolve_reward_device,
+)
 
 
 class FakeScalar:
@@ -37,14 +52,35 @@
         return self
 
 
+class FakeTensor:
+    def __init__(self) -> None:
+        self.device: str | None = None
+
+    def to(self, device: str) -> FakeTensor:
+        self.device = device
+        return self
+
+
 class FakeTokenizer:
-    def __init__(self, *, use_chat_template: bool = False) -> None:
+    def __init__(
+        self,
+        *,
+        use_chat_template: bool = False,
+        template_error: Exception | None = None,
+        template_returns_non_string: bool = False,
+    ) -> None:
         self.calls: list[tuple[str, tuple[object, ...], dict[str, object]]] = []
+        self._template_error = template_error
+        self._template_returns_non_string = template_returns_non_string
         if use_chat_template:
             self.chat_template = "fake-template"
 
     def apply_chat_template(self, messages: list[dict[str, str]], **kwargs: object) -> str:
         self.calls.append(("apply_chat_template", (messages,), dict(kwargs)))
+        if self._template_error is not None:
+            raise self._template_error
+        if self._template_returns_non_string:
+            return ""  # type: ignore[return-value]
         return f"templated::{messages[0]['content']}::{messages[1]['content']}"
 
     def __call__(self, *args: object, **kwargs: object) -> FakeBatch:
@@ -67,6 +103,30 @@
         return Output(self._logits.popleft())
 
 
+class FakeTorchScalarLogits:
+    def __init__(self, value: float) -> None:
+        self._value = value
+
+    def numel(self) -> int:
+        return 1
+
+    def item(self) -> float:
+        return self._value
+
+
+class FakePretrainedRewardModel:
+    def __init__(self) -> None:
+        self.device: str | None = None
+        self.eval_called = False
+
+    def to(self, device: str) -> FakePretrainedRewardModel:
+        self.device = device
+        return self
+
+    def eval(self) -> None:
+        self.eval_called = True
+
+
 def _loader_factory(tokenizer: FakeTokenizer, model: FakeModel):
     calls: list[tuple[str, str]] = []
 
@@ -80,6 +140,10 @@
 
 
 class TestHfRewardModelJudge:
+    def test_blank_selector_is_rejected(self) -> None:
+        with pytest.raises(InvalidJudgeSpecError, match="include a model id"):
+            HfRewardModelJudge("   ")
+
     def test_scores_pair_and_caches_loaded_bundle(self) -> None:
         tokenizer = FakeTokenizer()
         model = FakeModel([FakeLogits([0.2]), FakeLogits([0.9])])
@@ -142,3 +206,162 @@
         with pytest.raises(JudgeInvocationError, match="no `.logits`"):
            judge.score_pair("prompt", "a", "b")
         assert calls == [("reward/model", "cpu")]
+
+    def test_missing_torch_is_reported(self) -> None:
+        tokenizer = FakeTokenizer()
+        model = FakeModel([FakeLogits([0.2]), FakeLogits([0.1])])
+        _, loader = _loader_factory(tokenizer, model)
+        judge = HfRewardModelJudge("reward/model", device="cpu", loader=loader)
+        real_import = builtins.__import__
+
+        def fake_import(name: str, *args: object, **kwargs: object):
+            if name == "torch":
+                raise ImportError("no torch here")
+            return real_import(name, *args, **kwargs)
+
+        with (
+            patch("builtins.__import__", side_effect=fake_import),
+            pytest.raises(JudgeUnavailableError, match="requires torch"),
+        ):
+            judge.score_pair("prompt", "a", "b")
+
+    def test_default_loader_path_is_used_when_no_loader_is_supplied(self) -> None:
+        tokenizer = FakeTokenizer()
+        model = FakeModel([FakeLogits([0.7]), FakeLogits([0.1])])
+
+        def fake_default_loader(hf_id: str, device: str):
+            from dlm.preference.judge import _LoadedRewardJudge
+
+            assert hf_id == "reward/model"
+            assert device == "cpu"
+            return _LoadedRewardJudge(model=model, tokenizer=tokenizer, device=device)
+
+        judge = HfRewardModelJudge("reward/model", device="cpu")
+        with patch("dlm.preference.judge._default_reward_loader", side_effect=fake_default_loader):
+            score = judge.score_pair("prompt", "a", "b")
+
+        assert score.preferred == "a"
+
+
+class TestHfRewardHelpers:
+    def test_default_reward_loader_requires_transformers(self) -> None:
+        real_import = builtins.__import__
+
+        def fake_import(name: str, *args: object, **kwargs: object):
+            if name == "transformers":
+                raise ImportError("missing transformers")
+            return real_import(name, *args, **kwargs)
+
+        with (
+            patch("builtins.__import__", side_effect=fake_import),
+            pytest.raises(JudgeUnavailableError, match="requires transformers"),
+        ):
+            _default_reward_loader("reward/model", "cpu")
+
+    def test_default_reward_loader_moves_model_and_sets_eval(self) -> None:
+        model = FakePretrainedRewardModel()
+        tokenizer = FakeTokenizer()
+
+        class AutoModelForSequenceClassification:
+            @staticmethod
+            def from_pretrained(hf_id: str) -> FakePretrainedRewardModel:
+                assert hf_id == "reward/model"
+                return model
+
+        class AutoTokenizer:
+            @staticmethod
+            def from_pretrained(hf_id: str) -> FakeTokenizer:
+                assert hf_id == "reward/model"
+                return tokenizer
+
+        fake_transformers = SimpleNamespace(
+            AutoModelForSequenceClassification=AutoModelForSequenceClassification,
+            AutoTokenizer=AutoTokenizer,
+        )
+
+        with patch.dict("sys.modules", {"transformers": fake_transformers}):
+            loaded = _default_reward_loader("reward/model", "mps")
+
+        assert loaded.model is model
+        assert loaded.tokenizer is tokenizer
+        assert loaded.device == "mps"
+        assert model.device == "mps"
+        assert model.eval_called is True
+
+    def test_resolve_reward_device_respects_explicit_request(self) -> None:
+        assert _resolve_reward_device("cuda:3") == "cuda:3"
+
+    def test_resolve_reward_device_returns_cpu_when_torch_is_missing(self) -> None:
+        real_import = builtins.__import__
+
+        def fake_import(name: str, *args: object, **kwargs: object):
+            if name == "torch":
+                raise ImportError("no torch")
+            return real_import(name, *args, **kwargs)
+
+        with patch("builtins.__import__", side_effect=fake_import):
+            assert _resolve_reward_device("auto") == "cpu"
+
+    def test_resolve_reward_device_prefers_cuda_then_mps_then_cpu(self) -> None:
+        torch_cuda = SimpleNamespace(
+            cuda=SimpleNamespace(is_available=lambda: True),
+            backends=SimpleNamespace(mps=SimpleNamespace(is_available=lambda: True)),
+        )
+        torch_mps = SimpleNamespace(
+            cuda=SimpleNamespace(is_available=lambda: False),
+            backends=SimpleNamespace(mps=SimpleNamespace(is_available=lambda: True)),
+        )
+        torch_cpu = SimpleNamespace(
+            cuda=SimpleNamespace(is_available=lambda: False),
+            backends=SimpleNamespace(mps=SimpleNamespace(is_available=lambda: False)),
+        )
+
+        with patch.dict("sys.modules", {"torch": torch_cuda}):
+            assert _resolve_reward_device("auto") == "cuda"
+        with patch.dict("sys.modules", {"torch": torch_mps}):
+            assert _resolve_reward_device("auto") == "mps"
+        with patch.dict("sys.modules", {"torch": torch_cpu}):
+            assert _resolve_reward_device("auto") == "cpu"
+
+    def test_encode_reward_input_falls_back_when_template_raises(self) -> None:
+        tokenizer = FakeTokenizer(use_chat_template=True, template_error=RuntimeError("boom"))
+
+        encoded = _encode_reward_input(tokenizer, "prompt", "candidate")
+
+        assert isinstance(encoded, FakeBatch)
+        assert tokenizer.calls[-1][0] == "tokenizer"
+        assert tokenizer.calls[-1][1] == ("prompt",)
+        assert tokenizer.calls[-1][2]["text_pair"] == "candidate"
+
+    def test_encode_reward_input_falls_back_when_template_returns_non_string(self) -> None:
+        tokenizer = FakeTokenizer(use_chat_template=True, template_returns_non_string=True)
+
+        encoded = _encode_reward_input(tokenizer, "prompt", "candidate")
+
+        assert isinstance(encoded, FakeBatch)
+        assert tokenizer.calls[-1][0] == "tokenizer"
+
+    def test_move_to_device_moves_mapping_values(self) -> None:
+        tensor = FakeTensor()
+        payload = {"input_ids": tensor, "meta": "keep"}
+
+        moved = _move_to_device(payload, "mps")
+
+        assert moved["input_ids"] is tensor
+        assert tensor.device == "mps"
+        assert moved["meta"] == "keep"
+
+    def test_move_to_device_returns_unmodified_non_mapping_values(self) -> None:
+        value = object()
+        assert _move_to_device(value, "cpu") is value
+
+    def test_extract_reward_scalar_uses_item_fallback(self) -> None:
+        assert _extract_reward_scalar(FakeTorchScalarLogits(0.75)) == pytest.approx(0.75)
+
+    def test_extract_reward_scalar_rejects_unreadable_values(self) -> None:
+        class UnreadableLogits:
+            def numel(self) -> int:
+                return 1
+
+        with pytest.raises(JudgeInvocationError, match="unreadable scalar logit"):
+            _extract_reward_scalar(UnreadableLogits())
tests/unit/preference/test_mine_dedup.py (modified)
@@ -4,6 +4,8 @@ from __future__ import annotations

 from collections import deque

+import pytest
+
 from dlm.doc.parser import parse_text
 from dlm.preference import (
     PreferenceMineSkipReason,
@@ -11,6 +13,7 @@ from dlm.preference import (
     render_mine_plan,
 )
 from dlm.preference.judge import PairScore
+from dlm.preference.mine import _best_pair, _first_line, _resolve_pair, _unique_nonempty

 _FRONTMATTER = """---
 dlm_id: 01KPQ9X1000000000000000000
@@ -44,6 +47,20 @@ def _parsed(body: str):


 class TestBuildMinePlan:
+    def test_validates_numeric_limits(self) -> None:
+        parsed = _parsed("::instruction::\n### Q\nquestion?\n### A\nreference\n")
+        backend = StubBackend({"question?": ["one", "two"]})
+        judge = StubJudge({("question?", "one", "two"): PairScore(score_a=1.0, score_b=0.0)})
+
+        with pytest.raises(ValueError, match="samples must be >= 2"):
+            build_mine_plan(parsed, backend, judge, mined_run_id=1, samples=1)
+        with pytest.raises(ValueError, match="max_pairs must be >= 1"):
+            build_mine_plan(parsed, backend, judge, mined_run_id=1, samples=2, max_pairs=0)
+        with pytest.raises(ValueError, match="threshold must be >= 0.0"):
+            build_mine_plan(parsed, backend, judge, mined_run_id=1, samples=2, threshold=-0.1)
+        with pytest.raises(ValueError, match="max_new_tokens must be >= 1"):
+            build_mine_plan(parsed, backend, judge, mined_run_id=1, samples=2, max_new_tokens=0)
+
     def test_materializes_auto_mined_preference_section(self) -> None:
         parsed = _parsed("::instruction::\n### Q\nquestion?\n### A\nreference\n")
         backend = StubBackend({"question?": ["bad answer", "good answer"]})
@@ -192,3 +209,55 @@ class TestBuildMinePlan:
         assert plan.additions == ()
         assert len(plan.skipped) == 1
         assert plan.skipped[0].reason is PreferenceMineSkipReason.MALFORMED_INSTRUCTION
+
+    def test_stops_collecting_once_max_pairs_is_reached(self) -> None:
+        parsed = _parsed(
+            "::instruction::\n### Q\nquestion one?\n### A\nreference\n\n"
+            "::instruction::\n### Q\nquestion two?\n### A\nreference\n"
+        )
+        backend = StubBackend(
+            {
+                "question one?": ["bad one", "good one"],
+                "question two?": ["bad two", "good two"],
+            }
+        )
+        judge = StubJudge(
+            {
+                ("question one?", "bad one", "good one"): PairScore(score_a=0.1, score_b=0.9),
+                ("question two?", "bad two", "good two"): PairScore(score_a=0.1, score_b=0.9),
+            }
+        )
+
+        plan = build_mine_plan(parsed, backend, judge, mined_run_id=4, samples=2, max_pairs=1)
+
+        assert len(plan.additions) == 1
+        assert plan.additions[0].source.prompt == "question one?"
+
+    def test_insufficient_variety_is_reported(self) -> None:
+        parsed = _parsed("::instruction::\n### Q\nquestion?\n### A\nreference\n")
+        backend = StubBackend({"question?": [" same ", "", "same", "   "]})
+        judge = StubJudge({})
+
+        plan = build_mine_plan(parsed, backend, judge, mined_run_id=6, samples=4)
+
+        assert plan.additions == ()
+        assert len(plan.skipped) == 1
+        assert plan.skipped[0].reason is PreferenceMineSkipReason.INSUFFICIENT_VARIETY
+        assert "need at least 2 unique non-empty candidates" in plan.skipped[0].detail
+
+
+class TestMineHelpers:
+    def test_unique_nonempty_strips_blanks_and_duplicates(self) -> None:
+        assert _unique_nonempty(["", " alpha ", "alpha", "beta", "   "]) == ["alpha", "beta"]
+
+    def test_best_pair_skips_ties(self) -> None:
+        judge = StubJudge({("prompt", "a", "b"): PairScore(score_a=0.4, score_b=0.4)})
+
+        assert _best_pair("prompt", ["a", "b"], judge=judge) is None
+
+    def test_resolve_pair_returns_none_for_ties(self) -> None:
+        assert _resolve_pair("a", "b", PairScore(score_a=0.2, score_b=0.2)) is None
+
+    def test_first_line_truncates_long_text(self) -> None:
+        rendered = _first_line("x" * 90, max_chars=20)
+        assert rendered == ("x" * 19) + "…"
tests/unit/preference/test_pending.py (added, 199 lines changed)
@@ -0,0 +1,199 @@
+"""Tests for staged preference pending-plan helpers."""
+
+from __future__ import annotations
+
+import json
+from pathlib import Path
+
+import pytest
+
+from dlm.doc.sections import Section, SectionType
+from dlm.preference.pending import (
+    PendingPreferencePlanError,
+    _optional_float,
+    _optional_int,
+    _optional_str,
+    _section_from_payload,
+    clear_pending_plan,
+    load_pending_plan,
+    pending_plan_path,
+    save_pending_plan,
+)
+from dlm.store.paths import for_dlm
+
+_DLM_ID = "01KPQ9X1000000000000000000"
+
+
+def _mined_pref(
+    *,
+    prompt: str = "question?",
+    chosen: str = "better",
+    rejected: str = "worse",
+    run_id: int = 7,
+) -> Section:
+    body = f"### Prompt\n{prompt}\n### Chosen\n{chosen}\n### Rejected\n{rejected}"
+    return Section(
+        type=SectionType.PREFERENCE,
+        content=body,
+        start_line=12,
+        adapter="tone",
+        tags={"topic": "blas"},
+        auto_mined=True,
+        judge_name="sway:preference_judge",
+        judge_score_chosen=0.9,
+        judge_score_rejected=0.1,
+        mined_at="2026-04-23T20:00:00Z",
+        mined_run_id=run_id,
+    )
+
+
+def _image() -> Section:
+    return Section(
+        type=SectionType.IMAGE,
+        content="A DGEMM block diagram.",
+        media_path="diagram.png",
+        media_alt="DGEMM diagram",
+        media_blob_sha="ab" * 32,
+    )
+
+
+class TestPendingPlan:
+    def test_pending_path_round_trip_and_clear(self, tmp_path: Path) -> None:
+        home = tmp_path / "home"
+        source_path = tmp_path / "doc.dlm"
+        source_path.write_text("stub", encoding="utf-8")
+        store = for_dlm(_DLM_ID, home=home)
+
+        path = pending_plan_path(store)
+        assert path == home / "store" / _DLM_ID / "preference" / "pending.json"
+
+        saved = save_pending_plan(
+            store,
+            source_path=source_path,
+            sections=[_mined_pref(), _image()],
+        )
+        raw = json.loads(path.read_text(encoding="utf-8"))
+        loaded = load_pending_plan(store)
+
+        assert saved.source_path == source_path.resolve()
+        assert saved.created_at.endswith("Z")
+        assert raw["schema_version"] == 1
+        assert raw["source_path"] == str(source_path.resolve())
+        assert loaded == saved
+        assert clear_pending_plan(store) is True
+        assert clear_pending_plan(store) is False
+        assert load_pending_plan(store) is None
+
+    def test_load_returns_none_when_plan_absent(self, tmp_path: Path) -> None:
+        store = for_dlm(_DLM_ID, home=tmp_path / "home")
+
+        assert load_pending_plan(store) is None
+
+    def test_load_rejects_unreadable_plan(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        store = for_dlm(_DLM_ID, home=tmp_path / "home")
+        path = pending_plan_path(store)
+        path.parent.mkdir(parents=True, exist_ok=True)
+        path.write_text("{}", encoding="utf-8")
+
+        def _raise(_self: Path, *, encoding: str) -> str:
+            _ = encoding
+            raise OSError("boom")
+
+        monkeypatch.setattr(Path, "read_text", _raise)
+        with pytest.raises(
+            PendingPreferencePlanError, match="could not read staged preference plan"
+        ):
+            load_pending_plan(store)
+
+    @pytest.mark.parametrize(
+        ("payload", "message"),
+        [
+            (["not", "an", "object"], "must be a JSON object"),
+            ({"schema_version": 2}, "unsupported staged preference plan schema_version=2"),
+            (
+                {"schema_version": 1, "created_at": "2026-04-24T20:00:00Z", "sections": []},
+                "missing source_path",
+            ),
+            (
+                {"schema_version": 1, "source_path": "/tmp/doc.dlm", "sections": []},
+                "missing created_at",
+            ),
+            (
+                {
+                    "schema_version": 1,
+                    "source_path": "/tmp/doc.dlm",
+                    "created_at": "2026-04-24T20:00:00Z",
+                },
+                "missing sections",
+            ),
+            (
+                {
+                    "schema_version": 1,
+                    "source_path": "/tmp/doc.dlm",
+                    "created_at": "2026-04-24T20:00:00Z",
+                    "sections": [{"content": "oops"}],
+                },
+                "invalid section payload at index 0",
+            ),
+        ],
+    )
+    def test_load_rejects_invalid_payloads(
+        self, tmp_path: Path, payload: object, message: str
+    ) -> None:
+        store = for_dlm(_DLM_ID, home=tmp_path / "home")
+        path = pending_plan_path(store)
+        path.parent.mkdir(parents=True, exist_ok=True)
+        path.write_text(json.dumps(payload), encoding="utf-8")
+
+        with pytest.raises(PendingPreferencePlanError, match=message):
+            load_pending_plan(store)
+
+    def test_load_rejects_invalid_json(self, tmp_path: Path) -> None:
+        store = for_dlm(_DLM_ID, home=tmp_path / "home")
+        path = pending_plan_path(store)
+        path.parent.mkdir(parents=True, exist_ok=True)
+        path.write_text("{not json", encoding="utf-8")
+
+        with pytest.raises(
+            PendingPreferencePlanError, match="staged preference plan is not valid JSON"
+        ):
+            load_pending_plan(store)
+
+
+class TestPendingPayloadHelpers:
+    def test_section_from_payload_validates_tags_and_optional_types(self) -> None:
+        with pytest.raises(TypeError, match="expected object, got list"):
+            _section_from_payload([])
+
+        with pytest.raises(TypeError, match="tags must be an object"):
+            _section_from_payload({"type": "preference", "content": "x", "tags": []})
+
+        with pytest.raises(TypeError, match="tags keys and values must be strings"):
+            _section_from_payload({"type": "preference", "content": "x", "tags": {"topic": 1}})
+
+        with pytest.raises(TypeError, match="expected float or null"):
+            _section_from_payload(
+                {"type": "preference", "content": "x", "judge_score_chosen": True}
+            )
+
+        with pytest.raises(TypeError, match="expected int or null"):
+            _section_from_payload({"type": "preference", "content": "x", "mined_run_id": True})
+
+    def test_optional_helpers_accept_none_and_reject_wrong_types(self) -> None:
+        assert _optional_str(None) is None
+        assert _optional_str("ok") == "ok"
+        assert _optional_float(None) is None
+        assert _optional_float(1) == 1.0
+        assert _optional_int(None) is None
+        assert _optional_int(7) == 7
+
+        with pytest.raises(TypeError, match="expected string or null"):
+            _optional_str(7)
+
+        with pytest.raises(TypeError, match="expected float or null"):
+            _optional_float(True)
+
+        with pytest.raises(TypeError, match="expected int or null"):
+            _optional_int(True)
tests/unit/preference/test_sway_bridge.py (added, 262 lines changed)
@@ -0,0 +1,262 @@
+"""Direct helper coverage for sway-backed preference judge wiring."""
+
+from __future__ import annotations
+
+import builtins
+import importlib
+import sys
+from pathlib import Path
+from types import SimpleNamespace
+from unittest.mock import patch
+
+import pytest
+
+from dlm.preference import JudgeUnavailableError
+from dlm.preference.judge import (
+    _build_sway_backend,
+    _import_sway_bridge,
+    _resolve_sway_trust_remote_code,
+)
+
+
+class FakeSwayError(Exception):
+    pass
+
+
+class FakeModelSpec:
+    def __init__(self, **kwargs: object) -> None:
+        self.kwargs = kwargs
+
+
+class FakeSysPath(list[str]):
+    def __init__(self) -> None:
+        super().__init__()
+        self.inserted: list[str] = []
+
+    def insert(self, index: int, value: str) -> None:  # type: ignore[override]
+        self.inserted.append(value)
+        super().insert(index, value)
+
+
+def test_build_sway_backend_requires_importable_bridge() -> None:
+    with (
+        patch("dlm.preference.judge._import_sway_bridge", side_effect=ImportError("missing")),
+        pytest.raises(JudgeUnavailableError, match="requires the sway bridge"),
+    ):
+        _build_sway_backend(Path("/tmp/example.dlm"))
+
+
+def test_build_sway_backend_wraps_sway_resolution_errors() -> None:
+    def resolve_dlm(_path: Path) -> object:
+        raise FakeSwayError("no store")
+
+    with (
+        patch(
+            "dlm.preference.judge._import_sway_bridge",
+            return_value=(resolve_dlm, object(), FakeModelSpec, FakeSwayError),
+        ),
+        pytest.raises(JudgeUnavailableError, match="could not resolve"),
+    ):
+        _build_sway_backend(Path("/tmp/example.dlm"))
+
+
+def test_build_sway_backend_wraps_generic_resolution_errors() -> None:
+    def resolve_dlm(_path: Path) -> object:
+        raise RuntimeError("boom")
+
+    with (
+        patch(
+            "dlm.preference.judge._import_sway_bridge",
+            return_value=(resolve_dlm, object(), FakeModelSpec, FakeSwayError),
+        ),
+        pytest.raises(JudgeUnavailableError, match="could not resolve"),
+    ):
+        _build_sway_backend(Path("/tmp/example.dlm"))
+
+
+def test_build_sway_backend_requires_trained_adapter() -> None:
+    handle = SimpleNamespace(adapter_path=None, base_model="base/model")
+
+    def resolve_dlm(_path: Path) -> object:
+        return handle
+
+    with (
+        patch(
+            "dlm.preference.judge._import_sway_bridge",
+            return_value=(resolve_dlm, object(), FakeModelSpec, FakeSwayError),
+        ),
+        pytest.raises(JudgeUnavailableError, match="requires a trained adapter"),
+    ):
+        _build_sway_backend(Path("/tmp/example.dlm"))
+
+
+def test_build_sway_backend_wraps_backend_load_errors() -> None:
+    handle = SimpleNamespace(adapter_path=Path("/tmp/adapter"), base_model="base/model")
+
+    def resolve_dlm(_path: Path) -> object:
+        return handle
+
+    def build_backend(_spec: FakeModelSpec, *, adapter_path: Path) -> object:
+        assert adapter_path == handle.adapter_path
+        raise RuntimeError("backend blew up")
+
+    with (
+        patch(
+            "dlm.preference.judge._import_sway_bridge",
+            return_value=(resolve_dlm, build_backend, FakeModelSpec, FakeSwayError),
+        ),
+        patch("dlm.preference.judge._resolve_sway_trust_remote_code", return_value=False),
+        pytest.raises(JudgeUnavailableError, match="could not load backend"),
+    ):
+        _build_sway_backend(Path("/tmp/example.dlm"))
+
+
+def test_build_sway_backend_builds_model_spec_with_trust_remote_code() -> None:
+    handle = SimpleNamespace(adapter_path=Path("/tmp/adapter"), base_model="base/model")
+    seen: dict[str, object] = {}
+
+    def resolve_dlm(_path: Path) -> object:
+        return handle
+
+    def build_backend(spec: FakeModelSpec, *, adapter_path: Path) -> object:
+        seen["spec"] = spec
+        seen["adapter_path"] = adapter_path
+        return "backend"
+
+    with (
+        patch(
+            "dlm.preference.judge._import_sway_bridge",
+            return_value=(resolve_dlm, build_backend, FakeModelSpec, FakeSwayError),
+        ),
+        patch("dlm.preference.judge._resolve_sway_trust_remote_code", return_value=True),
+    ):
+        backend = _build_sway_backend(Path("/tmp/example.dlm"))
+
+    assert backend == "backend"
+    spec = seen["spec"]
+    assert isinstance(spec, FakeModelSpec)
+    assert spec.kwargs == {
+        "kind": "hf",
+        "base": "base/model",
+        "adapter": handle.adapter_path,
+        "trust_remote_code": True,
+    }
+    assert seen["adapter_path"] == handle.adapter_path
+
+
+def test_import_sway_bridge_loads_modules_directly(monkeypatch: pytest.MonkeyPatch) -> None:
+    modules = {
+        "dlm_sway.backends": SimpleNamespace(build="build-backend"),
+        "dlm_sway.core.errors": SimpleNamespace(SwayError=FakeSwayError),
+        "dlm_sway.core.model": SimpleNamespace(ModelSpec=FakeModelSpec),
+        "dlm_sway.integrations.dlm.resolver": SimpleNamespace(resolve_dlm="resolve-dlm"),
+    }
+
+    def fake_import_module(name: str) -> object:
+        return modules[name]
+
+    monkeypatch.setattr(importlib, "import_module", fake_import_module)
+    resolve_dlm, build_backend, model_spec, sway_error = _import_sway_bridge()
+
+    assert resolve_dlm == "resolve-dlm"
+    assert build_backend == "build-backend"
+    assert model_spec is FakeModelSpec
+    assert sway_error is FakeSwayError
+
+
+def test_import_sway_bridge_falls_back_to_local_src_path(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    modules = {
+        "dlm_sway.backends": SimpleNamespace(build="build-backend"),
+        "dlm_sway.core.errors": SimpleNamespace(SwayError=FakeSwayError),
+        "dlm_sway.core.model": SimpleNamespace(ModelSpec=FakeModelSpec),
+        "dlm_sway.integrations.dlm.resolver": SimpleNamespace(resolve_dlm="resolve-dlm"),
+    }
+    calls = {"count": 0}
+
+    def fake_import_module(name: str) -> object:
+        calls["count"] += 1
+        if calls["count"] == 1:
+            raise ImportError("first import fails")
+        return modules[name]
+
+    fake_sys_path = FakeSysPath()
+
+    monkeypatch.setattr(importlib, "import_module", fake_import_module)
+    monkeypatch.setattr(Path, "exists", lambda self: True)
+    monkeypatch.setattr(sys, "path", fake_sys_path)
+    resolve_dlm, build_backend, model_spec, sway_error = _import_sway_bridge()
+
+    assert resolve_dlm == "resolve-dlm"
+    assert build_backend == "build-backend"
+    assert model_spec is FakeModelSpec
+    assert sway_error is FakeSwayError
+    assert fake_sys_path.inserted
+    assert fake_sys_path.inserted[0].endswith("/sway/src")
+
+
+def test_resolve_sway_trust_remote_code_returns_false_when_imports_are_missing() -> None:
+    real_import = builtins.__import__
+
+    def fake_import(name: str, *args: object, **kwargs: object):
+        if name in {"dlm.base_models", "dlm.doc.parser"}:
+            raise ImportError("missing")
+        return real_import(name, *args, **kwargs)
+
+    with patch("builtins.__import__", side_effect=fake_import):
+        assert _resolve_sway_trust_remote_code(Path("/tmp/example.dlm")) is False
+
+
+def test_resolve_sway_trust_remote_code_handles_parse_and_resolve_failures() -> None:
+    fake_doc_parser = SimpleNamespace(
+        parse_file=lambda _path: (_ for _ in ()).throw(RuntimeError("bad"))
+    )
+    fake_base_models = SimpleNamespace(resolve=lambda *_args, **_kwargs: object())
+
+    with patch.dict(
+        "sys.modules",
+        {"dlm.doc.parser": fake_doc_parser, "dlm.base_models": fake_base_models},
+    ):
+        assert _resolve_sway_trust_remote_code(Path("/tmp/example.dlm")) is False
+
+    parsed = SimpleNamespace(frontmatter=SimpleNamespace(base_model="custom-base"))
+    fake_doc_parser = SimpleNamespace(parse_file=lambda _path: parsed)
+    fake_base_models = SimpleNamespace(
+        resolve=lambda *_args, **_kwargs: (_ for _ in ()).throw(RuntimeError("no base"))
+    )
+
+    with patch.dict(
+        "sys.modules",
+        {"dlm.doc.parser": fake_doc_parser, "dlm.base_models": fake_base_models},
+    ):
+        assert _resolve_sway_trust_remote_code(Path("/tmp/example.dlm")) is False
+
+
+@pytest.mark.parametrize("base_model", ["", "hf:org/model"])
+def test_resolve_sway_trust_remote_code_short_circuits_for_non_registry_models(
+    base_model: str,
+) -> None:
+    parsed = SimpleNamespace(frontmatter=SimpleNamespace(base_model=base_model))
+    fake_doc_parser = SimpleNamespace(parse_file=lambda _path: parsed)
+    fake_base_models = SimpleNamespace(resolve=lambda *_args, **_kwargs: object())
+
+    with patch.dict(
+        "sys.modules",
+        {"dlm.doc.parser": fake_doc_parser, "dlm.base_models": fake_base_models},
+    ):
+        assert _resolve_sway_trust_remote_code(Path("/tmp/example.dlm")) is False
+
+
+def test_resolve_sway_trust_remote_code_returns_spec_flag() -> None:
+    parsed = SimpleNamespace(frontmatter=SimpleNamespace(base_model="qwen3-1.7b"))
+    fake_doc_parser = SimpleNamespace(parse_file=lambda _path: parsed)
+    fake_base_models = SimpleNamespace(
+        resolve=lambda *_args, **_kwargs: SimpleNamespace(trust_remote_code=True)
+    )

+    with patch.dict(
+        "sys.modules",
+        {"dlm.doc.parser": fake_doc_parser, "dlm.base_models": fake_base_models},
+    ):
+        assert _resolve_sway_trust_remote_code(Path("/tmp/example.dlm")) is True
tests/unit/repl/test_app_helpers.py (added, 10 lines changed)
@@ -0,0 +1,10 @@
+"""Direct coverage for small non-interactive REPL helpers."""
+
+from __future__ import annotations
+
+from dlm.repl.app import _format_prompt
+
+
+def test_format_prompt_handles_empty_and_existing_history() -> None:
+    assert _format_prompt([]) == "> "
+    assert _format_prompt([object(), object(), object(), object()]) == "[2] > "
tests/unit/repl/test_commands.py (modified, 19 lines changed)
@@ -7,7 +7,7 @@ from unittest.mock import MagicMock

 import pytest

-from dlm.repl.commands import Action, is_command, parse_and_dispatch
+from dlm.repl.commands import Action, _truncate, is_command, parse_and_dispatch
 from dlm.repl.errors import BadCommandArgumentError, UnknownCommandError
 from dlm.repl.session import ReplSession

@@ -166,6 +166,11 @@ class TestHelp:
             assert cmd in result.message


+class TestHelpers:
+    def test_truncate_adds_ellipsis_for_long_lines(self) -> None:
+        assert _truncate("x" * 20, 10) == "x" * 9 + "…"
+
+
 class TestUnknownCommand:
     def test_unknown_slash_raises(self) -> None:
         with pytest.raises(UnknownCommandError, match="/bogus"):
tests/unit/repl/test_streaming.py (added, 64 lines changed)
@@ -0,0 +1,64 @@
+"""Direct unit coverage for REPL streaming helpers."""
+
+from __future__ import annotations
+
+from types import SimpleNamespace
+from unittest.mock import patch
+
+from dlm.repl.streaming import CaptureStreamer, build_streamer, concatenate_tokens, should_stream
+
+
+def test_should_stream_tracks_stdout_tty_state() -> None:
+    with patch("sys.stdout", new=SimpleNamespace(isatty=lambda: True)):
+        assert should_stream() is True
+    with patch("sys.stdout", new=SimpleNamespace(isatty=lambda: False)):
+        assert should_stream() is False
+
+
+def test_should_stream_handles_broken_stdout() -> None:
+    class MissingIsAtty:
+        pass
+
+    class RaisesValueError:
+        @staticmethod
+        def isatty() -> bool:
+            raise ValueError("closed")
+
+    with patch("sys.stdout", new=MissingIsAtty()):
+        assert should_stream() is False
+    with patch("sys.stdout", new=RaisesValueError()):
+        assert should_stream() is False
+
+
+def test_capture_streamer_is_noop_and_keeps_text_buffer() -> None:
+    streamer = CaptureStreamer()
+    streamer.put(["ignored"])
+    streamer.end()
+    assert streamer.text == ""
+
+
+def test_build_streamer_returns_capture_streamer_when_disabled() -> None:
+    assert isinstance(build_streamer(object(), stream_to_stdout=False), CaptureStreamer)
+
+
+def test_build_streamer_wraps_transformers_text_streamer() -> None:
+    calls: list[tuple[object, bool, bool]] = []
+
+    class FakeTextStreamer:
+        def __init__(
+            self, tokenizer: object, *, skip_prompt: bool, skip_special_tokens: bool
+        ) -> None:
+            calls.append((tokenizer, skip_prompt, skip_special_tokens))
+
+    fake_transformers = SimpleNamespace(TextStreamer=FakeTextStreamer)
+    tokenizer = object()
+
+    with patch.dict("sys.modules", {"transformers": fake_transformers}):
+        streamer = build_streamer(tokenizer, stream_to_stdout=True)
+
+    assert isinstance(streamer, FakeTextStreamer)
+    assert calls == [(tokenizer, True, True)]
+
+
+def test_concatenate_tokens_joins_token_pieces() -> None:
+    assert concatenate_tokens(["hello", " ", "world"]) == "hello world"
tests/unit/replay/test_corpus.py (modified, 27 lines changed)
@@ -8,6 +8,7 @@ from pathlib import Path

 import pytest

+import dlm.replay.corpus as replay_corpus
 from dlm.replay.corpus import _encode_frame, append_snapshot, iter_snapshots, read_chunk
 from dlm.replay.errors import CorpusCorruptError
 from dlm.replay.models import SectionSnapshot
@@ -89,6 +90,20 @@ class TestCorruption:
         with pytest.raises(CorpusCorruptError):
             read_chunk(corpus, byte_offset=0, length=len(frame))

+    def test_cbor_value_error_is_wrapped(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        frame = _encode_frame(_snap("a" * 16, "hello"))
+        corpus = tmp_path / "corpus.zst"
+        corpus.write_bytes(frame)
+
+        def _boom(_payload: bytes) -> object:
+            raise ValueError("bad semantic tag")
+
+        monkeypatch.setattr(replay_corpus.cbor2, "loads", _boom)
+        with pytest.raises(CorpusCorruptError, match="CBOR decode failed"):
+            read_chunk(corpus, byte_offset=0, length=len(frame))
+
     def test_iter_short_read_raises(self, tmp_path: Path) -> None:
         """iter_snapshots also guards against truncated entries."""
         from dlm.replay.models import IndexEntry
tests/unit/replay/test_sampler.py (modified, 36 lines changed)
@@ -9,7 +9,7 @@ import pytest

 from dlm.replay.errors import SamplerError
 from dlm.replay.models import IndexEntry
-from dlm.replay.sampler import sample
+from dlm.replay.sampler import _weighted_reservoir, sample

 _NOW = datetime(2026, 4, 18)

@@ -113,3 +113,28 @@ class TestStableOrdering:
         p1 = sample(entries_a, k=5, now=_NOW, rng=random.Random(7), scheme="uniform")
         p2 = sample(entries_b, k=5, now=_NOW, rng=random.Random(7), scheme="uniform")
         assert [e.section_id for e in p1] == [e.section_id for e in p2]
+
+
+class TestReservoirEdgeCases:
+    def test_zero_random_draw_retries_and_falls_back_to_tiny_positive(self) -> None:
+        entries = _entries(2)
+
+        class _ZeroThenHalfRng:
+            def __init__(self) -> None:
+                self._values = iter([0.0, 0.0, 0.5, 0.5])
+
+            def random(self) -> float:
+                return next(self._values)
+
+        picked = sample(entries, k=1, now=_NOW, rng=_ZeroThenHalfRng(), scheme="uniform")
+        assert len(picked) == 1
+
+    def test_nonpositive_weight_entries_are_skipped(self) -> None:
+        entries = _entries(3)
+        picked = _weighted_reservoir(
+            entries,
+            weights=[1.0, 0.0, -1.0],
+            k=3,
+            rng=random.Random(0),
+        )
+        assert [entry.section_id for entry in picked] == [entries[0].section_id]
tests/unit/share/test_hf_sink.py (modified, 27 lines changed)
@@ -152,6 +152,27 @@ class TestPushHf:
         with pytest.raises(SinkError, match="upload failed"):
             push_hf(pack, "user/myadapter")

+    def test_readme_upload_failure_translates_to_sink_error(
+        self,
+        pack: Path,
+        patched_hub: dict[str, list[dict[str, object]]],
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import huggingface_hub
+
+        calls = {"count": 0}
+
+        def _boom_on_second_upload(**kwargs: object) -> str:
+            calls["count"] += 1
+            if calls["count"] == 2:
+                raise _FakeHfHubHTTPError("readme denied")
+            return f"https://huggingface.co/{kwargs['repo_id']}/blob/main/{kwargs['path_in_repo']}"
+
+        monkeypatch.setattr(huggingface_hub, "upload_file", _boom_on_second_upload, raising=False)
+
+        with pytest.raises(SinkError, match="README upload failed"):
+            push_hf(pack, "user/myadapter")
+
     def test_progress_fires_with_full_size(
         self, pack: Path, patched_hub: dict[str, list[dict[str, object]]]
     ) -> None:
tests/unit/share/test_peer_runtime.py (added, 388 lines changed)
@@ -0,0 +1,388 @@
+"""Runtime coverage for the peer share transport."""
+
+from __future__ import annotations
+
+import importlib
+import socket
+from io import BytesIO
+from pathlib import Path
+from types import SimpleNamespace
+
+import pytest
+
+from dlm.share.errors import PeerAuthError, RateLimitError
+from dlm.share.peer import (
+    RateLimiter,
+    ServeHandle,
+    ServeOptions,
+    _detect_lan_ip,
+    _log_connection,
+    build_handler,
+    new_session,
+    pull_peer,
+    serve,
+)
+
+peer_mod = importlib.import_module("dlm.share.peer")
+
+
+def _build_test_handler(
+    tmp_path: Path,
+    *,
+    path: str,
+) -> tuple[type[object], object, list[tuple[str, str, str, str]], RateLimiter, Path]:
+    session = new_session("01HZPEER")
+    pack_path = tmp_path / "bundle.dlm.pack"
+    pack_path.write_bytes(b"peer-pack")
+    rate_limiter = RateLimiter(max_concurrency=4, rate_limit_per_min=30)
+    logs: list[tuple[str, str, str, str]] = []
+
+    handler_cls = build_handler(session, pack_path, rate_limiter)
+    handler = object.__new__(handler_cls)
+    handler.path = path
+    handler.client_address = ("127.0.0.1", 7337)
+    handler.send_error = lambda code, message: logs.append(("error", str(code), message, ""))  # type: ignore[attr-defined]
+    handler._stream_pack = lambda path: logs.append(("stream", str(path), "", ""))  # type: ignore[attr-defined]
+    return handler_cls, handler, logs, rate_limiter, pack_path
+
+
+class TestPeerHandler:
+    def test_log_message_is_silent(self, tmp_path: Path) -> None:
+        handler_cls, handler, _logs, _rate_limiter, _pack_path = _build_test_handler(
+            tmp_path, path="/ignored"
+        )
+        assert handler_cls.log_message(handler, "%s", "ignored") is None
+
+    def test_handler_rejects_unknown_dlm_id(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        handler_cls, handler, events, _rate_limiter, _pack_path = _build_test_handler(
+            tmp_path, path="/wrong?token=abc"
+        )
+        request_logs: list[tuple[str, str, str, str]] = []
+        monkeypatch.setattr(
+            peer_mod,
+            "_log_connection",
+            lambda ip, method, path, status: request_logs.append((ip, method, path, status)),
+        )
+
+        handler_cls.do_GET(handler)
+
+        assert events == [("error", "404", "unknown dlm_id", "")]
+        assert request_logs == [
+            ("127.0.0.1", "GET", "/wrong", "start"),
+            ("127.0.0.1", "GET", "/wrong", "404 unknown dlm_id"),
+        ]
+
+    def test_handler_rejects_missing_token(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        handler_cls, handler, events, _rate_limiter, _pack_path = _build_test_handler(
+            tmp_path, path="/01HZPEER"
+        )
+        request_logs: list[tuple[str, str, str, str]] = []
+        monkeypatch.setattr(
+            peer_mod,
+            "_log_connection",
+            lambda ip, method, path, status: request_logs.append((ip, method, path, status)),
+        )
+
+        handler_cls.do_GET(handler)
+
+        assert events == [("error", "401", "missing token", "")]
+        assert request_logs == [
+            ("127.0.0.1", "GET", "/01HZPEER", "start"),
+            ("127.0.0.1", "GET", "/01HZPEER", "401 missing token"),
+        ]
+
+    def test_handler_rejects_bad_token(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        handler_cls, handler, events, _rate_limiter, _pack_path = _build_test_handler(
+            tmp_path, path="/01HZPEER?token=bad"
+        )
+        request_logs: list[tuple[str, str, str, str]] = []
+        monkeypatch.setattr(
+            peer_mod,
+            "_log_connection",
+            lambda ip, method, path, status: request_logs.append((ip, method, path, status)),
+        )
+        monkeypatch.setattr(
+            peer_mod.PeerSession,
+            "verify_token",
+            lambda self, token: (_ for _ in ()).throw(PeerAuthError("bad token")),
+        )
+
+        handler_cls.do_GET(handler)
+
+        assert events == [("error", "403", "token rejected", "")]
+        assert request_logs == [
+            ("127.0.0.1", "GET", "/01HZPEER", "start"),
+            ("127.0.0.1", "GET", "/01HZPEER", "403 bad token"),
+        ]
+
+    def test_handler_rejects_rate_limited(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        handler_cls, handler, events, rate_limiter, _pack_path = _build_test_handler(
+            tmp_path, path="/01HZPEER?token=good"
+        )
+        request_logs: list[tuple[str, str, str, str]] = []
+        monkeypatch.setattr(
+            peer_mod,
+            "_log_connection",
+            lambda ip, method, path, status: request_logs.append((ip, method, path, status)),
+        )
+        monkeypatch.setattr(peer_mod.PeerSession, "verify_token", lambda self, token: None)
+        monkeypatch.setattr(
+            rate_limiter,
+            "check_and_acquire",
+            lambda: (_ for _ in ()).throw(RateLimitError("too many")),
+        )
+
+        handler_cls.do_GET(handler)
+
+        assert events == [("error", "429", "rate limited", "")]
+        assert request_logs == [
+            ("127.0.0.1", "GET", "/01HZPEER", "start"),
+            ("127.0.0.1", "GET", "/01HZPEER", "429 too many"),
+        ]
+
+    def test_handler_streams_pack_and_releases_limiter(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        handler_cls, handler, events, rate_limiter, pack_path = _build_test_handler(
+            tmp_path, path="/01HZPEER?token=good"
+        )
+        request_logs: list[tuple[str, str, str, str]] = []
+        monkeypatch.setattr(
+            peer_mod,
+            "_log_connection",
+            lambda ip, method, path, status: request_logs.append((ip, method, path, status)),
+        )
+        monkeypatch.setattr(peer_mod.PeerSession, "verify_token", lambda self, token: None)
+
+        handler_cls.do_GET(handler)
+
+        assert events == [("stream", str(pack_path), "", "")]
+        assert rate_limiter.active == 0
+        assert request_logs == [
+            ("127.0.0.1", "GET", "/01HZPEER", "start"),
+            ("127.0.0.1", "GET", "/01HZPEER", "200 complete"),
+        ]
+
+    def test_stream_pack_writes_headers_and_body(self, tmp_path: Path) -> None:
+        handler_cls, handler, _events, _rate_limiter, pack_path = _build_test_handler(
+            tmp_path, path="/ignored"
+        )
+        responses: list[tuple[str, str]] = []
+        body = BytesIO()
+        handler.wfile = body
+        handler.send_response = lambda status: responses.append(("status", str(status)))  # type: ignore[attr-defined]
+        handler.send_header = lambda name, value: responses.append((name, value))  # type: ignore[attr-defined]
+        handler.end_headers = lambda: responses.append(("end", ""))  # type: ignore[attr-defined]
+
+        handler_cls._stream_pack(handler, pack_path)
+
+        assert responses == [
+            ("status", "200"),
+            ("Content-Type", "application/octet-stream"),
+            ("Content-Length", str(len(b"peer-pack"))),
+            ("end", ""),
+        ]
+        assert body.getvalue() == b"peer-pack"
+
+
+class TestPeerHelpers:
+    def test_log_connection_emits_metadata_only(self, caplog: pytest.LogCaptureFixture) -> None:
+        caplog.set_level("INFO")
+
+        _log_connection("127.0.0.1", "GET", "/01HZPEER", "200 complete")
+
+        assert "peer: GET /01HZPEER 200 complete from 127.0.0.1" in caplog.text
+
+    def test_pull_peer_reuses_url_sink(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.share.url_sink as url_sink
+
+        out_path = tmp_path / "incoming.dlm.pack"
+        seen: dict[str, object] = {}
+
+        def _fake_pull_url(url: str, actual_out: Path, *, progress: object | None = None) -> int:
+            seen["url"] = url
+            seen["out"] = actual_out
+            seen["progress"] = progress
+            return 42
+
+        monkeypatch.setattr(url_sink, "pull_url", _fake_pull_url)
+
+        result = pull_peer("host:7337/01HZPEER?token=abc", out_path, progress=None)
+
+        assert result == 42
+        assert seen == {
+            "url": "http://host:7337/01HZPEER?token=abc",
+            "out": out_path,
+            "progress": None,
+        }
+
+
+class TestServeHandle:
+    def test_peer_url_uses_bind_host_for_loopback(self) -> None:
+        handle = ServeHandle(
+            session=SimpleNamespace(dlm_id="01HZPEER"),
+            bind_host="127.0.0.1",
+            port=7337,
+            token="abc",
+            _server=SimpleNamespace(),
+        )
+
+        assert handle.peer_url == "peer://127.0.0.1:7337/01HZPEER?token=abc"
+
+    def test_peer_url_detects_lan_ip_for_public_bind(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        handle = ServeHandle(
+            session=SimpleNamespace(dlm_id="01HZPEER"),
+            bind_host="0.0.0.0",
+            port=7337,
+            token="abc",
+            _server=SimpleNamespace(),
+        )
+        monkeypatch.setattr(peer_mod, "_detect_lan_ip", lambda: "192.168.1.9")
+
+        assert handle.peer_url == "peer://192.168.1.9:7337/01HZPEER?token=abc"
+
+    def test_wait_shutdown_stops_server_cleanly(self) -> None:
+        calls: list[str] = []
+        server = SimpleNamespace(
+            serve_forever=lambda: calls.append("serve_forever"),
+            shutdown=lambda: calls.append("shutdown"),
+            server_close=lambda: calls.append("server_close"),
+        )
+        handle = ServeHandle(
+            session=SimpleNamespace(dlm_id="01HZPEER"),
+            bind_host="127.0.0.1",
+            port=7337,
+            token="abc",
+            _server=server,
+        )
+
+        handle.wait_shutdown()
+
+        assert calls == ["serve_forever", "shutdown", "server_close"]
+
+    def test_wait_shutdown_handles_keyboard_interrupt(
+        self, caplog: pytest.LogCaptureFixture
+    ) -> None:
+        calls: list[str] = []
+
+        def _serve_forever() -> None:
+            calls.append("serve_forever")
+            raise KeyboardInterrupt
+
+        server = SimpleNamespace(
+            serve_forever=_serve_forever,
+            shutdown=lambda: calls.append("shutdown"),
+            server_close=lambda: calls.append("server_close"),
+        )
+        handle = ServeHandle(
+            session=SimpleNamespace(dlm_id="01HZPEER"),
+            bind_host="127.0.0.1",
+            port=7337,
+            token="abc",
+            _server=server,
+        )
+        caplog.set_level("INFO")
+
+        handle.wait_shutdown()
+
+        assert calls == ["serve_forever", "shutdown", "server_close"]
+        assert "shutdown requested" in caplog.text
+
+
+class TestServe:
+    def test_serve_builds_handle(self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> None:
+        pack_path = tmp_path / "bundle.dlm.pack"
+        pack_path.write_bytes(b"peer-pack")
+        handler_cls = type("FakeHandler", (), {})
+        server_calls: dict[str, object] = {}
+
+        class FakeSession:
+            dlm_id = "01HZPEER"
+
+            def issue_token(self) -> str:
+                return "issued-token"
+
+        class FakeServer:
+            def __init__(self, address: tuple[str, int], handler: type[object]) -> None:
+                server_calls["address"] = address
+                server_calls["handler"] = handler
+
+        monkeypatch.setattr(
+            peer_mod, "new_session", lambda dlm_id, token_ttl_seconds: FakeSession()
+        )
+        monkeypatch.setattr(
+            peer_mod, "build_handler", lambda session, actual_pack, limiter: handler_cls
+        )
+        monkeypatch.setattr(peer_mod, "resolve_bind", lambda opts: "127.0.0.1")
+        monkeypatch.setattr(peer_mod.http.server, "ThreadingHTTPServer", FakeServer)
+
+        handle = serve("01HZPEER", pack_path, ServeOptions(port=8123))
+
+        assert handle.session.dlm_id == "01HZPEER"
+        assert handle.bind_host == "127.0.0.1"
+        assert handle.port == 8123
+        assert handle.token == "issued-token"
+        assert server_calls == {
+            "address": ("127.0.0.1", 8123),
+            "handler": handler_cls,
+        }
+
+
+class TestDetectLanIp:
+    def test_detect_lan_ip_returns_socket_address(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        class FakeSocket:
+            def settimeout(self, value: float) -> None:
+                assert value == 0.1
+
+            def connect(self, target: tuple[str, int]) -> None:
+                assert target == ("10.254.254.254", 1)
+
+            def getsockname(self) -> tuple[str, int]:
+                return ("192.168.1.7", 9999)
+
+            def __enter__(self) -> FakeSocket:
+                return self
+
+            def __exit__(self, exc_type: object, exc: object, tb: object) -> None:
+                return None
+
+        monkeypatch.setattr(socket, "socket", lambda *args, **kwargs: FakeSocket())
+
+        assert _detect_lan_ip() == "192.168.1.7"
+
+    def test_detect_lan_ip_returns_placeholder_on_error(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        class FakeSocket:
+            def __enter__(self) -> FakeSocket:
+                raise OSError("no route")
+
+            def __exit__(self, exc_type: object, exc: object, tb: object) -> None:
+                return None
+
+        monkeypatch.setattr(socket, "socket", lambda *args, **kwargs: FakeSocket())
+
+        assert _detect_lan_ip() == "<lan-ip>"
tests/unit/share/test_peer_tokens.py (modified)
59 lines changed
@@ -2,6 +2,7 @@
 
 from __future__ import annotations
 
+import base64
 import time
 
 import pytest
@@ -46,6 +47,36 @@ class TestTokenRoundTrip:
         with pytest.raises(PeerAuthError):
             s.verify_token("AAAA")
 
+    def test_trailing_bytes_refused(self) -> None:
+        s = new_session("01HZTEST")
+        nonce = b"x" * 12
+        expiry_iso = "2099-01-01T00:00:00+00:00"
+        signature = s._sign(s.dlm_id, expiry_iso, nonce)
+        payload = (
+            nonce
+            + len(expiry_iso).to_bytes(2, "big")
+            + expiry_iso.encode("ascii")
+            + signature
+            + b"!"
+        )
+        token = base64.urlsafe_b64encode(payload).decode("ascii").rstrip("=")
+
+        with pytest.raises(PeerAuthError, match="trailing bytes"):
+            s.verify_token(token)
+
+    def test_malformed_expiry_refused(self) -> None:
+        s = new_session("01HZTEST")
+        nonce = b"y" * 12
+        expiry_iso = "not-a-date"
+        signature = s._sign(s.dlm_id, expiry_iso, nonce)
+        payload = (
+            nonce + len(expiry_iso).to_bytes(2, "big") + expiry_iso.encode("ascii") + signature
+        )
+        token = base64.urlsafe_b64encode(payload).decode("ascii").rstrip("=")
+
+        with pytest.raises(PeerAuthError, match="malformed expiry"):
+            s.verify_token(token)
+
     def test_expired_token(self) -> None:
         # TTL of 0 — any read after issuance is past-expiry.
         s = new_session("01HZTEST", token_ttl_seconds=0)
@@ -93,6 +124,16 @@ class TestRateLimiter:
         with pytest.raises(RateLimitError, match="req/min"):
             rl.check_and_acquire()
 
+    def test_prunes_requests_older_than_one_minute(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        rl = RateLimiter(max_concurrency=10, rate_limit_per_min=10)
+        rl.requests.extend([10.0, 190.0])
+        monkeypatch.setattr("dlm.share.peer.time.monotonic", lambda: 200.0)
+
+        rl.check_and_acquire()
+
+        assert list(rl.requests) == [190.0, 200.0]
+        assert rl.active == 1
+
     def test_release_idempotent_on_zero(self) -> None:
         # Release more than was acquired — shouldn't go negative.
         rl = RateLimiter()
tests/unit/share/test_provenance.py (modified)
84 lines changed
@@ -11,6 +11,7 @@ import pytest
 from dlm.share.provenance import (
     Provenance,
     ProvenanceChainBroken,
+    ProvenanceError,
     ProvenanceSchemaError,
     ProvenanceVerifyResult,
     UnknownSignerError,
@@ -178,6 +179,22 @@ class TestTrustedKeyRegistry:
         second = record_trusted_key(_SAMPLE_PUBKEY, trusted_keys_dir=tmp_path)
         assert first == second
 
+    def test_record_refuses_to_overwrite_different_key_contents(self, tmp_path: Path) -> None:
+        target = record_trusted_key(_SAMPLE_PUBKEY, trusted_keys_dir=tmp_path, label="alice")
+
+        with pytest.MonkeyPatch.context() as mp:
+            mp.setattr(
+                "dlm.share.provenance.pubkey_fingerprint",
+                lambda _key: target.stem.removeprefix("alice-"),
+            )
+            with pytest.raises(ProvenanceError, match="refusing to overwrite"):
+                record_trusted_key(
+                    _SAMPLE_PUBKEY + "\nDIFFERENT",
+                    trusted_keys_dir=tmp_path,
+                    label="alice",
+                )
+        assert target.is_file()
+
     def test_find_matching_returns_path(self, tmp_path: Path) -> None:
         record_trusted_key(_SAMPLE_PUBKEY, trusted_keys_dir=tmp_path)
         found = find_matching_trusted_key(_SAMPLE_PUBKEY, trusted_keys_dir=tmp_path)
@@ -193,6 +210,26 @@ class TestTrustedKeyRegistry:
         )
         assert found is None
 
+    def test_find_matching_skips_unreadable_pubkey_files(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        good = record_trusted_key(_SAMPLE_PUBKEY, trusted_keys_dir=tmp_path)
+        bad = tmp_path / "000-bad.pub"
+        bad.write_text("broken", encoding="utf-8")
+        path_type = type(bad)
+        real_read_text = path_type.read_text
+
+        def _maybe_broken(self: Path, *args: object, **kwargs: object) -> str:
+            if self == bad:
+                raise OSError("boom")
+            return real_read_text(self, *args, **kwargs)
+
+        monkeypatch.setattr(path_type, "read_text", _maybe_broken)
+
+        assert find_matching_trusted_key(_SAMPLE_PUBKEY, trusted_keys_dir=tmp_path) == good
+
 
 class TestVerifyProvenance:
     def _stub_verifier_accepts(self, chain: bytes, signature: str, pubkey_path: Path) -> None:
@@ -268,3 +305,29 @@
         prov = _sample_provenance(adapter_sha256="a" * 64)
         with pytest.raises(ProvenanceChainBroken, match="mismatch"):
             recompute_chain_consistency(prov, adapter_sha256="b" * 64)
+
+
+class TestDefaultSignatureVerifier:
+    def test_default_signature_verifier_writes_temp_files_and_calls_minisign(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+        tmp_path: Path,
+    ) -> None:
+        from dlm.share.provenance import _default_signature_verifier
+
+        seen: dict[str, object] = {}
+
+        def _fake_minisign_verify(payload: Path, sig: Path, pubkey: Path) -> None:
+            seen["payload"] = payload.read_bytes()
+            seen["signature"] = sig.read_text(encoding="utf-8")
+            seen["pubkey"] = pubkey
+
+        monkeypatch.setattr("dlm.share.signing._minisign_verify", _fake_minisign_verify)
+
+        pubkey = tmp_path / "key.pub"
+        pubkey.write_text("pub", encoding="utf-8")
+        _default_signature_verifier(b"chain-bytes", "signature-block", pubkey)
+
+        assert seen["payload"] == b"chain-bytes"
+        assert seen["signature"] == "signature-block"
+        assert seen["pubkey"] == pubkey
tests/unit/share/test_pull.py (added)
393 lines changed
@@ -0,0 +1,393 @@
+"""Unit coverage for the share pull orchestrator."""
+
+from __future__ import annotations
+
+import importlib
+import sys
+from pathlib import Path
+from types import ModuleType, SimpleNamespace
+from typing import cast
+
+import pytest
+
+from dlm.share.errors import ShareError, SinkError
+from dlm.share.pull import (
+    PullResult,
+    _dispatch_pull,
+    _log_verification,
+    _try_hf_sidecar,
+    _try_peer_sidecar,
+    _try_url_sidecar,
+    pull,
+)
+from dlm.share.signing import VerifyResult, VerifyStatus
+from dlm.share.sinks import SinkKind, SinkSpec
+
+pull_mod = importlib.import_module("dlm.share.pull")
+
+
+class TestPull:
+    def test_pull_dispatches_verifies_and_unpacks(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        source = "https://example.test/adapter.dlm.pack"
+        out_dir = tmp_path / "out"
+        home = tmp_path / "home"
+        progress = object()
+        spec = SinkSpec(kind=SinkKind.URL, target=source)
+        order: list[str] = []
+        verification = VerifyResult(status=VerifyStatus.VERIFIED, key_path=tmp_path / "trusted.pub")
+
+        monkeypatch.setattr(
+            pull_mod, "parse_source", lambda value: spec if value == source else None
+        )
+
+        def _fake_dispatch(
+            actual_spec: SinkSpec,
+            pack_path: Path,
+            sig_path: Path,
+            *,
+            progress: object | None,
+        ) -> int:
+            order.append("dispatch")
+            assert actual_spec == spec
+            assert pack_path.name == "incoming.dlm.pack"
+            assert sig_path.name == "incoming.dlm.pack.minisig"
+            assert progress is not None
+            pack_path.write_bytes(b"pack-bytes")
+            sig_path.write_text("signature", encoding="utf-8")
+            return 123
+
+        def _fake_verify(pack_path: Path, sig_path: Path) -> VerifyResult:
+            order.append("verify")
+            assert pack_path.read_bytes() == b"pack-bytes"
+            assert sig_path.read_text(encoding="utf-8") == "signature"
+            return verification
+
+        def _fake_unpack(
+            pack_path: Path,
+            *,
+            home: Path | None,
+            force: bool,
+            out_dir: Path,
+        ) -> SimpleNamespace:
+            order.append("unpack")
+            assert pack_path.read_bytes() == b"pack-bytes"
+            assert home == tmp_path / "home"
+            assert force is True
+            assert out_dir == tmp_path / "out"
+            return SimpleNamespace(
+                dlm_path=out_dir / "restored.dlm",
+                store_path=home / "store" / "01HZPULL",
+                dlm_id="01HZPULL",
+            )
+
+        monkeypatch.setattr(pull_mod, "_dispatch_pull", _fake_dispatch)
+        monkeypatch.setattr(pull_mod, "verify_signature", _fake_verify)
+        monkeypatch.setattr(pull_mod, "pack_unpack", _fake_unpack)
+
+        result = pull(
+            source,
+            out_dir=out_dir,
+            force=True,
+            home=home,
+            progress=cast("object", progress),
+        )
+
+        assert result == PullResult(
+            dlm_path=out_dir / "restored.dlm",
+            store_path=home / "store" / "01HZPULL",
+            dlm_id="01HZPULL",
+            source=source,
+            bytes_received=123,
+            verification=verification,
+        )
+        assert order == ["dispatch", "verify", "unpack"]
+
+
+class TestDispatchPull:
+    def test_dispatch_pull_hf_downloads_pack_and_sidecar(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.share.hf_sink as hf_sink
+
+        pack_path = tmp_path / "pack.dlm.pack"
+        sig_path = tmp_path / "pack.dlm.pack.minisig"
+        progress = object()
+        seen: dict[str, object] = {}
+
+        def _fake_pull_hf(repo_id: str, out_path: Path, *, progress: object | None = None) -> int:
+            seen["repo_id"] = repo_id
+            seen["progress"] = progress
+            out_path.write_bytes(b"hf-pack")
+            return 7
+
+        monkeypatch.setattr(hf_sink, "pull_hf", _fake_pull_hf)
+        monkeypatch.setattr(
+            pull_mod,
+            "_try_hf_sidecar",
+            lambda repo_id, sidecar_path: seen.update(
+                {"sidecar_repo_id": repo_id, "sidecar_path": sidecar_path}
+            ),
+        )
+
+        bytes_received = _dispatch_pull(
+            SinkSpec(kind=SinkKind.HF, target="org/repo"),
+            pack_path,
+            sig_path,
+            progress=cast("object", progress),
+        )
+
+        assert bytes_received == 7
+        assert pack_path.read_bytes() == b"hf-pack"
+        assert seen == {
+            "repo_id": "org/repo",
+            "progress": progress,
+            "sidecar_repo_id": "org/repo",
+            "sidecar_path": sig_path,
+        }
+
+    def test_dispatch_pull_url_downloads_pack_and_sidecar(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.share.url_sink as url_sink
+
+        pack_path = tmp_path / "pack.dlm.pack"
+        sig_path = tmp_path / "pack.dlm.pack.minisig"
+        seen: dict[str, object] = {}
+
+        def _fake_pull_url(url: str, out_path: Path, *, progress: object | None = None) -> int:
+            seen["url"] = url
+            seen["progress"] = progress
+            out_path.write_bytes(b"url-pack")
+            return 9
+
+        monkeypatch.setattr(url_sink, "pull_url", _fake_pull_url)
+        monkeypatch.setattr(
+            pull_mod,
+            "_try_url_sidecar",
+            lambda url, sidecar_path: seen.update(
+                {"sidecar_url": url, "sidecar_path": sidecar_path}
+            ),
+        )
+
+        bytes_received = _dispatch_pull(
+            SinkSpec(kind=SinkKind.URL, target="https://example.test/pack"),
+            pack_path,
+            sig_path,
+            progress=None,
+        )
+
+        assert bytes_received == 9
+        assert pack_path.read_bytes() == b"url-pack"
+        assert seen == {
+            "url": "https://example.test/pack",
+            "progress": None,
+            "sidecar_url": "https://example.test/pack",
+            "sidecar_path": sig_path,
+        }
+
+    def test_dispatch_pull_peer_downloads_pack_and_sidecar(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.share.peer as peer
+
+        pack_path = tmp_path / "pack.dlm.pack"
+        sig_path = tmp_path / "pack.dlm.pack.minisig"
+        seen: dict[str, object] = {}
+
+        def _fake_pull_peer(target: str, out_path: Path, *, progress: object | None = None) -> int:
+            seen["target"] = target
+            seen["progress"] = progress
+            out_path.write_bytes(b"peer-pack")
+            return 11
+
+        monkeypatch.setattr(peer, "pull_peer", _fake_pull_peer)
+        monkeypatch.setattr(
+            pull_mod,
+            "_try_peer_sidecar",
+            lambda target, sidecar_path: seen.update(
+                {"sidecar_target": target, "sidecar_path": sidecar_path}
+            ),
+        )
+
+        bytes_received = _dispatch_pull(
+            SinkSpec(kind=SinkKind.PEER, target="host:7337/pack?token=abc"),
+            pack_path,
+            sig_path,
+            progress=None,
+        )
+
+        assert bytes_received == 11
+        assert pack_path.read_bytes() == b"peer-pack"
+        assert seen == {
+            "target": "host:7337/pack?token=abc",
+            "progress": None,
+            "sidecar_target": "host:7337/pack?token=abc",
+            "sidecar_path": sig_path,
+        }
+
+    def test_dispatch_pull_local_copies_pack_and_signature(self, tmp_path: Path) -> None:
+        src = tmp_path / "src.dlm.pack"
+        sig = tmp_path / "src.dlm.pack.minisig"
+        src.write_bytes(b"local-pack")
+        sig.write_text("local-signature", encoding="utf-8")
+        pack_path = tmp_path / "incoming.dlm.pack"
+        sig_path = tmp_path / "incoming.dlm.pack.minisig"
+
+        bytes_received = _dispatch_pull(
+            SinkSpec(kind=SinkKind.LOCAL, target=str(src)),
+            pack_path,
+            sig_path,
+            progress=None,
+        )
+
+        assert bytes_received == len(b"local-pack")
+        assert pack_path.read_bytes() == b"local-pack"
+        assert sig_path.read_text(encoding="utf-8") == "local-signature"
+
+    def test_dispatch_pull_local_missing_source_raises(self, tmp_path: Path) -> None:
+        with pytest.raises(SinkError, match="source missing"):
+            _dispatch_pull(
+                SinkSpec(kind=SinkKind.LOCAL, target=str(tmp_path / "missing.dlm.pack")),
+                tmp_path / "incoming.dlm.pack",
+                tmp_path / "incoming.dlm.pack.minisig",
+                progress=None,
+            )
+
+    def test_dispatch_pull_rejects_unsupported_kind(self, tmp_path: Path) -> None:
+        weird = SinkSpec(kind=cast("SinkKind", "weird"), target="x")
+
+        with pytest.raises(ShareError, match="unsupported sink kind"):
+            _dispatch_pull(
+                weird,
+                tmp_path / "incoming.dlm.pack",
+                tmp_path / "incoming.dlm.pack.minisig",
+                progress=None,
+            )
+
+
+class TestPullSidecars:
+    def test_try_hf_sidecar_copies_downloaded_signature(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        fake_hub = ModuleType("huggingface_hub")
+        fake_utils = ModuleType("huggingface_hub.utils")
+        downloaded = tmp_path / "downloaded.minisig"
+        downloaded.write_text("hf-signature", encoding="utf-8")
+
+        class FakeHfHubHTTPError(Exception):
+            pass
+
+        def _fake_download(*, repo_id: str, filename: str, repo_type: str) -> str:
+            assert repo_id == "org/repo"
+            assert filename == "adapter.dlm.pack.minisig"
+            assert repo_type == "model"
+            return str(downloaded)
+
+        fake_hub.hf_hub_download = _fake_download
+        fake_utils.HfHubHTTPError = FakeHfHubHTTPError
+        monkeypatch.setitem(sys.modules, "huggingface_hub", fake_hub)
+        monkeypatch.setitem(sys.modules, "huggingface_hub.utils", fake_utils)
+
+        sig_path = tmp_path / "incoming.minisig"
+        _try_hf_sidecar("org/repo", sig_path)
+
+        assert sig_path.read_text(encoding="utf-8") == "hf-signature"
+
+    def test_try_hf_sidecar_suppresses_hub_errors(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        fake_hub = ModuleType("huggingface_hub")
+        fake_utils = ModuleType("huggingface_hub.utils")
+
+        class FakeHfHubHTTPError(Exception):
+            pass
+
+        def _fake_download(*, repo_id: str, filename: str, repo_type: str) -> str:
+            raise FakeHfHubHTTPError("missing")
+
+        fake_hub.hf_hub_download = _fake_download
+        fake_utils.HfHubHTTPError = FakeHfHubHTTPError
+        monkeypatch.setitem(sys.modules, "huggingface_hub", fake_hub)
+        monkeypatch.setitem(sys.modules, "huggingface_hub.utils", fake_utils)
+
+        sig_path = tmp_path / "incoming.minisig"
+        _try_hf_sidecar("org/repo", sig_path)
+
+        assert not sig_path.exists()
+
+    def test_try_url_sidecar_suppresses_missing_sidecar(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.share.url_sink as url_sink
+
+        def _fake_pull_url(url: str, out_path: Path, *, progress: object | None = None) -> int:
+            raise SinkError(f"missing {url}")
+
+        monkeypatch.setattr(url_sink, "pull_url", _fake_pull_url)
+
+        _try_url_sidecar("https://example.test/pack", tmp_path / "incoming.minisig")
+
+    def test_try_peer_sidecar_suppresses_missing_sidecar(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
350
+    ) -> None:
351
+        import dlm.share.peer as peer
352
+
353
+        def _fake_pull_peer(target: str, out_path: Path, *, progress: object | None = None) -> int:
354
+            raise SinkError(f"missing {target}")
355
+
356
+        monkeypatch.setattr(peer, "pull_peer", _fake_pull_peer)
357
+
358
+        _try_peer_sidecar("host:7337/pack?token=abc", tmp_path / "incoming.minisig")
359
+
360
+
361
+class TestVerificationLogging:
362
+    def test_log_verification_verified(
363
+        self, caplog: pytest.LogCaptureFixture, tmp_path: Path
364
+    ) -> None:
365
+        caplog.set_level("INFO")
366
+
367
+        _log_verification(
368
+            "hf:org/repo",
369
+            VerifyResult(status=VerifyStatus.VERIFIED, key_path=tmp_path / "trusted.pub"),
370
+        )
371
+
372
+        assert "verified signature" in caplog.text
373
+
374
+    def test_log_verification_unverified(self, caplog: pytest.LogCaptureFixture) -> None:
375
+        caplog.set_level("WARNING")
376
+
377
+        _log_verification(
378
+            "https://example.test/pack",
379
+            VerifyResult(status=VerifyStatus.UNVERIFIED, detail="no trusted key matched"),
380
+        )
381
+
382
+        assert "signature present but could not verify" in caplog.text
383
+        assert "no trusted key matched" in caplog.text
384
+
385
+    def test_log_verification_unsigned(self, caplog: pytest.LogCaptureFixture) -> None:
386
+        caplog.set_level("INFO")
387
+
388
+        _log_verification(
389
+            "./local.dlm.pack",
390
+            VerifyResult(status=VerifyStatus.UNSIGNED),
391
+        )
392
+
393
+        assert "no signature" in caplog.text
tests/unit/share/test_push.py (added, 435 lines changed)
@@ -0,0 +1,435 @@
+"""Unit coverage for the share push orchestrator."""
+
+from __future__ import annotations
+
+import importlib
+import io
+import json
+import tarfile
+from pathlib import Path
+from types import SimpleNamespace
+from typing import cast
+
+import pytest
+import zstandard as zstd
+
+from dlm.share.errors import ShareError, SinkError
+from dlm.share.push import (
+    PushResult,
+    _collect_readme_fields,
+    _dispatch_push,
+    _ensure_pack,
+    _noop,
+    _sign_pack,
+    push,
+)
+from dlm.share.sinks import SinkKind, SinkSpec
+
+push_mod = importlib.import_module("dlm.share.push")
+
+
+def _write_pack_with_header(tmp_path: Path, header: dict[str, str]) -> Path:
+    tar_bytes = io.BytesIO()
+    with tarfile.open(fileobj=tar_bytes, mode="w") as tar:
+        payload = json.dumps(header).encode("utf-8")
+        info = tarfile.TarInfo("pack/header.json")
+        info.size = len(payload)
+        tar.addfile(info, io.BytesIO(payload))
+    pack_path = tmp_path / "bundle.dlm.pack"
+    with pack_path.open("wb") as dst, zstd.ZstdCompressor().stream_writer(dst) as writer:
+        writer.write(tar_bytes.getvalue())
+    return pack_path
+
+
+class TestPush:
+    def test_push_rejects_peer_destinations(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        monkeypatch.setattr(
+            push_mod,
+            "parse_source",
+            lambda destination: SinkSpec(kind=SinkKind.PEER, target=destination),
+        )
+
+        with pytest.raises(ShareError, match="push to peer:// is not supported"):
+            push(tmp_path / "doc.dlm", "peer://host:7337/doc?token=abc")
+
+    def test_push_signs_dispatches_and_cleans_up(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        source = tmp_path / "doc.dlm"
+        source.write_text("body", encoding="utf-8")
+        pack_path = tmp_path / "doc.dlm.pack"
+        cleanup_called = False
+        order: list[str] = []
+        progress = object()
+        expected = PushResult(
+            destination="https://example.test/upload",
+            sink_kind=SinkKind.URL,
+            bytes_sent=11,
+        )
+
+        monkeypatch.setattr(
+            push_mod,
+            "parse_source",
+            lambda destination: SinkSpec(kind=SinkKind.URL, target=destination),
+        )
+
+        def _fake_ensure_pack(
+            actual_source: Path,
+            *,
+            include_exports: bool,
+            include_base: bool,
+            include_logs: bool,
+            licensee_acceptance_url: str | None,
+        ) -> tuple[Path, object]:
+            nonlocal cleanup_called
+            assert actual_source == source
+            assert include_exports is True
+            assert include_base is True
+            assert include_logs is True
+            assert licensee_acceptance_url == "https://license.example/accept"
+            pack_path.write_bytes(b"packed-bytes")
+
+            def _cleanup() -> None:
+                nonlocal cleanup_called
+                cleanup_called = True
+
+            return pack_path, _cleanup
+
+        def _fake_sign_pack(actual_pack: Path) -> None:
+            order.append("sign")
+            assert actual_pack == pack_path
+
+        def _fake_dispatch(
+            actual_pack: Path,
+            spec: SinkSpec,
+            *,
+            progress: object | None,
+        ) -> PushResult:
+            order.append("dispatch")
+            assert actual_pack == pack_path
+            assert spec == SinkSpec(
+                kind=SinkKind.URL,
+                target="https://example.test/upload",
+            )
+            assert progress is not None
+            return expected
+
+        monkeypatch.setattr(push_mod, "_ensure_pack", _fake_ensure_pack)
+        monkeypatch.setattr(push_mod, "_sign_pack", _fake_sign_pack)
+        monkeypatch.setattr(push_mod, "_dispatch_push", _fake_dispatch)
+
+        result = push(
+            source,
+            "https://example.test/upload",
+            sign=True,
+            include_exports=True,
+            include_base=True,
+            include_logs=True,
+            licensee_acceptance_url="https://license.example/accept",
+            progress=cast("object", progress),
+        )
+
+        assert result == expected
+        assert order == ["sign", "dispatch"]
+        assert cleanup_called is True
+
+    def test_push_cleans_up_when_dispatch_raises(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        source = tmp_path / "doc.dlm"
+        source.write_text("body", encoding="utf-8")
+        pack_path = tmp_path / "doc.dlm.pack"
+        cleanup_called = False
+
+        monkeypatch.setattr(
+            push_mod,
+            "parse_source",
+            lambda destination: SinkSpec(kind=SinkKind.URL, target=destination),
+        )
+        monkeypatch.setattr(
+            push_mod,
+            "_ensure_pack",
+            lambda *args, **kwargs: (
+                pack_path,
+                lambda: globals().__setitem__("_unused", None),
+            ),
+        )
+
+        def _cleanup() -> None:
+            nonlocal cleanup_called
+            cleanup_called = True
+
+        monkeypatch.setattr(push_mod, "_ensure_pack", lambda *args, **kwargs: (pack_path, _cleanup))
+        monkeypatch.setattr(
+            push_mod,
+            "_dispatch_push",
+            lambda *args, **kwargs: (_ for _ in ()).throw(SinkError("boom")),
+        )
+
+        with pytest.raises(SinkError, match="boom"):
+            push(source, "https://example.test/upload")
+
+        assert cleanup_called is True
+
+
+class TestEnsurePack:
+    def test_ensure_pack_keeps_existing_pack(self, tmp_path: Path) -> None:
+        pack_path = tmp_path / "doc.dlm.pack"
+        pack_path.write_bytes(b"already-packed")
+
+        actual_path, cleanup = _ensure_pack(
+            pack_path,
+            include_exports=False,
+            include_base=False,
+            include_logs=False,
+            licensee_acceptance_url=None,
+        )
+
+        assert actual_path == pack_path
+        assert cleanup is _noop
+
+    def test_ensure_pack_packs_dlm_and_cleans_up(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        source = tmp_path / "doc.dlm"
+        source.write_text("body", encoding="utf-8")
+        seen: dict[str, object] = {}
+
+        def _fake_pack(
+            actual_source: Path,
+            *,
+            out: Path,
+            include_exports: bool,
+            include_base: bool,
+            include_logs: bool,
+            licensee_acceptance_url: str | None,
+        ) -> SimpleNamespace:
+            seen["source"] = actual_source
+            seen["out"] = out
+            seen["include_exports"] = include_exports
+            seen["include_base"] = include_base
+            seen["include_logs"] = include_logs
+            seen["license"] = licensee_acceptance_url
+            out.write_bytes(b"packed")
+            return SimpleNamespace(path=out)
+
+        monkeypatch.setattr(push_mod, "pack", _fake_pack)
+
+        actual_path, cleanup = _ensure_pack(
+            source,
+            include_exports=True,
+            include_base=True,
+            include_logs=True,
+            licensee_acceptance_url="https://license.example/accept",
+        )
+
+        temp_dir = actual_path.parent
+        assert actual_path.read_bytes() == b"packed"
+        assert seen == {
+            "source": source,
+            "out": actual_path,
+            "include_exports": True,
+            "include_base": True,
+            "include_logs": True,
+            "license": "https://license.example/accept",
+        }
+
+        cleanup()
+        assert not temp_dir.exists()
+
+
+class TestSignPack:
+    def test_sign_pack_calls_sign_file(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        import dlm.share.signing as signing
+
+        pack_path = tmp_path / "bundle.dlm.pack"
+        pack_path.write_bytes(b"packed")
+        sig_path = pack_path.with_suffix(pack_path.suffix + ".minisig")
+        seen: dict[str, object] = {}
+
+        def _fake_sign_file(target: Path, *, comment: str | None = None) -> Path:
+            seen["target"] = target
+            seen["comment"] = comment
+            sig_path.write_text("signature", encoding="utf-8")
+            return sig_path
+
+        monkeypatch.setattr(signing, "sign_file", _fake_sign_file)
+
+        _sign_pack(pack_path)
+
+        assert seen == {
+            "target": pack_path,
+            "comment": f"dlm push {pack_path.name}",
+        }
+
+    def test_sign_pack_propagates_missing_minisign(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        import dlm.share.signing as signing
+
+        pack_path = tmp_path / "bundle.dlm.pack"
+        pack_path.write_bytes(b"packed")
+
+        def _fake_sign_file(target: Path, *, comment: str | None = None) -> Path:
+            raise signing.MinisignNotAvailableError("missing")
+
+        monkeypatch.setattr(signing, "sign_file", _fake_sign_file)
+
+        with pytest.raises(signing.MinisignNotAvailableError, match="missing"):
+            _sign_pack(pack_path)
+
+
+class TestDispatchPush:
+    def test_dispatch_push_hf_uploads_pack(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        import dlm.share.hf_sink as hf_sink
+
+        pack_path = tmp_path / "bundle.dlm.pack"
+        pack_path.write_bytes(b"packed")
+        progress = object()
+        seen: dict[str, object] = {}
+
+        def _fake_push_hf(
+            actual_pack: Path,
+            repo_id: str,
+            *,
+            private: bool = False,
+            readme_fields: dict[str, str] | None = None,
+            progress: object | None = None,
+        ) -> SimpleNamespace:
+            seen["pack"] = actual_pack
+            seen["repo_id"] = repo_id
+            seen["private"] = private
+            seen["readme_fields"] = readme_fields
+            seen["progress"] = progress
+            return SimpleNamespace(
+                pack_url="https://huggingface.co/org/repo/blob/main/adapter.dlm.pack"
+            )
+
+        monkeypatch.setattr(hf_sink, "push_hf", _fake_push_hf)
+        monkeypatch.setattr(
+            push_mod,
+            "_collect_readme_fields",
+            lambda path: {"dlm_id": "01HZPUSH", "base_model": "qwen3-4b"},
+        )
+
+        result = _dispatch_push(
+            pack_path,
+            SinkSpec(kind=SinkKind.HF, target="org/repo"),
+            progress=cast("object", progress),
+        )
+
+        assert result == PushResult(
+            destination="hf:org/repo",
+            sink_kind=SinkKind.HF,
+            bytes_sent=len(b"packed"),
+            detail="pack: https://huggingface.co/org/repo/blob/main/adapter.dlm.pack",
+        )
+        assert seen == {
+            "pack": pack_path,
+            "repo_id": "org/repo",
+            "private": False,
+            "readme_fields": {"dlm_id": "01HZPUSH", "base_model": "qwen3-4b"},
+            "progress": progress,
+        }
+
+    def test_dispatch_push_url_uploads_pack(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        import dlm.share.url_sink as url_sink
+
+        pack_path = tmp_path / "bundle.dlm.pack"
+        pack_path.write_bytes(b"packed")
+        seen: dict[str, object] = {}
+
+        def _fake_push_url(actual_pack: Path, url: str, *, progress: object | None = None) -> None:
+            seen["pack"] = actual_pack
+            seen["url"] = url
+            seen["progress"] = progress
+
+        monkeypatch.setattr(url_sink, "push_url", _fake_push_url)
+
+        result = _dispatch_push(
+            pack_path,
+            SinkSpec(kind=SinkKind.URL, target="https://example.test/upload"),
+            progress=None,
+        )
+
+        assert result == PushResult(
+            destination="https://example.test/upload",
+            sink_kind=SinkKind.URL,
+            bytes_sent=len(b"packed"),
+        )
+        assert seen == {
+            "pack": pack_path,
+            "url": "https://example.test/upload",
+            "progress": None,
+        }
+
+    def test_dispatch_push_local_copies_pack(self, tmp_path: Path) -> None:
+        pack_path = tmp_path / "bundle.dlm.pack"
+        pack_path.write_bytes(b"packed")
+        dest = tmp_path / "nested" / "copy.dlm.pack"
+
+        result = _dispatch_push(
+            pack_path,
+            SinkSpec(kind=SinkKind.LOCAL, target=str(dest)),
+            progress=None,
+        )
+
+        assert result == PushResult(
+            destination=str(dest),
+            sink_kind=SinkKind.LOCAL,
+            bytes_sent=len(b"packed"),
+        )
+        assert dest.read_bytes() == b"packed"
+
+    def test_dispatch_push_rejects_unsupported_kind(self, tmp_path: Path) -> None:
+        pack_path = tmp_path / "bundle.dlm.pack"
+        pack_path.write_bytes(b"packed")
+
+        with pytest.raises(SinkError, match="unsupported sink kind"):
+            _dispatch_push(
+                pack_path,
+                SinkSpec(kind=cast("SinkKind", "weird"), target="x"),
+                progress=None,
+            )
+
+
+class TestReadmeFields:
+    def test_collect_readme_fields_from_pack(self, tmp_path: Path) -> None:
+        pack_path = _write_pack_with_header(
+            tmp_path,
+            {
+                "dlm_id": "01HZHEADER",
+                "base_model": "qwen3-8b",
+                "adapter_version": "v0007",
+            },
+        )
+
+        assert _collect_readme_fields(pack_path) == {
+            "dlm_id": "01HZHEADER",
+            "base_model": "qwen3-8b",
+            "adapter_version": "v0007",
+        }
+
+    def test_collect_readme_fields_returns_empty_on_bad_pack(self, tmp_path: Path) -> None:
+        assert _collect_readme_fields(tmp_path / "missing.dlm.pack") == {}
+
+    def test_noop_is_noop(self) -> None:
+        assert _noop() is None
tests/unit/share/test_signing.py (modified, 149 lines changed)
@@ -7,6 +7,7 @@ from unittest.mock import patch
 
 import pytest
 
+from dlm.share.errors import ShareError
 from dlm.share.signing import (
     MinisignNotAvailableError,
     VerifyResult,
@@ -81,3 +82,142 @@ class TestSignRefusesWithoutBinary:
             pytest.raises(MinisignNotAvailableError, match="not installed"),
         ):
             sign_file(target)
+
+
+class TestSignFile:
+    def test_missing_secret_key_is_refused(self, tmp_path: Path) -> None:
+        target = tmp_path / "pack.bin"
+        target.write_bytes(b"payload")
+
+        with (
+            patch("dlm.share.signing.minisign_available", return_value=True),
+            pytest.raises(Exception, match="secret key not found"),
+        ):
+            sign_file(target, secret_key=tmp_path / "missing.key")
+
+    def test_nonzero_exit_is_refused(self, tmp_path: Path) -> None:
+        target = tmp_path / "pack.bin"
+        target.write_bytes(b"payload")
+        secret = tmp_path / "secret.key"
+        secret.write_text("key", encoding="utf-8")
+
+        class Result:
+            returncode = 7
+
+        with (
+            patch("dlm.share.signing.minisign_available", return_value=True),
+            patch("subprocess.run", return_value=Result()),
+            pytest.raises(Exception, match="exit 7"),
+        ):
+            sign_file(target, secret_key=secret, comment="demo")
+
+    def test_missing_signature_sidecar_after_success_is_refused(self, tmp_path: Path) -> None:
+        target = tmp_path / "pack.bin"
+        target.write_bytes(b"payload")
+        secret = tmp_path / "secret.key"
+        secret.write_text("key", encoding="utf-8")
+
+        class Result:
+            returncode = 0
+
+        with (
+            patch("dlm.share.signing.minisign_available", return_value=True),
+            patch("subprocess.run", return_value=Result()),
+            pytest.raises(Exception, match="is missing"),
+        ):
+            sign_file(target, secret_key=secret)
+
+    def test_happy_path_returns_minisig_path(self, tmp_path: Path) -> None:
+        target = tmp_path / "pack.bin"
+        target.write_bytes(b"payload")
+        secret = tmp_path / "secret.key"
+        secret.write_text("key", encoding="utf-8")
+        sig = target.with_suffix(target.suffix + ".minisig")
+
+        class Result:
+            returncode = 0
+
+        def _fake_run(cmd: list[str], check: bool) -> Result:
+            assert "-c" in cmd
+            sig.write_text("signature", encoding="utf-8")
+            return Result()
+
+        with (
+            patch("dlm.share.signing.minisign_available", return_value=True),
+            patch("subprocess.run", side_effect=_fake_run),
+        ):
+            out = sign_file(target, secret_key=secret, comment="demo")
+
+        assert out == sig
+
+
+class TestVerifySignature:
+    def test_verified_when_one_key_matches(self, tmp_path: Path) -> None:
+        target = tmp_path / "pack.bin"
+        target.write_bytes(b"payload")
+        sig = tmp_path / "pack.bin.minisig"
+        sig.write_bytes(b"sig")
+        keys = tmp_path / "trusted-keys"
+        keys.mkdir()
+        miss = keys / "miss.pub"
+        hit = keys / "hit.pub"
+        miss.write_text("miss", encoding="utf-8")
+        hit.write_text("hit", encoding="utf-8")
+        seen: list[Path] = []
+
+        def _fake_verify(_target: Path, _sig: Path, pub_key: Path) -> None:
+            seen.append(pub_key)
+            if pub_key == miss:
+                raise Exception("bad key")
+
+        with (
+            patch("dlm.share.signing.minisign_available", return_value=True),
+            patch("dlm.share.signing._minisign_verify", side_effect=_fake_verify),
+        ):
+            result = verify_signature(target, sig, trusted_keys_dir=keys)
+
+        assert result.status == VerifyStatus.VERIFIED
+        assert result.key_path == hit
+        assert seen == [hit]
+
+    def test_unverified_when_no_keys_match(self, tmp_path: Path) -> None:
+        target = tmp_path / "pack.bin"
+        target.write_bytes(b"payload")
+        sig = tmp_path / "pack.bin.minisig"
+        sig.write_bytes(b"sig")
+        keys = tmp_path / "trusted-keys"
+        keys.mkdir()
+        (keys / "a.pub").write_text("a", encoding="utf-8")
+        (keys / "b.pub").write_text("b", encoding="utf-8")
+
+        with (
+            patch("dlm.share.signing.minisign_available", return_value=True),
+            patch("dlm.share.signing._minisign_verify", side_effect=ShareError("no match")),
+        ):
+            result = verify_signature(target, sig, trusted_keys_dir=keys)
+
+        assert result.status == VerifyStatus.UNVERIFIED
+        assert "no match among 2 trusted keys" in result.detail
+
+
+class TestMinisignVerify:
+    def test_verify_raises_share_error_on_nonzero_exit(self, tmp_path: Path) -> None:
+        from dlm.share.errors import ShareError
+        from dlm.share.signing import _minisign_verify
+
+        target = tmp_path / "pack.bin"
+        target.write_bytes(b"payload")
+        sig = tmp_path / "pack.bin.minisig"
+        sig.write_bytes(b"sig")
+        key = tmp_path / "key.pub"
+        key.write_text("key", encoding="utf-8")
+
+        class Result:
+            returncode = 1
+            stderr = b"bad signature"
+
+        with (
+            patch("subprocess.run", return_value=Result()),
+            pytest.raises(ShareError, match="bad signature"),
+        ):
+            _minisign_verify(target, sig, key)
tests/unit/share/test_url_sink.py (modified, 93 lines changed)
@@ -124,6 +124,32 @@ class TestPushUrl:
         with pytest.raises(SinkError, match="network error"):
             push_url(pack, "https://example.com/upload")
 
+    def test_non_2xx_response_object_is_refused(
+        self, pack: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        def _fake_urlopen(req: urllib.request.Request, data: object, timeout: int) -> _FakeResponse:
+            return _FakeResponse(status=500)
+
+        monkeypatch.setattr(urllib.request, "urlopen", _fake_urlopen)
+
+        with pytest.raises(SinkError, match="HTTP 500"):
+            push_url(pack, "https://example.com/upload")
+
+    def test_io_error_reading_pack_is_translated(
+        self, pack: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        real_open = Path.open
+
+        def _broken_open(self: Path, *args: object, **kwargs: object):
+            if self == pack:
+                raise OSError("disk error")
+            return real_open(self, *args, **kwargs)
+
+        monkeypatch.setattr(Path, "open", _broken_open)
+
+        with pytest.raises(SinkError, match="I/O error reading"):
+            push_url(pack, "https://example.com/upload")
+
     def test_progress_called_at_start_and_end(
         self, pack: Path, monkeypatch: pytest.MonkeyPatch
     ) -> None:
@@ -216,6 +242,61 @@ class TestPullUrl:
         with pytest.raises(SinkError, match="HTTP 404"):
             pull_url("https://example.com/p", tmp_path / "out.pack")
 
+    def test_non_2xx_response_object_is_refused(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        def _fake_urlopen(req: urllib.request.Request, timeout: int) -> _FakeResponse:
+            return _FakeResponse(status=503, body=b"down")
+
+        monkeypatch.setattr(urllib.request, "urlopen", _fake_urlopen)
+        with pytest.raises(SinkError, match="HTTP 503"):
+            pull_url("https://example.com/p", tmp_path / "out.pack")
+
+    def test_network_error_is_translated(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        def _fake_urlopen(req: urllib.request.Request, timeout: int) -> _FakeResponse:
+            raise urllib.error.URLError("reset")
+
+        monkeypatch.setattr(urllib.request, "urlopen", _fake_urlopen)
+        with pytest.raises(SinkError, match="network error"):
+            pull_url("https://example.com/p", tmp_path / "out.pack")
+
+    def test_io_error_writing_is_translated(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        out = tmp_path / "nested" / "out.pack"
+
+        def _fake_urlopen(req: urllib.request.Request, timeout: int) -> _FakeResponse:
+            return _FakeResponse(status=200, body=b"payload", headers={"Content-Length": "7"})
+
+        real_open = Path.open
+
+        def _broken_open(self: Path, *args: object, **kwargs: object):
+            if self == out:
+                raise OSError("read only")
+            return real_open(self, *args, **kwargs)
+
+        monkeypatch.setattr(urllib.request, "urlopen", _fake_urlopen)
+        monkeypatch.setattr(Path, "open", _broken_open)
+
+        with pytest.raises(SinkError, match="I/O error writing"):
+            pull_url("https://example.com/p", out)
+
+    def test_http_scheme_warns(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch, caplog: pytest.LogCaptureFixture
+    ) -> None:
+        out = tmp_path / "fetched.pack"
+
+        def _fake_urlopen(req: urllib.request.Request, timeout: int) -> _FakeResponse:
+            return _FakeResponse(status=200, body=b"x", headers={"Content-Length": "1"})
+
+        monkeypatch.setattr(urllib.request, "urlopen", _fake_urlopen)
+        with caplog.at_level("WARNING", logger="dlm.share.url_sink"):
+            pull_url("http://example.com/p", out)
+
+        assert any("plaintext HTTP" in rec.message for rec in caplog.records)
+
     def test_creates_parent_dir(self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> None:
         out = tmp_path / "nested" / "dir" / "fetched.pack"
 
tests/unit/store/test_blobs.py (modified, 47 lines changed)
@@ -90,6 +90,12 @@ class TestBlobStorePut:
         from_bytes = store.put_bytes(data, ext=".jpg")
         assert from_path == from_bytes
 
+    def test_put_bytes_writes_new_blob(self, store: BlobStore, store_root: Path) -> None:
+        data = b"raw bytes"
+        handle = store.put_bytes(data, ext="PNG")
+        blob_path = store_root / handle.sha[:2] / f"{handle.sha}.png"
+        assert blob_path.read_bytes() == data
+
 
 class TestBlobStoreGet:
     def test_get_returns_stored_path(self, store: BlobStore, tmp_path: Path) -> None:
@@ -145,6 +151,14 @@ class TestBlobStoreGC:
     def test_gc_noop_on_empty_store(self, store: BlobStore) -> None:
         assert list(store.gc({"a" * 64})) == []
 
+    def test_gc_ignores_concurrent_delete(self, store: BlobStore, tmp_path: Path) -> None:
+        src = tmp_path / "x.png"
+        src.write_bytes(b"x")
+        handle = store.put(src)
+        store.get(handle.sha).unlink()
+        store.iter_all = lambda: iter([handle])  # type: ignore[method-assign]
+        assert list(store.gc(set())) == []
+
 
 class TestBlobStoreExtensions:
     @pytest.mark.parametrize(
@@ -208,6 +222,13 @@ class TestBlobStoreIteration:
         iterated = list(store.iter_all())
         assert sorted(h.sha for h in handles) == sorted(h.sha for h in iterated)
 
+    def test_iter_all_ignores_non_blob_entries(self, store: BlobStore, store_root: Path) -> None:
+        bucket = store_root / "aa"
+        bucket.mkdir(parents=True, exist_ok=True)
+        (store_root / "README.txt").write_text("ignore me", encoding="utf-8")
+        (bucket / "nested").mkdir()
+        assert list(store.iter_all()) == []
+
 
 class TestBlobStoreClear:
     def test_clear_removes_tree(self, store: BlobStore, store_root: Path, tmp_path: Path) -> None:
@@ -224,3 +245,8 @@ class TestBlobHandleValue:
         h = BlobHandle(sha="a" * 64, ext=".png", size=10)
         with pytest.raises(AttributeError):
             h.sha = "b" * 64  # type: ignore[misc]
+
+
+class TestBlobStoreMetadata:
+    def test_root_property(self, store: BlobStore, store_root: Path) -> None:
+        assert store.root == store_root
tests/unit/store/test_inspect.py (modified)
66 lines changed
@@ -7,7 +7,7 @@ from pathlib import Path
 
 import pytest
 
-from dlm.store.inspect import inspect_store
+from dlm.store.inspect import _directory_size, _discover_named_adapters, _max_version, inspect_store
 from dlm.store.manifest import Manifest, TrainingRunSummary, save_manifest
 from dlm.store.paths import StorePath, for_dlm
 from tests.fixtures.dlm_factory import make_dlm
@@ -203,3 +203,58 @@ class TestTimelineEdges:
         save_manifest(store.manifest, manifest)
         result = inspect_store(store)
         assert result.last_trained_at == base + timedelta(minutes=5)
+
+
+class TestInspectCoverageEdges:
+    def test_discover_named_adapters_on_missing_adapter_dir(self, tmp_path: Path) -> None:
+        store = for_dlm(VALID_ID, home=tmp_path)
+        assert _discover_named_adapters(store) == []
+
+    def test_directory_size_ignores_stat_errors(self, tmp_path: Path) -> None:
+        path = tmp_path / "root"
+        path.mkdir()
+        good = path / "good.bin"
+        good.write_bytes(b"1234")
+
+        class _BadPath:
+            def is_file(self) -> bool:
+                return True
+
+            def stat(self):  # type: ignore[no-untyped-def]
+                raise OSError("transient")
+
+        monkeypatch = pytest.MonkeyPatch()
+        monkeypatch.setattr(Path, "rglob", lambda self, _pattern: iter([good, _BadPath()]))
+        try:
+            assert _directory_size(path) == 4
+        finally:
+            monkeypatch.undo()
+
+    def test_discover_named_adapters_tolerates_pointer_probe_errors(self, tmp_path: Path) -> None:
+        store = for_dlm(VALID_ID, home=tmp_path)
+        store.ensure_layout()
+        named = store.adapter / "knowledge"
+        (named / "versions" / "v0002").mkdir(parents=True)
+
+        def _boom(_name: str) -> None:
+            raise OSError("pointer unreadable")
+
+        monkeypatch = pytest.MonkeyPatch()
+        monkeypatch.setattr(
+            StorePath, "resolve_current_adapter_for", lambda self, _name: _boom(_name)
+        )
+        try:
+            states = _discover_named_adapters(store)
+        finally:
+            monkeypatch.undo()
+
+        assert states == [type(states[0])(name="knowledge", has_current=False, latest_version=2)]
+
+    def test_max_version_ignores_non_version_entries(self, tmp_path: Path) -> None:
+        versions = tmp_path / "versions"
+        versions.mkdir()
+        (versions / "v0002").mkdir()
+        (versions / "vbad").mkdir()
+        (versions / "notes").mkdir()
+        (versions / "v0009").write_text("not a dir", encoding="utf-8")
+        assert _max_version(versions) == 2
tests/unit/store/test_lock.py (modified)
70 lines changed
@@ -2,6 +2,7 @@
 
 from __future__ import annotations
 
+import errno
 import multiprocessing
 import os
 import time
@@ -16,7 +17,7 @@ from dlm.store.errors import LockHeldError, StaleLockError
 # Module-level worker fns so `spawn` context can pickle them.
 
 
-def _child_attempt(path: str, queue: _MPQueue) -> None:
+def _child_attempt(path: str, queue: _MPQueue[str]) -> None:
     try:
         with lock.exclusive(Path(path), timeout=0.0):
             queue.put("acquired")
@@ -64,7 +65,7 @@ class TestMutualExclusion:
         # Parent acquires and releases in sequence; we hold inside the `with`
         # block long enough for the child to try + fail.
         ctx = multiprocessing.get_context("spawn")
-        outcome: _MPQueue = ctx.Queue()
+        outcome: _MPQueue[str] = ctx.Queue()
 
         with lock.exclusive(lock_path):
             proc = ctx.Process(target=_child_attempt, args=(str(lock_path), outcome))
@@ -121,3 +122,47 @@ class TestStaleLock:
         with pytest.raises(StaleLockError) as exc, lock.exclusive(lock_path, timeout=0.0):
             pass
         assert exc.value.holder_pid is None
+
+    def test_transient_empty_lockfile_retries_when_timeout_allows(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+        tmp_path: Path,
+    ) -> None:
+        lock_path = tmp_path / "test.lock"
+        payload = lock.LockInfo(pid=os.getpid(), hostname="host", acquired_at=time.time())
+        acquire_results = iter([False, True])
+        read_results = iter([None, payload])
+
+        monkeypatch.setattr(lock, "_acquire_once", lambda _path: next(acquire_results))
+        monkeypatch.setattr(lock, "_read_lock", lambda _path: next(read_results))
+        monkeypatch.setattr(lock, "_release", lambda _path: None)
+
+        with lock.exclusive(lock_path, timeout=1.0, poll_interval=0.0) as info:
+            assert info == payload
+
+
+class TestProcessProbeEdges:
+    def test_permission_error_treated_as_alive(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        monkeypatch.setattr(
+            "dlm.store.lock.os.kill",
+            lambda _pid, _sig: (_ for _ in ()).throw(PermissionError()),
+        )
+        assert lock._is_alive(123) is True
+
+    def test_generic_oserror_treated_as_alive(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        def _raise(_pid: int, _sig: int) -> None:
+            err = OSError("io")
+            err.errno = errno.EIO
+            raise err
+
+        monkeypatch.setattr("dlm.store.lock.os.kill", _raise)
+        assert lock._is_alive(123) is True
+
+    def test_esrch_oserror_treated_as_dead(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        def _raise(_pid: int, _sig: int) -> None:
+            err = OSError("missing")
+            err.errno = errno.ESRCH
+            raise err
+
+        monkeypatch.setattr("dlm.store.lock.os.kill", _raise)
+        assert lock._is_alive(123) is False
tests/unit/store/test_paths.py (modified)
78 lines changed
@@ -13,12 +13,17 @@ from dlm.store.layout import (
     LOGS_DIR,
     MANIFEST_FILENAME,
 )
-from dlm.store.paths import StorePath, dlm_home, ensure_home, for_dlm
+from dlm.store.paths import StorePath, _current_os_name, dlm_home, ensure_home, for_dlm
 
 VALID_ID = "01HZ4X7TGZM3J1A2B3C4D5E6F7"
 
 
 class TestDlmHome:
+    def test_current_os_name_passthrough(self) -> None:
+        import os
+
+        assert _current_os_name() == os.name
+
     def test_override_takes_precedence(self, tmp_path: Path) -> None:
         assert dlm_home(override=tmp_path / "custom") == (tmp_path / "custom").resolve()
 
@@ -39,6 +44,14 @@ class TestDlmHome:
         monkeypatch.setattr(Path, "home", lambda: tmp_path / "u")
         assert dlm_home() == tmp_path / "u" / ".dlm"
 
+    def test_default_on_nt_prefers_appdata(
+        self, monkeypatch: pytest.MonkeyPatch, tmp_path: Path
+    ) -> None:
+        monkeypatch.delenv("DLM_HOME", raising=False)
+        monkeypatch.setenv("APPDATA", str(tmp_path / "AppData" / "Roaming"))
+        monkeypatch.setattr("dlm.store.paths._current_os_name", lambda: "nt")
+        assert dlm_home() == (tmp_path / "AppData" / "Roaming").resolve() / "dlm"
+
 
 class TestEnsureHome:
     def test_creates_store_subdir(self, tmp_path: Path) -> None:
@@ -69,6 +82,10 @@ class TestStorePathAccessors:
     def test_lock_path(self, store: StorePath) -> None:
         assert store.lock.name == LOCK_FILENAME
 
+    def test_training_state_paths(self, store: StorePath) -> None:
+        assert store.training_state.name == "training_state.pt"
+        assert store.training_state_sha.name == "training_state.pt.sha256"
+
     def test_adapter_subpaths(self, store: StorePath) -> None:
         assert store.adapter.name == ADAPTER_DIR
         assert store.adapter_versions.parent == store.adapter
@@ -78,6 +95,10 @@ class TestStorePathAccessors:
     def test_logs_dir(self, store: StorePath) -> None:
         assert store.logs.name == LOGS_DIR
 
+    def test_replay_paths(self, store: StorePath) -> None:
+        assert store.replay_corpus.name == "corpus.zst"
+        assert store.replay_index.name == "index.json"
+
     def test_adapter_version_zero_rejected(self, store: StorePath) -> None:
         with pytest.raises(ValueError, match="1-indexed"):
             store.adapter_version(0)
@@ -104,12 +125,26 @@ class TestStorePathAccessors:
         assert store.vl_cache_dir.name == "vl-cache"
         assert store.vl_cache_dir.parent == store.root
 
+    def test_other_lazy_dirs(self, store: StorePath) -> None:
+        assert store.tokenized_cache_dir.name == "tokenized-cache"
+        assert store.audio_cache_dir.name == "audio-cache"
+        assert store.audio_waveform_cache_dir.name == "audio-waveform-cache"
+        assert store.controls_dir.name == "controls"
+        assert store.control_file("demo").name == "demo.safetensors"
+        assert store.control_meta("demo").name == "demo.meta.json"
+
     def test_blob_and_vl_cache_lazy(self, tmp_path: Path) -> None:
         sp = for_dlm(VALID_ID, home=tmp_path)
         sp.ensure_layout()
         assert not sp.blob_dir.exists()
         assert not sp.vl_cache_dir.exists()
 
+    def test_exists_reflects_store_root(self, tmp_path: Path) -> None:
+        sp = for_dlm(VALID_ID, home=tmp_path)
+        assert sp.exists() is False
+        sp.ensure_layout()
+        assert sp.exists() is True
+
 
 class TestEnsureLayout:
     @pytest.fixture
tests/unit/synth/test_apply_pending.py (added)
337 lines changed
@@ -0,0 +1,337 @@
+"""Tests for synth apply/revert and pending-plan helpers."""
+
+from __future__ import annotations
+
+import json
+from pathlib import Path
+
+import pytest
+
+from dlm.doc.parser import ParsedDlm, parse_file, parse_text
+from dlm.doc.sections import Section, SectionType
+from dlm.doc.serializer import serialize
+from dlm.store.paths import for_dlm
+from dlm.synth.apply import (
+    SynthApplySkipReason,
+    apply_plan,
+    build_apply_plan,
+    render_apply_plan,
+    revert_all_auto_synth,
+)
+from dlm.synth.pending import (
+    PendingSynthPlanError,
+    _optional_float,
+    _optional_int,
+    _optional_str,
+    _section_from_payload,
+    clear_pending_plan,
+    load_pending_plan,
+    pending_plan_path,
+    save_pending_plan,
+)
+
+_DLM_ID = "01KPQ9X1000000000000000000"
+_FRONTMATTER = f"---\ndlm_id: {_DLM_ID}\ndlm_version: 15\nbase_model: smollm2-135m\n---\n"
+
+
+def _write_dlm(path: Path, body: str = "") -> None:
+    path.write_text(_FRONTMATTER + body, encoding="utf-8")
+
+
+def _auto_synth_instruction(
+    *,
+    question: str = "What does DGEMM do?",
+    answer: str = "It multiplies dense matrices.",
+    teacher: str = "self",
+    strategy: str = "extraction",
+    source_section_id: str = "0123456789abcdef",
+) -> Section:
+    return Section(
+        type=SectionType.INSTRUCTION,
+        content=f"### Q\n{question}\n### A\n{answer}",
+        start_line=12,
+        adapter="tone",
+        tags={"topic": "blas"},
+        auto_synth=True,
+        synth_teacher=teacher,
+        synth_strategy=strategy,
+        synth_at="2026-04-24T20:00:00Z",
+        source_section_id=source_section_id,
+    )
+
+
+def _authored_instruction() -> Section:
+    return Section(
+        type=SectionType.INSTRUCTION,
+        content="### Q\nWhat is BLAS?\n### A\nA linear algebra interface.",
+    )
+
+
+def _preference() -> Section:
+    return Section(
+        type=SectionType.PREFERENCE,
+        content="### Prompt\nmanual\n### Chosen\nyes\n### Rejected\nno",
+    )
+
+
+def _image() -> Section:
+    return Section(
+        type=SectionType.IMAGE,
+        content="A DGEMM block diagram.",
+        media_path="diagram.png",
+        media_alt="DGEMM diagram",
+        media_blob_sha="ab" * 32,
+    )
+
+
+class TestBuildApplyPlan:
+    def test_accepts_new_auto_synth_instruction(self) -> None:
+        parsed = parse_text(_FRONTMATTER + "prose body\n")
+        plan = build_apply_plan(parsed, [_auto_synth_instruction()])
+
+        assert len(plan.additions) == 1
+        assert plan.skipped == ()
+        assert plan.additions[0].section.auto_synth is True
+
+    def test_dedupes_within_input(self) -> None:
+        parsed = parse_text(_FRONTMATTER + "prose body\n")
+        section = _auto_synth_instruction()
+        plan = build_apply_plan(parsed, [section, section])
+
+        assert len(plan.additions) == 1
+        assert len(plan.skipped) == 1
+        assert plan.skipped[0].reason is SynthApplySkipReason.ALREADY_PRESENT
+
+    def test_skips_non_instruction_and_hand_authored(self) -> None:
+        parsed = parse_text(_FRONTMATTER + "prose body\n")
+        plan = build_apply_plan(parsed, [_preference(), _authored_instruction()])
+
+        assert plan.additions == ()
+        assert [skip.reason for skip in plan.skipped] == [
+            SynthApplySkipReason.NOT_INSTRUCTION,
+            SynthApplySkipReason.NOT_AUTO_SYNTH,
+        ]
+
+    def test_render_plan_mentions_adds_and_skips(self) -> None:
+        parsed = parse_text(_FRONTMATTER + "prose body\n")
+        plan = build_apply_plan(parsed, [_auto_synth_instruction(), _authored_instruction()])
+        rendered = render_apply_plan(plan)
+
+        assert "1 add, 1 skip" in rendered
+        assert "::instruction::" in rendered
+        assert "teacher=self" in rendered
+        assert "strategy=extraction" in rendered
+        assert "source=0123456789abcdef" in rendered
+        assert "not_auto_synth" in rendered
+
+
+class TestApplyPlan:
+    def test_writes_additions_and_preserves_body(self, tmp_path: Path) -> None:
+        target = tmp_path / "doc.dlm"
+        _write_dlm(target, "## hello\n\nkeep me\n")
+
+        parsed = parse_file(target)
+        plan = build_apply_plan(parsed, [_auto_synth_instruction()])
+        summary = apply_plan(parsed, plan, target=target)
+
+        assert summary.added == 1
+        assert summary.skipped == 0
+        assert len(summary.added_section_ids) == 1
+
+        reloaded = parse_file(target)
+        assert any(section.auto_synth for section in reloaded.sections)
+        assert any("keep me" in section.content for section in reloaded.sections)
+
+    def test_existing_document_section_is_skipped(self, tmp_path: Path) -> None:
+        target = tmp_path / "doc.dlm"
+        existing = _auto_synth_instruction()
+        parsed = parse_text(_FRONTMATTER, path=target)
+        plan = build_apply_plan(parsed, [existing])
+        apply_plan(parsed, plan, target=target)
+
+        reloaded = parse_file(target)
+        second_plan = build_apply_plan(reloaded, [existing])
+        assert second_plan.additions == ()
+        assert len(second_plan.skipped) == 1
+        assert second_plan.skipped[0].reason is SynthApplySkipReason.ALREADY_PRESENT
+
+
+class TestRevertAutoSynth:
+    def test_strips_only_auto_synth_instructions(self, tmp_path: Path) -> None:
+        target = tmp_path / "doc.dlm"
+        _write_dlm(target, "## hello\n\nkeep me\n")
+        parsed = parse_file(target)
+        plan = build_apply_plan(parsed, [_auto_synth_instruction()])
+        apply_plan(parsed, plan, target=target)
+
+        reloaded = parse_file(target)
+        updated = ParsedDlm(
+            frontmatter=reloaded.frontmatter,
+            sections=reloaded.sections + (_authored_instruction(), _preference()),
+            source_path=reloaded.source_path,
+        )
+        target.write_text(serialize(updated), encoding="utf-8")
+
+        parsed_with_all = parse_file(target)
+        summary = revert_all_auto_synth(parsed_with_all, target=target)
+
+        assert summary.added == 0
+        assert len(summary.added_section_ids) == 1
+
+        final = parse_file(target)
+        assert not any(section.auto_synth for section in final.sections)
+        assert any(section.type is SectionType.PREFERENCE for section in final.sections)
+        assert any(
+            section.type is SectionType.INSTRUCTION and not section.auto_synth
+            for section in final.sections
+        )
+        assert any("keep me" in section.content for section in final.sections)
+
+    def test_revert_noop_when_no_auto_synth(self, tmp_path: Path) -> None:
+        target = tmp_path / "doc.dlm"
+        _write_dlm(target, "::instruction::\n### Q\nmanual?\n### A\nyes\n")
+        parsed = parse_file(target)
+        summary = revert_all_auto_synth(parsed, target=target)
+
+        assert summary.added == 0
+        assert summary.added_section_ids == ()
+        reloaded = parse_file(target)
+        assert len(reloaded.sections) == len(parsed.sections)
+
+
+class TestPendingPlan:
+    def test_pending_path_round_trip_and_clear(self, tmp_path: Path) -> None:
+        home = tmp_path / "home"
+        source_path = tmp_path / "doc.dlm"
+        _write_dlm(source_path)
+        store = for_dlm(_DLM_ID, home=home)
+
+        path = pending_plan_path(store)
+        assert path == home / "store" / _DLM_ID / "synth" / "pending.json"
+
+        saved = save_pending_plan(
+            store,
+            source_path=source_path,
+            sections=[_auto_synth_instruction(), _image()],
+        )
+        raw = json.loads(path.read_text(encoding="utf-8"))
+        loaded = load_pending_plan(store)
+
+        assert saved.source_path == source_path.resolve()
+        assert saved.created_at.endswith("Z")
+        assert raw["schema_version"] == 1
+        assert raw["source_path"] == str(source_path.resolve())
+        assert loaded == saved
+        assert clear_pending_plan(store) is True
+        assert clear_pending_plan(store) is False
+        assert load_pending_plan(store) is None
+
+    def test_load_returns_none_when_plan_absent(self, tmp_path: Path) -> None:
+        store = for_dlm(_DLM_ID, home=tmp_path / "home")
+
+        assert load_pending_plan(store) is None
+
+    def test_load_rejects_unreadable_plan(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        store = for_dlm(_DLM_ID, home=tmp_path / "home")
+        path = pending_plan_path(store)
+        path.parent.mkdir(parents=True, exist_ok=True)
+        path.write_text("{}", encoding="utf-8")
+
+        def _raise(_self: Path, *, encoding: str) -> str:
+            _ = encoding
+            raise OSError("boom")
+
+        monkeypatch.setattr(Path, "read_text", _raise)
+        with pytest.raises(PendingSynthPlanError, match="could not read staged synth plan"):
+            load_pending_plan(store)
+
+    @pytest.mark.parametrize(
+        ("payload", "message"),
+        [
+            (["not", "an", "object"], "must be a JSON object"),
+            ({"schema_version": 2}, "unsupported staged synth plan schema_version=2"),
+            (
+                {"schema_version": 1, "created_at": "2026-04-24T20:00:00Z", "sections": []},
+                "missing source_path",
+            ),
+            (
+                {"schema_version": 1, "source_path": "/tmp/doc.dlm", "sections": []},
+                "missing created_at",
+            ),
+            (
+                {
+                    "schema_version": 1,
+                    "source_path": "/tmp/doc.dlm",
+                    "created_at": "2026-04-24T20:00:00Z",
+                },
+                "missing sections",
+            ),
+            (
+                {
+                    "schema_version": 1,
+                    "source_path": "/tmp/doc.dlm",
+                    "created_at": "2026-04-24T20:00:00Z",
+                    "sections": [{"content": "oops"}],
+                },
+                "invalid section payload at index 0",
+            ),
+        ],
+    )
+    def test_load_rejects_invalid_payloads(
+        self, tmp_path: Path, payload: object, message: str
+    ) -> None:
+        store = for_dlm(_DLM_ID, home=tmp_path / "home")
+        path = pending_plan_path(store)
+        path.parent.mkdir(parents=True, exist_ok=True)
+        path.write_text(json.dumps(payload), encoding="utf-8")
+
+        with pytest.raises(PendingSynthPlanError, match=message):
+            load_pending_plan(store)
+
+    def test_load_rejects_invalid_json(self, tmp_path: Path) -> None:
+        store = for_dlm(_DLM_ID, home=tmp_path / "home")
+        path = pending_plan_path(store)
+        path.parent.mkdir(parents=True, exist_ok=True)
+        path.write_text("{not json", encoding="utf-8")
+
+        with pytest.raises(PendingSynthPlanError, match="staged synth plan is not valid JSON"):
+            load_pending_plan(store)
+
+
+class TestPendingPayloadHelpers:
+    def test_section_from_payload_validates_tags_and_optional_types(self) -> None:
+        with pytest.raises(TypeError, match="expected object, got list"):
+            _section_from_payload([])
+
+        with pytest.raises(TypeError, match="tags must be an object"):
+            _section_from_payload({"type": "instruction", "content": "x", "tags": []})
+
+        with pytest.raises(TypeError, match="tags keys and values must be strings"):
+            _section_from_payload({"type": "instruction", "content": "x", "tags": {"topic": 1}})
+
+        with pytest.raises(TypeError, match="expected float or null"):
+            _section_from_payload(
+                {"type": "instruction", "content": "x", "judge_score_chosen": True}
+            )
+
+        with pytest.raises(TypeError, match="expected int or null"):
+            _section_from_payload({"type": "instruction", "content": "x", "mined_run_id": True})
+
+    def test_optional_helpers_accept_none_and_reject_wrong_types(self) -> None:
+        assert _optional_str(None) is None
+        assert _optional_str("ok") == "ok"
+        assert _optional_float(None) is None
+        assert _optional_float(1) == 1.0
+        assert _optional_int(None) is None
+        assert _optional_int(7) == 7
+
+        with pytest.raises(TypeError, match="expected string or null"):
+            _optional_str(7)
+
+        with pytest.raises(TypeError, match="expected float or null"):
+            _optional_float(True)
+
+        with pytest.raises(TypeError, match="expected int or null"):
+            _optional_int(True)
tests/unit/synth/test_filter.py (modified)
63 lines changed
@@ -53,6 +53,12 @@ class StubJudge:
 
 
 class TestFilterSynthPlan:
+    def test_negative_threshold_is_rejected(self) -> None:
+        raw = SynthRunPlan(additions=(_planned(),), skipped=())
+
+        with pytest.raises(ValueError, match="threshold must be >= 0.0"):
+            filter_synth_plan(raw, filter_kind="sway", judge=StubJudge({}), threshold=-0.1)
+
     def test_none_filter_keeps_deduped_additions(self) -> None:
         raw = SynthRunPlan(
             additions=(
@@ -95,6 +101,28 @@
         assert filtered.report.dedup_count == 1
         assert filtered.report.accepted_count == 1
 
+    def test_dedup_only_removes_near_duplicates_by_similarity(self) -> None:
+        raw = SynthRunPlan(
+            additions=(
+                _planned(
+                    question="What does DGEMM compute?",
+                    answer="A dense matrix product.",
+                ),
+                _planned(
+                    source_section_id="bbbbbbbbbbbbbbbb",
+                    question="What does DGEMM compute",
+                    answer="A dense matrix product.",
+                ),
+            ),
+            skipped=(),
+        )
+
+        filtered = filter_synth_plan(raw, filter_kind="dedup-only")
+
+        assert len(filtered.additions) == 1
+        assert len(filtered.filtered_skipped) == 1
+        assert filtered.filtered_skipped[0].reason.value == "duplicate_pair"
+
     def test_sway_filter_uses_judge_and_threshold(self) -> None:
         first = _planned(question="Q1", answer="A1")
         second = _planned(source_section_id="bbbbbbbbbbbbbbbb", question="Q2", answer="A2")
@@ -152,3 +180,23 @@ class TestFilterSynthPlan:
         rendered = render_filter_report(filtered)
 
         assert "generated 1, dedup 1, judge passed 1, threshold 1" in rendered
+
+    def test_render_filter_report_for_dedup_only_mentions_filtered_entries(self) -> None:
+        raw = SynthRunPlan(
+            additions=(
+                _planned(question="What is DGEMM?", answer="A matrix multiply routine."),
+                _planned(
+                    source_section_id="bbbbbbbbbbbbbbbb",
+                    question="What is DGEMM?",
+                    answer="A matrix multiply routine!",
+                ),
+            ),
+            skipped=(),
+        )
+
+        filtered = filter_synth_plan(raw, filter_kind="dedup-only")
+        rendered = render_filter_report(filtered)
+
+        assert "generated 2, dedup 1, accepted 1" in rendered
+        assert "=== filtered ===" in rendered
+        assert "duplicate_pair" in rendered
tests/unit/synth/test_prompts.py (modified)
42 lines changed
@@ -2,6 +2,8 @@
 
 from __future__ import annotations
 
+from typing import Literal, cast
+
 import pytest
 
 from dlm.synth import DEFAULT_PROMPT_TEMPLATES, SynthPromptTemplate, get_prompt_template
@@ -13,8 +15,9 @@ def test_shipped_prompt_templates_cover_both_strategies() -> None:
 
 @pytest.mark.parametrize("strategy", ["extraction", "expansion"])
 def test_get_prompt_template_returns_shipped_template(strategy: str) -> None:
-    template = get_prompt_template(strategy)  # type: ignore[arg-type]
-    assert template is DEFAULT_PROMPT_TEMPLATES[strategy]
+    typed_strategy = cast(Literal["extraction", "expansion"], strategy)
+    template = get_prompt_template(typed_strategy)
+    assert template is DEFAULT_PROMPT_TEMPLATES[typed_strategy]
     assert template.output_parser == "json_list"
 
 
@@ -25,9 +28,20 @@ def test_render_user_prompt_injects_required_values() -> None:
    assert "3" in rendered
 
 
-def test_user_template_must_reference_required_variables() -> None:
-    with pytest.raises(ValueError, match="required variable"):
+@pytest.mark.parametrize(
+    ("template", "missing"),
+    [
+        ("Missing one variable: {{ prose }}", "['n']"),
+        ("Missing one variable: {{ n }}", "['prose']"),
+        ("Missing both variables.", "['prose', 'n']"),
+    ],
+)
+def test_user_template_must_reference_required_variables(
+    template: str,
+    missing: str,
+) -> None:
+    with pytest.raises(ValueError, match=missing):
         SynthPromptTemplate(
             system_prompt="hi",
-            user_template="Missing one variable: {{ prose }}",
+            user_template=template,
         )
tests/unit/synth/test_run_dry_run.py (modified)
145 lines changed
@@ -7,7 +7,7 @@ from collections import deque
 import pytest
 
 import dlm.synth.run as run_mod
-from dlm.doc.parser import parse_text
+from dlm.doc.parser import ParsedDlm, parse_text
 from dlm.synth import SynthPromptTemplate, build_synth_plan, render_synth_plan
 
 _FRONTMATTER = """---
@@ -49,11 +49,37 @@ class StubTeacher:
         return self._outputs.popleft()
 
 
-def _parsed(body: str):
+def _parsed(body: str) -> ParsedDlm:
     return parse_text(_FRONTMATTER + body)
 
 
 class TestBuildSynthPlan:
+    @pytest.mark.parametrize(
+        ("field", "value", "message"),
+        [
+            ("per_section", 0, "per_section must be >= 1"),
+            ("max_pairs", 0, "max_pairs must be >= 1"),
+            ("max_new_tokens", 0, "max_new_tokens must be >= 1"),
+        ],
+    )
+    def test_rejects_invalid_limits(
+        self,
+        field: str,
+        value: int,
+        message: str,
+    ) -> None:
+        parsed = _parsed("One prose block.\n")
+
+        if field == "per_section":
+            with pytest.raises(ValueError, match=message):
+                build_synth_plan(parsed, StubTeacher([]), per_section=value)
+        elif field == "max_pairs":
+            with pytest.raises(ValueError, match=message):
+                build_synth_plan(parsed, StubTeacher([]), max_pairs=value)
+        else:
+            with pytest.raises(ValueError, match=message):
+                build_synth_plan(parsed, StubTeacher([]), max_new_tokens=value)
+
     def test_materializes_auto_synth_instruction_sections(self) -> None:
         parsed = _parsed("A short prose section about matrix multiplication.\n")
         teacher = StubTeacher(
@@ -192,6 +218,47 @@ class TestBuildSynthPlan:
 
         assert len(plan.additions) == 1
         assert plan.additions[0].pair.question == "Q1"
+        assert len(teacher.calls) == 1
+
+    def test_max_pairs_returns_before_generating_from_later_sources(self) -> None:
+        parsed = _parsed(
+            "First prose block.\n\n"
+            "::instruction::\n"
+            "### Q\nmanual?\n"
+            "### A\nyes.\n\n"
+            "Second prose block.\n"
+        )
+        teacher = StubTeacher(
+            [
+                '[{"question":"Q1","answer":"A1"}]',
+                '[{"question":"Q2","answer":"A2"}]',
+            ]
+        )
+
+        plan = build_synth_plan(parsed, teacher, per_section=1, strategy="extraction", max_pairs=1)
+
+        assert len(plan.additions) == 1
+        assert len(teacher.calls) == 1
+
+    def test_both_strategy_skips_zero_count_branch(self) -> None:
+        parsed = _parsed("One prose block.\n")
+        teacher = StubTeacher(['[{"question":"Q1","answer":"A1"}]'])
+
+        plan = build_synth_plan(parsed, teacher, per_section=1, strategy="both")
+
+        assert len(plan.additions) == 1
+        assert [add.strategy for add in plan.additions] == ["extraction"]
+        assert len(teacher.calls) == 1
+
+    def test_expansion_strategy_uses_expansion_template(self) -> None:
+        parsed = _parsed("One prose block.\n")
+        teacher = StubTeacher(['[{"question":"Q1","answer":"A1"}]'])
+
+        plan = build_synth_plan(parsed, teacher, per_section=1, strategy="expansion")
+
+        assert len(plan.additions) == 1
+        assert [add.strategy for add in plan.additions] == ["expansion"]
+        assert "expand on the material" in teacher.calls[0][1]
195262
 
196263
 
197264
 def test_render_synth_plan_mentions_adds_and_skips() -> None:
@@ -203,3 +270,52 @@ def test_render_synth_plan_mentions_adds_and_skips() -> None:
 
     assert "synth plan: 0 add, 1 skip" in rendered
     assert "invalid_output" in rendered
+
+
+def test_render_synth_plan_mentions_additions_and_truncates_long_lines() -> None:
+    parsed = _parsed("One prose block.\n")
+    long_question = "Q" * 90
+    long_answer = "A" * 90
+    teacher = StubTeacher([f'[{{"question":"{long_question}","answer":"{long_answer}"}}]'])
+
+    plan = build_synth_plan(parsed, teacher, per_section=1, strategy="extraction")
+    rendered = render_synth_plan(plan)
+
+    assert "synth plan: 1 add, 0 skip" in rendered
+    assert "+ ::instruction::" in rendered
+    assert "q: " in rendered
+    assert "a: " in rendered
+    assert "…" in rendered
+
+
+def test_first_line_returns_short_text_unchanged() -> None:
+    assert run_mod._first_line("short line") == "short line"
+
+
+@pytest.mark.parametrize(
+    ("raw", "message"),
+    [
+        ("[]", "teacher output produced no instruction pairs"),
+        ("{}", "teacher output must be a JSON list"),
+        ("[1]", "teacher output item 0 must be an object"),
+        ('[{"question":1,"answer":"ok"}]', "must contain string question/answer keys"),
+        ('[{"question":" ","answer":"ok"}]', "has an empty question or answer"),
+    ],
+)
+def test_parse_generated_pairs_rejects_bad_json_list_payloads(raw: str, message: str) -> None:
+    with pytest.raises(ValueError, match=message):
+        run_mod._parse_generated_pairs(raw, parser="json_list")
+
+
+@pytest.mark.parametrize(
+    ("raw", "message"),
+    [
+        ("Question: hi\nA: ok", "must use lines like `1. Q: ...`"),
+        ("1. Q: hi", "missing an answer line"),
+        ("1. Q: hi\nB: ok", "answers must use `A:` or `Answer:`"),
+        ("1. Q:   \nA: ok", "contains an empty question or answer"),
+    ],
+)
+def test_parse_generated_pairs_rejects_bad_numbered_list_payloads(raw: str, message: str) -> None:
+    with pytest.raises(ValueError, match=message):
+        run_mod._parse_generated_pairs(raw, parser="numbered_list")
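The `numbered_list` cases above pin down a line format of `1. Q: ...` (or `Question:`) followed by `A: ...` (or `Answer:`). A minimal sketch of that contract, where `parse_numbered` is a hypothetical stand-in for illustration, not the actual `run_mod._parse_generated_pairs` implementation:

```python
import re


def parse_numbered(raw: str) -> list[tuple[str, str]]:
    # Hypothetical stand-in illustrating the contract the parametrized
    # tests assert; not the real run_mod._parse_generated_pairs.
    pairs: list[tuple[str, str]] = []
    question: str | None = None
    for line in (ln.strip() for ln in raw.splitlines() if ln.strip()):
        q = re.match(r"\d+\.\s*(?:Q|Question):\s*(.*)", line)
        if q:
            if question is not None:
                raise ValueError("missing an answer line")
            question = q.group(1).strip()
            continue
        a = re.match(r"(?:A|Answer):\s*(.*)", line)
        if a is None:
            if question is None:
                raise ValueError("questions must use lines like `1. Q: ...`")
            raise ValueError("answers must use `A:` or `Answer:`")
        if question is None:
            raise ValueError("questions must use lines like `1. Q: ...`")
        answer = a.group(1).strip()
        if not question or not answer:
            raise ValueError("contains an empty question or answer")
        pairs.append((question, answer))
        question = None
    if question is not None:
        raise ValueError("missing an answer line")
    return pairs
```

Each rejection test above maps onto one of the `ValueError` branches in this sketch.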
tests/unit/synth/test_teachers.py modified — 1001 lines changed
@@ -2,9 +2,13 @@
 
 from __future__ import annotations
 
+import builtins
+import json
+import sys
+import urllib.error
 from pathlib import Path
-from types import SimpleNamespace
-from typing import Any
+from types import ModuleType, SimpleNamespace
+from typing import Any, Literal
 
 import pytest
 
@@ -15,6 +19,7 @@ from dlm.synth import (
     InvalidTeacherSpecError,
     OpenAiTeacher,
     SelfTeacher,
+    TeacherInvocationError,
     TeacherUnavailableError,
     VllmServerTeacher,
     build_teacher,
@@ -22,6 +27,13 @@ from dlm.synth import (
 )
 
 
+def _module(name: str, **attrs: object) -> ModuleType:
+    module = ModuleType(name)
+    for key, value in attrs.items():
+        setattr(module, key, value)
+    return module
+
+
 class TestTeacherSelectorParsing:
     @pytest.mark.parametrize(
         ("raw", "kind", "target"),
@@ -46,6 +58,19 @@ class TestTeacherSelectorParsing:
         with pytest.raises(InvalidTeacherSpecError, match="unknown teacher selector"):
             parse_teacher_ref("mystery:thing")
 
+    @pytest.mark.parametrize(
+        ("raw", "message"),
+        [
+            ("hf:   ", "hf teacher selector must include a model id"),
+            ("openai:   ", "openai teacher selector must include a model id"),
+            ("anthropic:   ", "anthropic teacher selector must include a model id"),
+            ("vllm-server:   ", "vllm-server teacher selector must include a URL"),
+        ],
+    )
+    def test_missing_selector_targets_are_refused(self, raw: str, message: str) -> None:
+        with pytest.raises(InvalidTeacherSpecError, match=message):
+            parse_teacher_ref(raw)
+
 
 class TestBuildTeacher:
     def test_self_requires_dlm_path(self) -> None:
@@ -103,6 +128,10 @@ class TestSelfTeacher:
 
 
 class TestHfTeacher:
+    def test_blank_hf_id_refused(self) -> None:
+        with pytest.raises(InvalidTeacherSpecError, match="must include a model id"):
+            HfTeacher("   ")
+
     def test_hf_teacher_uses_loader_and_runner(self) -> None:
        seen: dict[str, Any] = {}
 
@@ -134,8 +163,31 @@ class TestHfTeacher:
         )
         assert seen["runner"][3:] == (21, 0.5, 0.8, 11)
 
+    def test_hf_teacher_reuses_loaded_bundle(self) -> None:
+        loads: list[tuple[str, str]] = []
+
+        def _loader(hf_id: str, device: str) -> teachers_mod._LoadedHfTeacher:
+            loads.append((hf_id, device))
+            return teachers_mod._LoadedHfTeacher(model="model", tokenizer="tok", device=device)
+
+        teacher = HfTeacher(
+            "Qwen/Qwen2.5-1.5B-Instruct",
+            loader=_loader,
+            runner=lambda *_args, **_kwargs: "ok",
+        )
+
+        assert teacher.generate("system", "user") == "ok"
+        assert teacher.generate("system", "user") == "ok"
+        assert loads == [
+            ("Qwen/Qwen2.5-1.5B-Instruct", teachers_mod._resolve_generation_device("auto"))
+        ]
+
 
 class TestOpenAiTeacher:
+    def test_blank_model_refused(self) -> None:
+        with pytest.raises(InvalidTeacherSpecError, match="must include a model id"):
+            OpenAiTeacher("   ")
+
     def test_missing_api_key_refused(self, monkeypatch: pytest.MonkeyPatch) -> None:
         monkeypatch.delenv("OPENAI_API_KEY", raising=False)
         teacher = OpenAiTeacher("gpt-4o-mini")
@@ -145,28 +197,59 @@
     def test_openai_teacher_extracts_message_text(self, monkeypatch: pytest.MonkeyPatch) -> None:
         monkeypatch.setenv("OPENAI_API_KEY", "secret")
 
-        captured: dict[str, Any] = {}
+        payloads: list[dict[str, Any]] = []
+        factories: list[str] = []
 
         def _create(**kwargs: Any) -> Any:
-            captured["payload"] = kwargs
+            payloads.append(kwargs)
             return SimpleNamespace(
                 choices=[SimpleNamespace(message=SimpleNamespace(content=" generated "))]
             )
 
+        def _factory(api_key: str) -> Any:
+            factories.append(api_key)
+            return client
+
         client = SimpleNamespace(
             chat=SimpleNamespace(
                 completions=SimpleNamespace(create=_create),
             )
         )
 
-        teacher = OpenAiTeacher("gpt-4o-mini", client_factory=lambda api_key: client)
+        teacher = OpenAiTeacher(
+            "gpt-4o-mini",
+            client_factory=_factory,
+        )
         out = teacher.generate("sys", "usr", max_new_tokens=17, temperature=0.3, top_p=0.7, seed=5)
+        second = teacher.generate("sys", "usr")
         assert out == "generated"
-        assert captured["payload"]["model"] == "gpt-4o-mini"
-        assert captured["payload"]["seed"] == 5
+        assert second == "generated"
+        assert payloads[0]["model"] == "gpt-4o-mini"
+        assert payloads[0]["seed"] == 5
+        assert factories == ["secret"]
+
+    def test_openai_teacher_wraps_request_failures(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        monkeypatch.setenv("OPENAI_API_KEY", "secret")
+
+        def _create(**_kwargs: Any) -> Any:
+            raise RuntimeError("boom")
+
+        client = SimpleNamespace(
+            chat=SimpleNamespace(
+                completions=SimpleNamespace(create=_create),
+            )
+        )
+        teacher = OpenAiTeacher("gpt-4o-mini", client_factory=lambda _api_key: client)
+
+        with pytest.raises(TeacherInvocationError, match="openai:gpt-4o-mini request failed: boom"):
+            teacher.generate("sys", "usr")
 
 
 class TestAnthropicTeacher:
+    def test_blank_model_refused(self) -> None:
+        with pytest.raises(InvalidTeacherSpecError, match="must include a model id"):
+            AnthropicTeacher("   ")
+
     def test_missing_api_key_refused(self, monkeypatch: pytest.MonkeyPatch) -> None:
         monkeypatch.delenv("ANTHROPIC_API_KEY", raising=False)
         teacher = AnthropicTeacher("claude-3-5-haiku-latest")
@@ -176,6 +259,7 @@
     def test_anthropic_teacher_extracts_text_blocks(self, monkeypatch: pytest.MonkeyPatch) -> None:
         monkeypatch.setenv("ANTHROPIC_API_KEY", "secret")
         captured: dict[str, Any] = {}
+        factories: list[str] = []
 
         class _Messages:
             @staticmethod
@@ -183,6 +267,7 @@
                 captured["payload"] = kwargs
                 return SimpleNamespace(
                     content=[
+                        SimpleNamespace(type="image", text="ignored"),
                         SimpleNamespace(type="text", text=" first "),
                         SimpleNamespace(type="text", text=" second "),
                     ]
@@ -191,16 +276,51 @@
         class _Client:
             messages = _Messages()
 
+        def _factory(api_key: str) -> _Client:
+            factories.append(api_key)
+            return _Client()
+
         teacher = AnthropicTeacher(
             "claude-3-5-haiku-latest",
-            client_factory=lambda api_key: _Client(),
+            client_factory=_factory,
         )
         out = teacher.generate("sys", "usr", max_new_tokens=19, temperature=0.2, top_p=0.6)
+        second = teacher.generate("sys", "usr")
         assert out == "first\nsecond"
+        assert second == "first\nsecond"
         assert captured["payload"]["model"] == "claude-3-5-haiku-latest"
+        assert factories == ["secret"]
+
+    def test_anthropic_teacher_wraps_request_failures(
+        self, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        monkeypatch.setenv("ANTHROPIC_API_KEY", "secret")
+
+        class _Messages:
+            @staticmethod
+            def create(**_kwargs: Any) -> Any:
+                raise RuntimeError("boom")
+
+        class _Client:
+            messages = _Messages()
+
+        teacher = AnthropicTeacher(
+            "claude-3-5-haiku-latest",
+            client_factory=lambda _api_key: _Client(),
+        )
+
+        with pytest.raises(
+            TeacherInvocationError,
+            match="anthropic:claude-3-5-haiku-latest request failed: boom",
+        ):
+            teacher.generate("sys", "usr")
 
 
 class TestVllmServerTeacher:
+    def test_blank_url_refused(self) -> None:
+        with pytest.raises(InvalidTeacherSpecError, match="must include a URL"):
+            VllmServerTeacher("   ")
+
     def test_invalid_url_refused(self) -> None:
         with pytest.raises(InvalidTeacherSpecError, match="http\\(s\\)"):
             VllmServerTeacher("localhost:8000")
@@ -208,10 +328,11 @@
     def test_vllm_teacher_queries_model_and_completion(
         self, monkeypatch: pytest.MonkeyPatch
     ) -> None:
-        calls: dict[str, Any] = {}
+        model_calls: list[tuple[str, float]] = []
+        completion_calls: list[tuple[Any, ...]] = []
 
         def _fake_models(base_url: str, *, request_timeout: float) -> str | None:
-            calls["models"] = (base_url, request_timeout)
+            model_calls.append((base_url, request_timeout))
             return "demo-model"
 
         def _fake_completion(
@@ -225,15 +346,17 @@
             seed: int | None,
             request_timeout: float,
         ) -> str:
-            calls["completion"] = (
-                base_url,
-                model_id,
-                messages,
-                max_new_tokens,
-                temperature,
-                top_p,
-                seed,
-                request_timeout,
+            completion_calls.append(
+                (
+                    base_url,
+                    model_id,
+                    messages,
+                    max_new_tokens,
+                    temperature,
+                    top_p,
+                    seed,
+                    request_timeout,
+                )
             )
             return " served "
 
@@ -242,8 +365,734 @@
         teacher = VllmServerTeacher("http://127.0.0.1:8000")
         out = teacher.generate("sys", "usr", max_new_tokens=29, temperature=0.4, top_p=0.75, seed=9)
+        second = teacher.generate("sys", "usr")
 
         assert out == "served"
-        assert calls["models"] == ("http://127.0.0.1:8000", 30.0)
-        assert calls["completion"][1] == "demo-model"
-        assert calls["completion"][3:] == (29, 0.4, 0.75, 9, 30.0)
+        assert second == "served"
+        assert model_calls == [("http://127.0.0.1:8000", 30.0)]
+        assert completion_calls[0][1] == "demo-model"
+        assert completion_calls[0][3:] == (29, 0.4, 0.75, 9, 30.0)
+
+
+
377
+class TestTeacherHelpers:
+    def test_flatten_teacher_prompt_handles_partial_inputs(self) -> None:
+        assert teachers_mod._flatten_teacher_prompt("system", "user").startswith("System:\n")
+        assert teachers_mod._flatten_teacher_prompt("", "user") == "user"
+        assert teachers_mod._flatten_teacher_prompt("system", "") == "system"
+
+    def test_require_non_empty_teacher_output_refuses_blank_text(self) -> None:
+        with pytest.raises(TeacherInvocationError, match="self returned empty output"):
+            teachers_mod._require_non_empty_teacher_output("   ", teacher="self")
+
+    def test_extract_openai_message_text_handles_list_content_and_errors(self) -> None:
+        response = {
+            "choices": [
+                {
+                    "message": {
+                        "content": [
+                            {"text": " first "},
+                            {"text": " second "},
+                        ]
+                    }
+                }
+            ]
+        }
+        assert teachers_mod._extract_openai_message_text(response) == "first\nsecond"
+
+        with pytest.raises(TeacherInvocationError, match="missing choices"):
+            teachers_mod._extract_openai_message_text({})
+
+        with pytest.raises(TeacherInvocationError, match="missing choices\\[0\\]\\.message"):
+            teachers_mod._extract_openai_message_text({"choices": [{}]})
+
+        with pytest.raises(TeacherInvocationError, match="missing non-empty message content"):
+            teachers_mod._extract_openai_message_text({"choices": [{"message": {"content": None}}]})
+
+    def test_extract_anthropic_text_handles_errors(self) -> None:
+        with pytest.raises(TeacherInvocationError, match="missing content blocks"):
+            teachers_mod._extract_anthropic_text({})
+
+        with pytest.raises(TeacherInvocationError, match="missing non-empty text blocks"):
+            teachers_mod._extract_anthropic_text(
+                {"content": [{"type": "image", "text": "ignored"}, {"type": "text", "text": "   "}]}
+            )
+
+    def test_normalize_chat_content_and_obj_get_helpers(self) -> None:
+        assert teachers_mod._normalize_chat_content(" hello ") == "hello"
+        assert (
+            teachers_mod._normalize_chat_content([{"text": " one "}, {"text": " two "}])
+            == "one\ntwo"
+        )
+        assert teachers_mod._normalize_chat_content([{"text": "   "}]) is None
+        assert teachers_mod._normalize_chat_content(123) is None
+        assert teachers_mod._obj_get({"name": "value"}, "name") == "value"
+        assert teachers_mod._obj_get(SimpleNamespace(name="value"), "name") == "value"
+
+    def test_openai_compat_url_helpers_normalize_suffixes(self) -> None:
+        assert (
+            teachers_mod._normalize_openai_compat_base_url(
+                "http://127.0.0.1:8000/v1/chat/completions"
+            )
+            == "http://127.0.0.1:8000"
+        )
+        assert (
+            teachers_mod._normalize_openai_compat_base_url("http://127.0.0.1:8000/chat/completions")
+            == "http://127.0.0.1:8000"
+        )
+        assert teachers_mod._openai_compat_models_url("http://127.0.0.1:8000/v1") == (
+            "http://127.0.0.1:8000/v1/models"
+        )
+        assert teachers_mod._openai_compat_models_url("http://127.0.0.1:8000") == (
+            "http://127.0.0.1:8000/v1/models"
+        )
+        assert teachers_mod._openai_compat_chat_url("http://127.0.0.1:8000/v1") == (
+            "http://127.0.0.1:8000/v1/chat/completions"
+        )
+        assert teachers_mod._openai_compat_chat_url("http://127.0.0.1:8000") == (
+            "http://127.0.0.1:8000/v1/chat/completions"
+        )
+
+
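The URL-helper cases above pin down a small suffix contract: a pasted chat endpoint is stripped back to the server root, and `/v1` is appended exactly once before `/models`. A minimal sketch of that behaviour, where `models_url` is a hypothetical illustration, not the `dlm.synth.teachers` helper itself:

```python
def models_url(base: str) -> str:
    # Hypothetical illustration of the suffix rules the tests assert;
    # not the dlm.synth.teachers implementation.
    base = base.rstrip("/")
    # A pasted chat endpoint is normalized back to the server root.
    for suffix in ("/v1/chat/completions", "/chat/completions"):
        if base.endswith(suffix):
            base = base[: -len(suffix)]
            break
    # The /v1 segment is added exactly once.
    if not base.endswith("/v1"):
        base += "/v1"
    return base + "/models"
```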
456
+class TestTeacherRuntimeHelpers:
+    def test_resolve_generation_device_prefers_requested_or_detected_backends(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        assert teachers_mod._resolve_generation_device("mps") == "mps"
+
+        monkeypatch.delitem(sys.modules, "torch", raising=False)
+        real_import = builtins.__import__
+
+        def _missing_torch(
+            name: str,
+            globals: dict[str, object] | None = None,
+            locals: dict[str, object] | None = None,
+            fromlist: tuple[str, ...] = (),
+            level: int = 0,
+        ) -> object:
+            if name == "torch":
+                raise ImportError("no torch")
+            return real_import(name, globals, locals, fromlist, level)
+
+        monkeypatch.setattr(builtins, "__import__", _missing_torch)
+        assert teachers_mod._resolve_generation_device("auto") == "cpu"
+
+        monkeypatch.setattr(builtins, "__import__", real_import)
+        monkeypatch.setitem(
+            sys.modules,
+            "torch",
+            SimpleNamespace(
+                cuda=SimpleNamespace(is_available=lambda: True),
+                backends=SimpleNamespace(mps=SimpleNamespace(is_available=lambda: False)),
+            ),
+        )
+        assert teachers_mod._resolve_generation_device("auto") == "cuda"
+
+        monkeypatch.setitem(
+            sys.modules,
+            "torch",
+            SimpleNamespace(
+                cuda=SimpleNamespace(is_available=lambda: False),
+                backends=SimpleNamespace(mps=SimpleNamespace(is_available=lambda: True)),
+            ),
+        )
+        assert teachers_mod._resolve_generation_device("auto") == "mps"
+
+        monkeypatch.setitem(
+            sys.modules,
+            "torch",
+            SimpleNamespace(
+                cuda=SimpleNamespace(is_available=lambda: False),
+                backends=SimpleNamespace(mps=SimpleNamespace(is_available=lambda: False)),
+            ),
+        )
+        assert teachers_mod._resolve_generation_device("auto") == "cpu"
+
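The monkeypatched `torch` stand-ins above walk a fallback order: an explicit request wins, then cuda, then mps, then cpu. A minimal sketch of that order, assuming `resolve_device` as a hypothetical stand-in for `teachers_mod._resolve_generation_device`:

```python
def resolve_device(requested: str = "auto") -> str:
    # Hypothetical stand-in for the resolution order the tests exercise;
    # not the dlm.synth.teachers implementation.
    if requested != "auto":
        return requested  # an explicit request is honored as-is
    try:
        import torch  # optional dependency; absence falls back to cpu
    except ImportError:
        return "cpu"
    if torch.cuda.is_available():
        return "cuda"
    if torch.backends.mps.is_available():
        return "mps"
    return "cpu"
```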
511
+    def test_default_openai_client_validates_import_surface(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        def _raise_import(name: str) -> object:
+            raise ImportError(name)
+
+        monkeypatch.setattr("dlm.synth.teachers.importlib.import_module", _raise_import)
+        with pytest.raises(TeacherUnavailableError, match="requires the openai package"):
+            teachers_mod._default_openai_client("secret")
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.importlib.import_module", lambda _name: SimpleNamespace()
+        )
+        with pytest.raises(TeacherUnavailableError, match="does not expose OpenAI client"):
+            teachers_mod._default_openai_client("secret")
+
+        captured: list[str] = []
+
+        class _OpenAI:
+            def __init__(self, *, api_key: str) -> None:
+                captured.append(api_key)
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.importlib.import_module",
+            lambda _name: SimpleNamespace(OpenAI=_OpenAI),
+        )
+        client = teachers_mod._default_openai_client("secret")
+        assert isinstance(client, _OpenAI)
+        assert captured == ["secret"]
+
+    def test_default_anthropic_client_validates_import_surface(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        def _raise_import(name: str) -> object:
+            raise ImportError(name)
+
+        monkeypatch.setattr("dlm.synth.teachers.importlib.import_module", _raise_import)
+        with pytest.raises(TeacherUnavailableError, match="requires the anthropic package"):
+            teachers_mod._default_anthropic_client("secret")
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.importlib.import_module", lambda _name: SimpleNamespace()
+        )
+        with pytest.raises(TeacherUnavailableError, match="does not expose Anthropic client"):
+            teachers_mod._default_anthropic_client("secret")
+
+        captured: list[str] = []
+
+        class _Anthropic:
+            def __init__(self, *, api_key: str) -> None:
+                captured.append(api_key)
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.importlib.import_module",
+            lambda _name: SimpleNamespace(Anthropic=_Anthropic),
+        )
+        client = teachers_mod._default_anthropic_client("secret")
+        assert isinstance(client, _Anthropic)
+        assert captured == ["secret"]
+
573
+    def test_fetch_openai_compat_model_id_handles_success_empty_and_errors(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        class _Response:
+            def __init__(self, payload: object) -> None:
+                self._payload = payload
+
+            def __enter__(self) -> _Response:
+                return self
+
+            def __exit__(self, *_args: object) -> Literal[False]:
+                return False
+
+            def read(self) -> bytes:
+                return json.dumps(self._payload).encode("utf-8")
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.urllib.request.urlopen",
+            lambda *_args, **_kwargs: _Response({"data": [{"id": "demo-model"}]}),
+        )
+        assert (
+            teachers_mod._fetch_openai_compat_model_id(
+                "http://127.0.0.1:8000",
+                request_timeout=1.0,
+            )
+            == "demo-model"
+        )
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.urllib.request.urlopen",
+            lambda *_args, **_kwargs: _Response({"data": []}),
+        )
+        assert (
+            teachers_mod._fetch_openai_compat_model_id(
+                "http://127.0.0.1:8000",
+                request_timeout=1.0,
+            )
+            is None
+        )
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.urllib.request.urlopen",
+            lambda *_args, **_kwargs: _Response({"data": [{"id": "   "}]}),
+        )
+        assert (
+            teachers_mod._fetch_openai_compat_model_id(
+                "http://127.0.0.1:8000",
+                request_timeout=1.0,
+            )
+            is None
+        )
+
+        def _raise_url_error(*_args: object, **_kwargs: object) -> object:
+            raise urllib.error.URLError("boom")
+
+        monkeypatch.setattr("dlm.synth.teachers.urllib.request.urlopen", _raise_url_error)
+        with pytest.raises(TeacherUnavailableError, match="could not query models"):
+            teachers_mod._fetch_openai_compat_model_id(
+                "http://127.0.0.1:8000",
+                request_timeout=1.0,
+            )
+
636
+    def test_request_openai_compat_completion_handles_success_and_failures(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        class _Response:
+            def __init__(self, payload: object) -> None:
+                self._payload = payload
+
+            def __enter__(self) -> _Response:
+                return self
+
+            def __exit__(self, *_args: object) -> Literal[False]:
+                return False
+
+            def read(self) -> bytes:
+                return json.dumps(self._payload).encode("utf-8")
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.urllib.request.urlopen",
+            lambda *_args, **_kwargs: _Response(
+                {"choices": [{"message": {"content": [{"text": " served "}]}}]}
+            ),
+        )
+        assert (
+            teachers_mod._request_openai_compat_completion(
+                "http://127.0.0.1:8000",
+                model_id="demo-model",
+                messages=[{"role": "user", "content": "hello"}],
+                max_new_tokens=11,
+                temperature=0.2,
+                top_p=0.8,
+                seed=5,
+                request_timeout=1.0,
+            )
+            == "served"
+        )
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.urllib.request.urlopen",
+            lambda *_args, **_kwargs: _Response({"choices": []}),
+        )
+        with pytest.raises(TeacherInvocationError, match="response missing choices"):
+            teachers_mod._request_openai_compat_completion(
+                "http://127.0.0.1:8000",
+                model_id=None,
+                messages=[{"role": "user", "content": "hello"}],
+                max_new_tokens=11,
+                temperature=0.2,
+                top_p=None,
+                seed=None,
+                request_timeout=1.0,
+            )
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.urllib.request.urlopen",
+            lambda *_args, **_kwargs: _Response({"choices": [{}]}),
+        )
+        with pytest.raises(
+            TeacherInvocationError, match="response missing choices\\[0\\]\\.message"
+        ):
+            teachers_mod._request_openai_compat_completion(
+                "http://127.0.0.1:8000",
+                model_id=None,
+                messages=[{"role": "user", "content": "hello"}],
+                max_new_tokens=11,
+                temperature=0.2,
+                top_p=None,
+                seed=None,
+                request_timeout=1.0,
+            )
+
+        monkeypatch.setattr(
+            "dlm.synth.teachers.urllib.request.urlopen",
+            lambda *_args, **_kwargs: _Response(
+                {"choices": [{"message": {"content": [{"text": "   "}]}}]}
+            ),
+        )
+        with pytest.raises(TeacherInvocationError, match="missing non-empty message content"):
+            teachers_mod._request_openai_compat_completion(
+                "http://127.0.0.1:8000",
+                model_id=None,
+                messages=[{"role": "user", "content": "hello"}],
+                max_new_tokens=11,
+                temperature=0.2,
+                top_p=None,
+                seed=None,
+                request_timeout=1.0,
+            )
+
+        def _raise_url_error(*_args: object, **_kwargs: object) -> object:
+            raise urllib.error.URLError("boom")
+
+        monkeypatch.setattr("dlm.synth.teachers.urllib.request.urlopen", _raise_url_error)
+        with pytest.raises(TeacherInvocationError, match="request to http://127.0.0.1:8000 failed"):
+            teachers_mod._request_openai_compat_completion(
+                "http://127.0.0.1:8000",
+                model_id=None,
+                messages=[{"role": "user", "content": "hello"}],
+                max_new_tokens=11,
+                temperature=0.2,
+                top_p=None,
+                seed=None,
+                request_timeout=1.0,
+            )
+
+
742
+def _install_self_loader_modules(
+    monkeypatch: pytest.MonkeyPatch,
+    *,
+    manifest_exists: bool = True,
+    license_acceptance: object | None = "accepted",
+    load_manifest_error: str | None = None,
+    resolve_error: str | None = None,
+    select_error: str | None = None,
+    backend_load_error: str | None = None,
+) -> dict[str, object]:
+    calls: dict[str, object] = {}
+    spec = object()
+    caps = object()
+    parsed = SimpleNamespace(
+        frontmatter=SimpleNamespace(
+            dlm_id="01KPQ9X1000000000000000000",
+            base_model="smollm2-135m",
+        )
+    )
+    manifest = SimpleNamespace(exists=lambda: manifest_exists)
+    store = SimpleNamespace(manifest=manifest)
+
+    class GatedModelError(Exception):
+        pass
+
+    class AdapterNotFoundError(Exception):
+        pass
+
+    class UnsupportedBackendError(Exception):
+        pass
+
+    class ManifestCorruptError(Exception):
+        pass
+
+    class _Backend:
+        def load(self, spec_arg: object, store_arg: object) -> None:
+            calls["load"] = (spec_arg, store_arg)
+            if backend_load_error is not None:
+                raise AdapterNotFoundError(backend_load_error)
+
+    backend = _Backend()
+
+    def _resolve(base_model: str, *, accept_license: bool) -> object:
+        calls["resolve"] = (base_model, accept_license)
+        if resolve_error is not None:
+            raise GatedModelError(resolve_error)
+        return spec
+
+    def _load_manifest(_path: object) -> object:
+        calls["load_manifest"] = True
+        if load_manifest_error is not None:
+            raise ManifestCorruptError(load_manifest_error)
+        return SimpleNamespace(license_acceptance=license_acceptance)
+
+    def _select_backend(backend_name: str, capabilities: object) -> str:
+        calls["select_backend"] = (backend_name, capabilities)
798
+        if select_error is not None:
799
+            raise UnsupportedBackendError(select_error)
800
+        return "stub-backend"
801
+
802
+    def _build_backend(name: str, capabilities: object) -> object:
803
+        calls["build_backend"] = (name, capabilities)
804
+        return backend
805
+
806
+    monkeypatch.setitem(
807
+        sys.modules, "dlm.base_models", _module("dlm.base_models", resolve=_resolve)
808
+    )
809
+    monkeypatch.setitem(
810
+        sys.modules,
811
+        "dlm.base_models.errors",
812
+        _module("dlm.base_models.errors", GatedModelError=GatedModelError),
813
+    )
814
+    monkeypatch.setitem(
815
+        sys.modules,
816
+        "dlm.doc.parser",
817
+        _module("dlm.doc.parser", parse_file=lambda _path: parsed),
818
+    )
819
+    monkeypatch.setitem(
820
+        sys.modules,
821
+        "dlm.hardware",
822
+        _module("dlm.hardware", doctor=lambda: SimpleNamespace(capabilities=caps)),
823
+    )
824
+    monkeypatch.setitem(
825
+        sys.modules,
826
+        "dlm.inference",
827
+        _module("dlm.inference", AdapterNotFoundError=AdapterNotFoundError),
828
+    )
829
+    monkeypatch.setitem(
830
+        sys.modules,
831
+        "dlm.inference.backends",
832
+        _module(
833
+            "dlm.inference.backends", build_backend=_build_backend, select_backend=_select_backend
834
+        ),
835
+    )
836
+    monkeypatch.setitem(
837
+        sys.modules,
838
+        "dlm.inference.backends.select",
839
+        _module("dlm.inference.backends.select", UnsupportedBackendError=UnsupportedBackendError),
840
+    )
841
+    monkeypatch.setitem(
842
+        sys.modules,
843
+        "dlm.store.errors",
844
+        _module("dlm.store.errors", ManifestCorruptError=ManifestCorruptError),
845
+    )
846
+    monkeypatch.setitem(
847
+        sys.modules,
848
+        "dlm.store.manifest",
849
+        _module("dlm.store.manifest", load_manifest=_load_manifest),
850
+    )
851
+    monkeypatch.setitem(
852
+        sys.modules,
853
+        "dlm.store.paths",
854
+        _module("dlm.store.paths", for_dlm=lambda _dlm_id: store),
855
+    )
856
+
857
+    calls["caps"] = caps
858
+    calls["store"] = store
859
+    calls["spec"] = spec
860
+    calls["errors"] = {
861
+        "gated": GatedModelError,
862
+        "adapter": AdapterNotFoundError,
863
+        "unsupported": UnsupportedBackendError,
864
+        "manifest": ManifestCorruptError,
865
+    }
866
+    return calls
867
+
868
+
869
+class TestTeacherLoaderHelpers:
870
+    def test_load_self_backend_wraps_import_error(self, monkeypatch: pytest.MonkeyPatch) -> None:
871
+        real_import = builtins.__import__
872
+
873
+        def _raise_on_base_models(
874
+            name: str,
875
+            globals: dict[str, object] | None = None,
876
+            locals: dict[str, object] | None = None,
877
+            fromlist: tuple[str, ...] = (),
878
+            level: int = 0,
879
+        ) -> object:
880
+            if name.startswith("dlm.base_models"):
881
+                raise ImportError("boom")
882
+            return real_import(name, globals, locals, fromlist, level)
883
+
884
+        monkeypatch.setattr(builtins, "__import__", _raise_on_base_models)
885
+        with pytest.raises(TeacherUnavailableError, match="requires the local inference stack"):
886
+            teachers_mod._load_self_backend(Path("/tmp/doc.dlm"), "auto")
887
+
888
+    def test_load_self_backend_uses_recorded_license_acceptance(
889
+        self,
890
+        monkeypatch: pytest.MonkeyPatch,
891
+    ) -> None:
892
+        calls = _install_self_loader_modules(monkeypatch, license_acceptance="accepted")
893
+
894
+        backend = teachers_mod._load_self_backend(Path("/tmp/doc.dlm"), "auto")
895
+
896
+        assert backend is not None
897
+        assert calls["resolve"] == ("smollm2-135m", True)
898
+        assert calls["select_backend"] == ("auto", calls["caps"])
899
+        assert calls["build_backend"] == ("stub-backend", calls["caps"])
900
+        assert calls["load"] == (calls["spec"], calls["store"])
901
+
902
+    def test_load_self_backend_tolerates_manifest_read_failure(
903
+        self,
904
+        monkeypatch: pytest.MonkeyPatch,
905
+    ) -> None:
906
+        calls = _install_self_loader_modules(
907
+            monkeypatch,
908
+            load_manifest_error="bad manifest",
909
+        )
910
+
911
+        teachers_mod._load_self_backend(Path("/tmp/doc.dlm"), "auto")
912
+
913
+        assert calls["resolve"] == ("smollm2-135m", False)
914
+
915
+    def test_load_self_backend_wraps_gated_backend_and_adapter_failures(
916
+        self,
917
+        monkeypatch: pytest.MonkeyPatch,
918
+    ) -> None:
919
+        _install_self_loader_modules(monkeypatch, resolve_error="gated")
920
+        with pytest.raises(TeacherUnavailableError, match="cannot resolve gated base"):
921
+            teachers_mod._load_self_backend(Path("/tmp/doc.dlm"), "auto")
922
+
923
+        _install_self_loader_modules(monkeypatch, select_error="unsupported backend")
924
+        with pytest.raises(TeacherUnavailableError, match="unsupported backend"):
925
+            teachers_mod._load_self_backend(Path("/tmp/doc.dlm"), "auto")
926
+
927
+        _install_self_loader_modules(monkeypatch, backend_load_error="missing adapter")
928
+        with pytest.raises(TeacherUnavailableError, match="requires a trained adapter"):
929
+            teachers_mod._load_self_backend(Path("/tmp/doc.dlm"), "auto")
930
+
931
+    def test_default_hf_loader_wraps_import_error(self, monkeypatch: pytest.MonkeyPatch) -> None:
932
+        real_import = builtins.__import__
933
+
934
+        def _raise_transformers(
935
+            name: str,
936
+            globals: dict[str, object] | None = None,
937
+            locals: dict[str, object] | None = None,
938
+            fromlist: tuple[str, ...] = (),
939
+            level: int = 0,
940
+        ) -> object:
941
+            if name == "transformers":
942
+                raise ImportError("boom")
943
+            return real_import(name, globals, locals, fromlist, level)
944
+
945
+        monkeypatch.setattr(builtins, "__import__", _raise_transformers)
946
+        with pytest.raises(TeacherUnavailableError, match="requires transformers"):
947
+            teachers_mod._default_hf_loader("hf/model", "cpu")
948
+
949
+    def test_default_hf_loader_moves_model_and_sets_eval(
950
+        self,
951
+        monkeypatch: pytest.MonkeyPatch,
952
+    ) -> None:
953
+        seen: dict[str, object] = {}
954
+
955
+        class _Model:
956
+            def to(self, device: str) -> _Model:
957
+                seen["device"] = device
958
+                return self
959
+
960
+            def eval(self) -> None:
961
+                seen["eval"] = True
962
+
963
+        model = _Model()
964
+
965
+        class AutoModelForCausalLM:
966
+            @staticmethod
967
+            def from_pretrained(hf_id: str) -> _Model:
968
+                seen["model_id"] = hf_id
969
+                return model
970
+
971
+        class AutoTokenizer:
972
+            @staticmethod
973
+            def from_pretrained(hf_id: str) -> str:
974
+                seen["tokenizer_id"] = hf_id
975
+                return "tok"
976
+
977
+        monkeypatch.setitem(
978
+            sys.modules,
979
+            "transformers",
980
+            _module(
981
+                "transformers",
982
+                AutoModelForCausalLM=AutoModelForCausalLM,
983
+                AutoTokenizer=AutoTokenizer,
984
+            ),
985
+        )
986
+
987
+        loaded = teachers_mod._default_hf_loader("hf/model", "cuda")
988
+
989
+        assert loaded.model is model
990
+        assert loaded.tokenizer == "tok"
991
+        assert loaded.device == "cuda"
992
+        assert seen == {
993
+            "model_id": "hf/model",
994
+            "tokenizer_id": "hf/model",
995
+            "device": "cuda",
996
+            "eval": True,
997
+        }
998
+
999
+    def test_default_hf_generate_seeds_torch_and_calls_runner(
1000
+        self,
1001
+        monkeypatch: pytest.MonkeyPatch,
1002
+    ) -> None:
1003
+        manual: list[int] = []
1004
+        manual_all: list[int] = []
1005
+        calls: dict[str, object] = {}
1006
+
1007
+        def _generate(
1008
+            model: object,
1009
+            tokenizer: object,
1010
+            prompt: str,
1011
+            *,
1012
+            max_new_tokens: int,
1013
+            temperature: float,
1014
+            top_p: float | None,
1015
+        ) -> str:
1016
+            calls["args"] = (model, tokenizer, prompt, max_new_tokens, temperature, top_p)
1017
+            return "ok"
1018
+
1019
+        monkeypatch.setitem(
1020
+            sys.modules,
1021
+            "dlm.inference.generate",
1022
+            _module("dlm.inference.generate", generate=_generate),
1023
+        )
1024
+        monkeypatch.setitem(
1025
+            sys.modules,
1026
+            "torch",
1027
+            SimpleNamespace(
1028
+                manual_seed=lambda seed: manual.append(seed),
1029
+                cuda=SimpleNamespace(
1030
+                    is_available=lambda: True,
1031
+                    manual_seed_all=lambda seed: manual_all.append(seed),
1032
+                ),
1033
+            ),
1034
+        )
1035
+
1036
+        out = teachers_mod._default_hf_generate(
1037
+            "model",
1038
+            "tokenizer",
1039
+            "prompt",
1040
+            max_new_tokens=17,
1041
+            temperature=0.3,
1042
+            top_p=0.8,
1043
+            seed=7,
1044
+        )
1045
+
1046
+        assert out == "ok"
1047
+        assert manual == [7]
1048
+        assert manual_all == [7]
1049
+        assert calls["args"] == ("model", "tokenizer", "prompt", 17, 0.3, 0.8)
1050
+
1051
+    def test_default_hf_generate_tolerates_missing_torch_when_seeding(
1052
+        self,
1053
+        monkeypatch: pytest.MonkeyPatch,
1054
+    ) -> None:
1055
+        real_import = builtins.__import__
1056
+
1057
+        def _generate(
1058
+            model: object,
1059
+            tokenizer: object,
1060
+            prompt: str,
1061
+            *,
1062
+            max_new_tokens: int,
1063
+            temperature: float,
1064
+            top_p: float | None,
1065
+        ) -> str:
1066
+            _ = model, tokenizer, prompt, max_new_tokens, temperature, top_p
1067
+            return "ok"
1068
+
1069
+        def _raise_torch(
1070
+            name: str,
1071
+            globals: dict[str, object] | None = None,
1072
+            locals: dict[str, object] | None = None,
1073
+            fromlist: tuple[str, ...] = (),
1074
+            level: int = 0,
1075
+        ) -> object:
1076
+            if name == "torch":
1077
+                raise ImportError("no torch")
1078
+            return real_import(name, globals, locals, fromlist, level)
1079
+
1080
+        monkeypatch.setitem(
1081
+            sys.modules,
1082
+            "dlm.inference.generate",
1083
+            _module("dlm.inference.generate", generate=_generate),
1084
+        )
1085
+        monkeypatch.delitem(sys.modules, "torch", raising=False)
1086
+        monkeypatch.setattr(builtins, "__import__", _raise_torch)
1087
+
1088
+        out = teachers_mod._default_hf_generate(
1089
+            "model",
1090
+            "tokenizer",
1091
+            "prompt",
1092
+            max_new_tokens=17,
1093
+            temperature=0.3,
1094
+            top_p=0.8,
1095
+            seed=7,
1096
+        )
1097
+
1098
+        assert out == "ok"
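The tests above lean on a `_module` helper (defined earlier in this file, outside this hunk) to stub entire import paths through `sys.modules`. A minimal sketch of the pattern, assuming one plausible helper body; the `fake_pkg_dlm_sketch` name is invented for illustration and nothing here is the dlm source:

```python
import sys
import types


def _module(name: str, **attrs: object) -> types.ModuleType:
    # Assumed shape of the helper: a bare module exposing only what a test needs.
    mod = types.ModuleType(name)
    for key, value in attrs.items():
        setattr(mod, key, value)
    return mod


# Registering the stub in sys.modules makes a plain `import` resolve to it,
# which is what monkeypatch.setitem(sys.modules, ...) does above (with
# automatic restoration when the test ends).
stub = _module("fake_pkg_dlm_sketch", answer=lambda: 42)
sys.modules["fake_pkg_dlm_sketch"] = stub

import fake_pkg_dlm_sketch  # served from the sys.modules cache, not from disk
```

Because the interpreter consults `sys.modules` before the import machinery, no file needs to exist for the stubbed names, so heavy dependencies like `torch` or `transformers` never load.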
tests/unit/templates/test_init.py (modified, 40 lines changed)
@@ -3,9 +3,12 @@
 from __future__ import annotations
 
 from pathlib import Path
+from types import SimpleNamespace
+from unittest.mock import patch
 
 import pytest
 
+from dlm.base_models import GatedModelError
 from dlm.doc.parser import parse_file
 from dlm.templates import TemplateApplyError, TemplateNotFoundError, apply_template
 
@@ -58,3 +61,28 @@ def test_apply_template_unknown_name_raises(tmp_path: Path) -> None:
         apply_template("nonexistent-template", target)
     # And doesn't leave a half-written file behind.
     assert not target.exists()
+
+
+def test_apply_template_wraps_gated_model_error(tmp_path: Path) -> None:
+    target = tmp_path / "out.dlm"
+
+    with (
+        patch(
+            "dlm.base_models.resolve",
+            side_effect=GatedModelError("llama-3.2-1b", "https://example.test/license"),
+        ),
+        pytest.raises(TemplateApplyError, match="pass accept_license=True"),
+    ):
+        apply_template("coding-tutor", target)
+
+
+def test_apply_template_refuses_gated_base_without_acceptance_flag(tmp_path: Path) -> None:
+    target = tmp_path / "out.dlm"
+    spec = SimpleNamespace(key="llama-3.2-1b")
+
+    with (
+        patch("dlm.base_models.resolve", return_value=spec),
+        patch("dlm.base_models.license.is_gated", return_value=True),
+        pytest.raises(TemplateApplyError, match="uses gated base"),
+    ):
+        apply_template("coding-tutor", target)
tests/unit/templates/test_registry.py (modified, 22 lines changed)
@@ -73,6 +73,22 @@ def test_registry_drops_template_with_malformed_meta(tmp_path: Path) -> None:
     assert list_bundled(gallery_dir=tmp_path) == []
 
 
+def test_load_template_rejects_non_mapping_meta(tmp_path: Path) -> None:
+    (tmp_path / "broken.dlm").write_text("---\ndlm_id: 01AAAA\nbase_model: foo\n---\n# body\n")
+    (tmp_path / "broken.meta.yaml").write_text("- not\n- a\n- mapping\n")
+
+    with pytest.raises(TemplateMetaError, match="meta must be a YAML mapping"):
+        load_template("broken", gallery_dir=tmp_path)
+
+
+def test_load_template_rejects_schema_invalid_meta(tmp_path: Path) -> None:
+    (tmp_path / "broken.dlm").write_text("---\ndlm_id: 01AAAA\nbase_model: foo\n---\n# body\n")
+    (tmp_path / "broken.meta.yaml").write_text("name: broken\ntitle: Broken\nsummary: hi\n")
+
+    with pytest.raises(TemplateMetaError, match="failed schema validation"):
+        load_template("broken", gallery_dir=tmp_path)
+
+
 def test_load_template_with_mismatched_name_raises(tmp_path: Path) -> None:
     (tmp_path / "fine.dlm").write_text("---\ndlm_id: 01AAAA\nbase_model: foo\n---\n# body\n")
     # meta.name doesn't match the filename stem.
tests/unit/test_io_atomic.py (modified, 51 lines changed)
@@ -82,6 +82,10 @@ class TestNonceSuffix:
 
 
 class TestCleanupStaleTmp:
+    def test_cleanup_skips_directories(self, tmp_path: Path) -> None:
+        (tmp_path / "nested.tmp.999.deadbeef").mkdir()
+        assert atomic.cleanup_stale_tmp_files(tmp_path) == []
+
     def test_removes_only_dead_pid_tmp_files(self, tmp_path: Path) -> None:
         """Legacy nonce-less tmps still get cleaned up — back-compat for
         sweeps that span a pre-/post-upgrade writer on the same store."""
@@ -115,6 +119,41 @@ class TestCleanupStaleTmp:
         assert atomic.cleanup_stale_tmp_files(tmp_path) == []
         assert malformed.exists()
 
+    def test_cleanup_ignores_tmp_file_removed_between_list_and_unlink(self, tmp_path: Path) -> None:
+        doomed = tmp_path / "name.tmp.99999999.deadbeef"
+        doomed.write_bytes(b"x")
+
+        real_unlink = Path.unlink
+
+        def fake_unlink(self: Path, *args: object, **kwargs: object) -> None:
+            if self == doomed:
+                raise FileNotFoundError
+            real_unlink(self, *args, **kwargs)
+
+        with (
+            patch("dlm.io.atomic._is_alive", return_value=False),
+            patch("pathlib.Path.unlink", autospec=True, side_effect=fake_unlink),
+        ):
+            assert atomic.cleanup_stale_tmp_files(tmp_path) == []
+
+
+class TestTmpPid:
+    def test_invalid_regex_pid_falls_back_to_none(self, tmp_path: Path) -> None:
+        target = tmp_path / "file.bin.tmp.1234.deadbeef"
+
+        class FakeMatch:
+            @staticmethod
+            def group(name: str) -> str:
+                assert name == "pid"
+                return "not-a-pid"
+
+        fake_pattern = type(
+            "FakePattern", (), {"search": staticmethod(lambda _name: FakeMatch())}
+        )()
+
+        with patch("dlm.io.atomic._TMP_RE", fake_pattern):
+            assert atomic._tmp_pid(target) is None
+
 
 class TestIsAlive:
     def test_zero_or_negative_dead(self) -> None:
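The race test above patches `Path.unlink` with `autospec=True` so the bound instance arrives as `self`, letting the fake raise only for one doomed path. A standalone sketch of that mechanism under illustrative names (no dlm module is imported here):

```python
import tempfile
from pathlib import Path
from unittest.mock import patch

tmp = Path(tempfile.mkdtemp())
doomed = tmp / "name.tmp.99999999.deadbeef"
doomed.write_bytes(b"x")

real_unlink = Path.unlink


def fake_unlink(self: Path, *args: object, **kwargs: object) -> None:
    # Simulate another process deleting this one file between listing and unlink.
    if self == doomed:
        raise FileNotFoundError(self)
    real_unlink(self, *args, **kwargs)


raced = False
with patch("pathlib.Path.unlink", autospec=True, side_effect=fake_unlink):
    try:
        doomed.unlink()
    except FileNotFoundError:
        raced = True
```

`autospec=True` is what forwards `self` as the first positional argument; without it the side effect could never tell which path was being unlinked.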
tests/unit/test_main.py (added, 15 lines changed)
@@ -0,0 +1,15 @@
+"""Direct coverage for the `python -m dlm` entrypoint."""
+
+from __future__ import annotations
+
+import runpy
+
+
+def test_module_entrypoint_invokes_cli_main(monkeypatch) -> None:
+    called: list[bool] = []
+
+    monkeypatch.setattr("dlm.cli.app.main", lambda: called.append(True))
+
+    runpy.run_module("dlm", run_name="__main__")
+
+    assert called == [True]
tests/unit/test_package_init.py (added, 24 lines changed)
@@ -0,0 +1,24 @@
+"""Direct coverage for package-level version fallback wiring."""
+
+from __future__ import annotations
+
+import runpy
+from importlib.metadata import PackageNotFoundError
+from pathlib import Path
+from unittest.mock import patch
+
+_INIT_PATH = Path(__file__).resolve().parents[2] / "src" / "dlm" / "__init__.py"
+
+
+def test_package_init_reads_installed_version() -> None:
+    with patch("importlib.metadata.version", return_value="1.2.3"):
+        module_globals = runpy.run_path(str(_INIT_PATH))
+
+    assert module_globals["__version__"] == "1.2.3"
+
+
+def test_package_init_falls_back_when_package_metadata_is_missing() -> None:
+    with patch("importlib.metadata.version", side_effect=PackageNotFoundError):
+        module_globals = runpy.run_path(str(_INIT_PATH))
+
+    assert module_globals["__version__"] == "0.0.0+unknown"
tests/unit/train/cpt/test_embed_warmup.py (modified, 22 lines changed)
@@ -35,6 +35,22 @@ def _model(*, embed_frozen: bool = True, head_frozen: bool = True, tied: bool =
 
 
 class TestUnfreezeContextManager:
+    def test_missing_embedding_modules_yield_empty_list(self) -> None:
+        model = SimpleNamespace(
+            get_input_embeddings=lambda: None,
+            get_output_embeddings=lambda: None,
+        )
+        with unfreeze_embeddings_for(model) as weights:
+            assert weights == []
+
+    def test_modules_without_weight_are_skipped(self) -> None:
+        model = SimpleNamespace(
+            get_input_embeddings=lambda: SimpleNamespace(weight=None),
+            get_output_embeddings=lambda: SimpleNamespace(weight=None),
+        )
+        with unfreeze_embeddings_for(model) as weights:
+            assert weights == []
+
     def test_unfreezes_both_embeddings(self) -> None:
         model = _model(embed_frozen=True, head_frozen=True)
         with unfreeze_embeddings_for(model) as weights:
tests/unit/train/distributed/test_gpus.py (modified, 30 lines changed)
@@ -8,6 +8,10 @@ from dlm.train.distributed.gpus import GpuSpec, UnsupportedGpuSpecError, parse_g
 
 
 class TestParseGpus:
+    def test_none_raises_empty(self) -> None:
+        with pytest.raises(UnsupportedGpuSpecError, match="empty"):
+            parse_gpus(None)  # type: ignore[arg-type]
+
     def test_all_case_insensitive(self) -> None:
         for value in ("all", "ALL", "All"):
             spec = parse_gpus(value)
@@ -35,12 +39,20 @@ class TestParseGpus:
         with pytest.raises(UnsupportedGpuSpecError, match="non-integer"):
             parse_gpus("0,foo,1")
 
+    def test_empty_comma_list_rejected(self) -> None:
+        with pytest.raises(UnsupportedGpuSpecError, match="is empty"):
+            parse_gpus(", ,")
+
     def test_malformed_scalar_rejected(self) -> None:
         with pytest.raises(UnsupportedGpuSpecError, match="not `all`"):
             parse_gpus("xyz")
 
 
 class TestResolveGpuSpec:
+    def test_list_returns_requested_ids(self) -> None:
+        spec = GpuSpec(kind="list", value=(0, 2))
+        assert spec.resolve(device_count=4) == (0, 2)
+
     def test_all_returns_full_range(self) -> None:
         spec = GpuSpec(kind="all", value=None)
         assert spec.resolve(device_count=3) == (0, 1, 2)
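Taken together, these cases pin the `parse_gpus` contract: case-insensitive `all`, comma lists of ids, and distinct errors for empty input, blank lists, non-integer ids, and malformed scalars. A hypothetical re-implementation that satisfies the asserted messages; this is a sketch, not the `dlm.train.distributed.gpus` source:

```python
from __future__ import annotations

from dataclasses import dataclass


class UnsupportedGpuSpecError(ValueError):
    pass


@dataclass(frozen=True)
class GpuSpec:
    kind: str  # "all" or "list"
    value: tuple[int, ...] | None

    def resolve(self, *, device_count: int) -> tuple[int, ...]:
        if self.kind == "all":
            return tuple(range(device_count))
        assert self.value is not None
        return self.value


def parse_gpus(raw: str | None) -> GpuSpec:
    if raw is None or not raw.strip():
        raise UnsupportedGpuSpecError("gpu spec is empty")
    text = raw.strip()
    if text.lower() == "all":
        return GpuSpec(kind="all", value=None)
    if "," in text:
        parts = [p.strip() for p in text.split(",") if p.strip()]
        if not parts:
            raise UnsupportedGpuSpecError(f"gpu list {text!r} is empty")
        try:
            return GpuSpec(kind="list", value=tuple(int(p) for p in parts))
        except ValueError as exc:
            raise UnsupportedGpuSpecError(f"non-integer gpu id in {text!r}") from exc
    try:
        return GpuSpec(kind="list", value=(int(text),))
    except ValueError as exc:
        raise UnsupportedGpuSpecError(f"{text!r} is not `all` or a gpu id list") from exc
```

Splitting parse (`parse_gpus`) from resolution (`GpuSpec.resolve`) mirrors the test structure above: validation errors surface at parse time, while `device_count` only matters when `all` is expanded.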
tests/unit/train/distributed/test_rank_env.py (modified, 10 lines changed)
@@ -50,6 +50,10 @@ class TestDetectRank:
         monkeypatch.setenv("LOCAL_RANK", "2")
         assert detect_rank() == 2
 
+    def test_negative_rank_clamped_to_zero(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        monkeypatch.setenv("RANK", "-3")
+        assert detect_rank() == 0
+
     def test_malformed_raises(self, monkeypatch: pytest.MonkeyPatch) -> None:
         monkeypatch.setenv("RANK", "oops")
         with pytest.raises(ValueError, match="RANK"):
tests/unit/train/distributed/test_rank_io.py (modified, 8 lines changed)
@@ -108,3 +108,8 @@ class TestGatherMetrics:
         out = gather_metrics(acc, {"loss": 2.0})
         # mean of [2.0, 3.0] = 2.5
         assert out["loss"] == pytest.approx(2.5)
+
+    def test_gather_none_falls_back_to_original_value(self) -> None:
+        acc = SimpleNamespace(gather_for_metrics=lambda tensor: None, is_main_process=True)
+        out = gather_metrics(acc, {"loss": 2.0})
+        assert out == {"loss": 2.0}
tests/unit/train/gate/test_module.py (modified, 26 lines changed)
@@ -81,3 +81,26 @@ class TestGateMetadataJson:
                     "mode": "trained",
                 }
             )
+
+    def test_non_integer_dims_rejected(self) -> None:
+        with pytest.raises(GateConfigError, match="input_dim/hidden_proj_dim"):
+            GateMetadata.from_json(
+                {
+                    "input_dim": "8",
+                    "hidden_proj_dim": 4,
+                    "adapter_names": ["a", "b"],
+                    "mode": "trained",
+                }
+            )
+
+    def test_non_numeric_entropy_rejected(self) -> None:
+        with pytest.raises(GateConfigError, match="entropy_lambda"):
+            GateMetadata.from_json(
+                {
+                    "input_dim": 8,
+                    "hidden_proj_dim": 4,
+                    "adapter_names": ["a", "b"],
+                    "mode": "trained",
+                    "entropy_lambda": "high",
+                }
+            )
tests/unit/train/gate/test_orchestrator.py (modified, 22 lines changed)
@@ -171,6 +171,22 @@ class TestRunPostSftGate:
         )
         assert result is None
 
+    def test_exactly_one_named_adapter_returns_none(self, tmp_path: Path) -> None:
+        parsed = _parsed((_prose("x", adapter="solo"),), gate_enabled=False, adapters=("solo",))
+        object.__setattr__(parsed.frontmatter.training.gate, "enabled", True)
+        store = StorePath(root=tmp_path)
+        store.ensure_layout()
+        recorder = MetricsRecorder(tmp_path)
+        result = run_post_sft_gate(
+            store,
+            parsed,
+            run_id=1,
+            recorder=recorder,
+            embed=lambda _p: _tensor(4),
+            input_dim=4,
+        )
+        assert result is None
+
     def test_cold_start_fallback_records_uniform_events(self, tmp_path: Path) -> None:
         parsed = _parsed((_prose("only-a", adapter="a"),))
         store = StorePath(root=tmp_path)
tests/unit/train/gate/test_trainer.py (modified, 30 lines changed)
@@ -14,6 +14,7 @@ from dlm.train.gate import (
     load_gate,
     train_gate,
 )
+from dlm.train.gate.errors import GateTrainingError
 from dlm.train.gate.paths import gate_config_path, gate_save_path
 
 
@@ -162,6 +163,23 @@ class TestConvergence:
         )
         assert len(seen) == 7
 
+    def test_non_finite_loss_raises(self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> None:
+        import torch
+
+        store = _store(tmp_path)
+        samples = _synthetic_samples(per_class=5, input_dim=4, seed=0)
+        monkeypatch.setattr(torch, "isfinite", lambda value: torch.tensor(False))
+        with pytest.raises(GateTrainingError, match="non-finite"):
+            train_gate(
+                store,  # type: ignore[arg-type]
+                samples,
+                adapter_names=["a", "b"],
+                input_dim=4,
+                steps=1,
+                cold_start_floor=1,
+                batch_size=4,
+            )
+
 
 class TestLoadGateErrors:
     def test_missing_config(self, tmp_path: Path) -> None:
tests/unit/train/multi_adapter/test_orchestrator.py (modified, 72 lines changed)
@@ -125,6 +125,72 @@ class TestSingleAdapterPassthrough:
         # Flat layout: version dir lives under adapter/versions/, not a named subdir.
         assert store.adapter_version(1).is_dir()
 
+    def test_one_named_adapter_still_passthroughs(self, tmp_path: Path) -> None:
+        dlm_id = "01HZ4X7TGZM3J1A2B3C4D5E6FZ"
+        store = _seed_store(tmp_path, dlm_id)
+        parsed = ParsedDlm(
+            frontmatter=DlmFrontmatter(
+                dlm_id=dlm_id,
+                base_model="smollm2-135m",
+                training=TrainingConfig(
+                    seed=42,
+                    adapters={"knowledge": AdapterConfig()},
+                ),
+            ),
+            sections=(
+                Section(type=SectionType.PROSE, content="Shared domain prose."),
+                Section(
+                    type=SectionType.INSTRUCTION,
+                    content="### Q\nfacts?\n### A\nfacts.",
+                    adapter="knowledge",
+                ),
+            ),
+        )
+        results = run_all(
+            store,
+            parsed,
+            BASE_MODELS["smollm2-135m"],
+            _plan(),
+            mode="fresh",
+            trainer_factory=_mock_trainer_factory,
+        )
+        assert len(results) == 1
+
+    def test_gate_enabled_with_one_named_adapter_still_returns_one_result(
+        self, tmp_path: Path
+    ) -> None:
+        dlm_id = "01HZ4X7TGZM3J1A2B3C4D5E6FY"
+        store = _seed_store(tmp_path, dlm_id)
+        parsed = ParsedDlm(
+            frontmatter=DlmFrontmatter(
+                dlm_id=dlm_id,
+                base_model="smollm2-135m",
+                training=TrainingConfig(
+                    seed=42,
+                    adapters={"knowledge": AdapterConfig()},
+                    gate=GateConfig(enabled=False),
+                ),
+            ),
+            sections=(
+                Section(type=SectionType.PROSE, content="Shared domain prose."),
+                Section(
+                    type=SectionType.INSTRUCTION,
+                    content="### Q\nfacts?\n### A\nfacts.",
+                    adapter="knowledge",
+                ),
+            ),
+        )
+        object.__setattr__(parsed.frontmatter.training.gate, "enabled", True)
+        results = run_all(
+            store,
+            parsed,
+            BASE_MODELS["smollm2-135m"],
+            _plan(),
+            mode="fresh",
+            trainer_factory=_mock_trainer_factory,
+        )
+        assert len(results) == 1
+
 
 class TestMultiAdapterOrchestration:
     def test_trains_each_declared_adapter(self, tmp_path: Path) -> None:
tests/unit/train/preference/test_dpo_phase.py (modified, 44 lines changed)
@@ -7,11 +7,15 @@ manifest → state-sidecar without importing HF/TRL or torch.
 
 from __future__ import annotations
 
+from dataclasses import replace
 from pathlib import Path
 from types import SimpleNamespace
 from typing import Any
 from unittest.mock import MagicMock
 
+import pytest
+
+import dlm.train.preference.dpo_phase as dpo_phase
 from dlm.base_models import BASE_MODELS
 from dlm.doc.parser import ParsedDlm
 from dlm.doc.schema import DlmFrontmatter, PreferenceConfig, TrainingConfig
@@ -220,3 +224,29 @@ class TestRunSteps:
             trainer_factory=_capturing_factory,
         )
         assert captured["include_auto_mined"] is False
+
+    def test_writes_lock_when_decision_requests_it(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        store = for_dlm("01DPOTEST5", home=tmp_path)
+        _seed_prior_sft(store, dlm_id="01DPOTEST5")
+        parsed = replace(_parsed_with_preferences(), source_path=tmp_path / "doc.dlm")
+        persist_lock = MagicMock()
+
+        monkeypatch.setattr(
+            dpo_phase,
+            "_validate_or_abort_lock",
+            lambda **_kwargs: SimpleNamespace(should_write_lock=True),
+        )
+        monkeypatch.setattr(dpo_phase, "_persist_lock", persist_lock)
+
+        run(
+            store,
+            parsed,
+            BASE_MODELS["smollm2-135m"],
+            _plan(),
+            reference_adapter_version=1,
+            trainer_factory=_mock_factory,
+        )
+
+        persist_lock.assert_called_once()
tests/unit/train/preference/test_orpo_phase.py (modified, 47 lines changed)
@@ -8,11 +8,15 @@ test; audit-07 B3 closes the 0% coverage gap.
 
 from __future__ import annotations
 
+from dataclasses import replace
 from pathlib import Path
 from types import SimpleNamespace
 from typing import Any
 from unittest.mock import MagicMock
 
+import pytest
+
+import dlm.train.preference.orpo_phase as orpo_phase
 from dlm.base_models import BASE_MODELS
 from dlm.doc.parser import ParsedDlm
 from dlm.doc.schema import DlmFrontmatter, PreferenceConfig, TrainingConfig
@@ -260,6 +264,32 @@ class TestRunSteps:
         )
         assert captured["max_steps"] == 25
 
+    def test_writes_lock_when_decision_requests_it(
+        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
+    ) -> None:
+        store = for_dlm("01ORPOTEST5", home=tmp_path)
+        _seed_prior_sft(store, dlm_id="01ORPOTEST5")
+        parsed = replace(_parsed_with_preferences(), source_path=tmp_path / "doc.dlm")
+        persist_lock = MagicMock()
+
+        monkeypatch.setattr(
+            orpo_phase,
+            "_validate_or_abort_lock",
+            lambda **_kwargs: SimpleNamespace(should_write_lock=True),
+        )
+        monkeypatch.setattr(orpo_phase, "_persist_lock", persist_lock)
+
+        run(
+            store,
+            parsed,
+            BASE_MODELS["smollm2-135m"],
+            _plan(),
+            reference_adapter_version=1,
+            trainer_factory=_mock_factory,
+        )
+
+        persist_lock.assert_called_once()
+
 
 class TestLockModes:
     def test_ignore_mode_skips_lock_write(self, tmp_path: Path) -> None:
tests/unit/train/preference/test_phase_orchestrator.py (modified, 46 lines changed)
@@ -14,6 +14,7 @@ from unittest.mock import MagicMock
 
 import pytest
 
+import dlm.train.preference.phase_orchestrator as phase_orchestrator
 from dlm.doc.schema import PreferenceConfig
 from dlm.doc.sections import Section, SectionType
 from dlm.train.preference.errors import (
@@ -176,6 +177,23 @@ class TestDispatcherSftOnly:
         _, kwargs = sft.call_args
         assert kwargs["strict_metrics"] is True
 
+    def test_sft_phase_forwards_world_size_to_sft_runner(self) -> None:
+        sft = MagicMock(return_value=_FakeRunResult(adapter_version=1))
+
+        run_phases(
+            store=MagicMock(),
+            parsed=_parsed([_prose()]),
+            spec=MagicMock(),
+            plan=MagicMock(),
+            phase="sft",
+            world_size=4,
+            sft_runner=sft,
+            dpo_runner=MagicMock(),
+        )
+
+        _, kwargs = sft.call_args
+        assert kwargs["world_size"] == 4
+
     def test_sft_phase_skips_when_no_sft_content(self) -> None:
         sft = MagicMock()
         dpo = MagicMock()
@@ -378,6 +396,16 @@ class TestPhaseResult:
             pr.phase = "dpo"  # type: ignore[misc]
 
 
+class TestMethodRunner:
+    def test_method_runner_uses_registry_resolver(self, monkeypatch: pytest.MonkeyPatch) -> None:
+        fake = MagicMock()
+        monkeypatch.setattr(
+            "dlm.train.preference.method_registry.resolve",
+            lambda method: fake if method == "orpo" else None,
+        )
+        assert phase_orchestrator._method_runner("orpo") is fake
+
+
 class TestAutoEnableIntegration:
     """Auto-enable: when user didn't set `enabled` and preference
     content is present, DPO runs under `--phase all`."""
tests/unit/train/test_cache.py (added, 38 lines changed)
@@ -0,0 +1,38 @@
+from __future__ import annotations
+
+import logging
+import os
+
+from dlm.train.cache import DISABLE_ENV_VAR, disabled_cache, is_cache_disabled, set_disable_flag
+
+
+class TestCacheDisableFlag:
+    def test_disabled_false_by_default(self, monkeypatch) -> None:
+        monkeypatch.delenv(DISABLE_ENV_VAR, raising=False)
+        assert is_cache_disabled() is False
+
+    def test_set_disable_flag_sets_env_and_logs(self, monkeypatch, caplog) -> None:
+        monkeypatch.delenv(DISABLE_ENV_VAR, raising=False)
+        with caplog.at_level(logging.INFO):
+            set_disable_flag("cli flag")
+        assert is_cache_disabled() is True
+        assert "tokenized cache disabled (cli flag)" in caplog.text
+
+    def test_disabled_cache_restores_missing_prior_value(self, monkeypatch) -> None:
+        monkeypatch.delenv(DISABLE_ENV_VAR, raising=False)
+        with disabled_cache("scoped test"):
+            assert is_cache_disabled() is True
+        assert DISABLE_ENV_VAR not in os.environ
+        assert is_cache_disabled() is False
+
+    def test_disabled_cache_restores_prior_value(self, monkeypatch) -> None:
+        monkeypatch.setenv(DISABLE_ENV_VAR, "0")
+        with disabled_cache("scoped test"):
+            assert is_cache_disabled() is True
+        assert is_cache_disabled() is False
+
+    def test_disabled_cache_preserves_existing_disabled_state(self, monkeypatch) -> None:
+        monkeypatch.setenv(DISABLE_ENV_VAR, "1")
+        with disabled_cache("already disabled"):
+            assert is_cache_disabled() is True
+        assert is_cache_disabled() is True
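The new test file above pins down the env-flag contract of `dlm.train.cache` without showing the module itself. A minimal sketch consistent with these tests could look as follows — the environment-variable name and log wording are assumptions taken from what the tests assert, not the real module source:

```python
import contextlib
import logging
import os
from collections.abc import Iterator

logger = logging.getLogger(__name__)

# Assumed name; the real module defines its own DISABLE_ENV_VAR constant.
DISABLE_ENV_VAR = "DLM_DISABLE_TOKENIZED_CACHE"


def is_cache_disabled() -> bool:
    # Only the literal "1" counts as disabled, so a prior "0" reads as enabled.
    return os.environ.get(DISABLE_ENV_VAR) == "1"


def set_disable_flag(reason: str) -> None:
    # Set the flag process-wide and record why, matching the caplog assertion.
    os.environ[DISABLE_ENV_VAR] = "1"
    logger.info("tokenized cache disabled (%s)", reason)


@contextlib.contextmanager
def disabled_cache(reason: str) -> Iterator[None]:
    # Scoped disable: remember the prior value, set the flag, restore on exit.
    prior = os.environ.get(DISABLE_ENV_VAR)
    set_disable_flag(reason)
    try:
        yield
    finally:
        if prior is None:
            os.environ.pop(DISABLE_ENV_VAR, None)
        else:
            os.environ[DISABLE_ENV_VAR] = prior
```

The restore-on-exit branch is what the `restores_missing_prior_value` and `preserves_existing_disabled_state` tests exercise: a missing variable must stay missing afterwards, while a pre-existing `"1"` must survive the context manager.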
tests/unit/train/test_checkpoint_commit.py (modified, 118 lines changed)
@@ -6,6 +6,7 @@ from pathlib import Path
 
 import pytest
 
+import dlm.train.checkpoint_commit as checkpoint_commit
 from dlm.store.paths import for_dlm
 from dlm.train.checkpoint_commit import (
     _uniquify_rejected,
@@ -14,6 +15,7 @@ from dlm.train.checkpoint_commit import (
     fsync_dir,
     list_pending_versions,
 )
+from dlm.train.integrity import NaNWeightsError
 
 
 def _store(home: Path):
@@ -47,6 +49,12 @@ class TestAllocation:
         v1 = allocate_next_version(store)
         assert v1.name == "v0001"
 
+    def test_ignores_non_dir_entries(self, tmp_path: Path) -> None:
+        store = _store(tmp_path)
+        (store.adapter_versions / "v0009").write_text("not a directory")
+        v1 = allocate_next_version(store)
+        assert v1.name == "v0001"
+
 
 class TestCommitVersion:
     def test_happy_path_flips_current(self, tmp_path: Path) -> None:
@@ -97,6 +105,60 @@ class TestCommitVersion:
         v2 = allocate_next_version(store)
         assert v2.name == "v0002"
 
+    def test_nonfinite_writer_uniquify_failure_leaves_pending(
+        self, tmp_path: Path, monkeypatch
+    ) -> None:
+        store = _store(tmp_path)
+
+        def bad_writer(p: Path) -> None:
+            (p / "weights.safetensors").write_text("bad")
+            raise NaNWeightsError(["adapter.lora_A"])
+
+        def boom(_: Path) -> Path:
+            raise RuntimeError("no rejected slot")
+
+        monkeypatch.setattr(checkpoint_commit, "_uniquify_rejected", boom)
+
+        with pytest.raises(RuntimeError, match="no rejected slot"):
+            commit_version(store, bad_writer)
+
+        assert store.adapter_version(1).exists()
+        assert store.resolve_current_adapter() is None
+
+    def test_nonfinite_writer_rename_failure_still_reraises(
+        self, tmp_path: Path, monkeypatch
+    ) -> None:
+        store = _store(tmp_path)
+
+        def bad_writer(p: Path) -> None:
+            (p / "weights.safetensors").write_text("bad")
+            raise NaNWeightsError(["adapter.lora_B"])
+
+        def bad_rename(self: Path, target: Path) -> Path:
+            raise OSError("rename blocked")
+
+        monkeypatch.setattr(Path, "rename", bad_rename)
+
+        with pytest.raises(NaNWeightsError, match="NaN/inf"):
+            commit_version(store, bad_writer)
+
+        assert store.adapter_version(1).exists()
+        assert store.resolve_current_adapter() is None
+
+    def test_nonfinite_writer_renames_to_rejected_path(self, tmp_path: Path) -> None:
+        store = _store(tmp_path)
+
+        def bad_writer(p: Path) -> None:
+            (p / "weights.safetensors").write_text("bad")
+            raise NaNWeightsError(["adapter.lora_B"])
+
+        with pytest.raises(NaNWeightsError, match="NaN/inf"):
+            commit_version(store, bad_writer)
+
+        assert not store.adapter_version(1).exists()
+        assert (store.adapter_versions / "v0001-rejected").exists()
+        assert store.resolve_current_adapter() is None
+
 
 class TestListPending:
     def test_no_pending_when_all_committed(self, tmp_path: Path) -> None:
@@ -115,6 +177,19 @@ class TestListPending:
         pending = list_pending_versions(store)
         assert [p.name for p in pending] == [v1.name]
 
+    def test_named_adapter_pending_versions_report_orphans(self, tmp_path: Path) -> None:
+        store = _store(tmp_path)
+        orphan = allocate_next_version(store, adapter_name="writer")
+        commit_version(store, lambda p: (p / "a").write_text("a"), adapter_name="writer")
+        pending = list_pending_versions(store, adapter_name="writer")
+        assert [p.name for p in pending] == [orphan.name]
+
+    def test_named_adapter_pending_versions_without_current(self, tmp_path: Path) -> None:
+        store = _store(tmp_path)
+        orphan = allocate_next_version(store, adapter_name="writer")
+        pending = list_pending_versions(store, adapter_name="writer")
+        assert pending == [orphan]
+
 
 class TestFsyncDir:
     def test_fsync_no_error_on_real_dir(self, tmp_path: Path) -> None:
@@ -123,6 +198,13 @@
 
 
 class TestRejectedPathAllocation:
+    def test_returns_first_available_suffix(self, tmp_path: Path) -> None:
+        pending = tmp_path / "v0001"
+        pending.mkdir()
+        (tmp_path / "v0001-rejected").mkdir()
+        (tmp_path / "v0001-rejected-1").mkdir()
+        assert _uniquify_rejected(pending) == tmp_path / "v0001-rejected-2"
+
    def test_raises_after_1000_collisions(self, tmp_path: Path) -> None:
        pending = tmp_path / "v0001"
        pending.mkdir()
tests/unit/train/test_inject.py (modified, 10 lines changed)
@@ -37,6 +37,10 @@ class TestQueue:
         with pytest.raises(ValueError, match="capacity must be positive"):
             InjectedProbeQueue(capacity=0)
 
+    def test_capacity_property_reflects_configured_limit(self) -> None:
+        q = InjectedProbeQueue(capacity=8)
+        assert q.capacity == 8
+
     def test_depth_reports_current(self) -> None:
         q = InjectedProbeQueue(capacity=8)
         assert q.depth() == 0
tests/unit/train/test_integrity.py (modified, 9 lines changed)
@@ -87,6 +87,9 @@ class TestAssertEvalFinite:
         # "check iff eval ran", so no eval entries means nothing to check.
         assert_eval_finite([{"loss": 2.0, "step": 1}, {"loss": 1.5, "step": 2}])
 
+    def test_non_dict_entries_ignored(self) -> None:
+        assert_eval_finite([{"loss": 2.0, "step": 1}, "not-a-dict"])
+
     def test_finite_eval_does_not_raise(self) -> None:
         assert_eval_finite([{"eval_loss": 1.8, "step": 10}])
 
tests/unit/train/test_logger.py (modified, 36 lines changed)
@@ -3,6 +3,7 @@
 from __future__ import annotations
 
 import json
+from dataclasses import dataclass
 from pathlib import Path
 
 import pytest
@@ -11,6 +12,11 @@ from dlm.train.logger import Banner, StepLogger, log_path_for
 
 
 class TestContextManager:
+    def test_path_property_round_trips(self, tmp_path: Path) -> None:
+        path = tmp_path / "x.jsonl"
+        log = StepLogger(path)
+        assert log.path == path
+
     def test_outside_context_raises(self, tmp_path: Path) -> None:
         log = StepLogger(tmp_path / "x.jsonl")
         with pytest.raises(RuntimeError, match="not open"):
@@ -94,6 +100,18 @@ class TestEventLogging:
         parsed = json.loads(p.read_text().strip())
         assert parsed["val_ppl"] == 4.5
 
+    def test_dataclass_fields_are_sanitized(self, tmp_path: Path) -> None:
+        @dataclass
+        class _Payload:
+            step: int
+            note: str
+
+        p = tmp_path / "run.jsonl"
+        with StepLogger(p) as log:
+            log.log_event("custom", payload=_Payload(step=3, note="ok"))
+        parsed = json.loads(p.read_text().strip())
+        assert parsed["payload"] == {"step": 3, "note": "ok"}
+
 
 class TestLogPath:
     def test_shape(self, tmp_path: Path) -> None:
tests/unit/train/test_rpc.py (modified, 134 lines changed)
@@ -10,6 +10,7 @@ assign (`port=0`).
 from __future__ import annotations
 
 import json
+import socket
 import urllib.error
 import urllib.request
 from collections.abc import Iterator
@@ -60,6 +61,42 @@ def _post(
     return resp.status, json.loads(resp.read())
 
 
+def _raw_post(
+    server: ProbeRpcServer,
+    *,
+    headers: dict[str, str],
+    body: bytes = b"",
+    path: str = "/rpc",
+) -> tuple[int, dict[str, Any]]:
+    host, port = server.address
+    lines = [
+        f"POST {path} HTTP/1.1",
+        f"Host: {host}:{port}",
+        *[f"{key}: {value}" for key, value in headers.items()],
+        "",
+        "",
+    ]
+    request = "\r\n".join(lines).encode("utf-8") + body
+    with socket.create_connection((host, port), timeout=5.0) as sock:
+        sock.sendall(request)
+        response = b""
+        while b"\r\n\r\n" not in response:
+            response += sock.recv(4096)
+        head, rest = response.split(b"\r\n\r\n", 1)
+        header_lines = head.decode("iso-8859-1").split("\r\n")
+        status = int(header_lines[0].split()[1])
+        parsed_headers: dict[str, str] = {}
+        for line in header_lines[1:]:
+            if ":" not in line:
+                continue
+            key, value = line.split(":", 1)
+            parsed_headers[key.lower()] = value.strip()
+        content_length = int(parsed_headers.get("content-length", "0"))
+        while len(rest) < content_length:
+            rest += sock.recv(4096)
+    return status, json.loads(rest[:content_length].decode("utf-8"))
+
+
 class TestHappyPath:
     def test_inject_probe_accepted(self, server: ProbeRpcServer) -> None:
         status, body = _post(
@@ -102,11 +139,65 @@ class TestMalformedPayload:
         assert status == 400
         assert "malformed" in body["error"].lower()
 
+    def test_invalid_content_length_400(self, server: ProbeRpcServer) -> None:
+        status, body = _raw_post(
+            server,
+            headers={
+                "Authorization": f"Bearer {_TOKEN}",
+                "Content-Type": "application/json",
+                "Content-Length": "nope",
+            },
+        )
+        assert status == 400
+        assert "content-length" in body["error"].lower()
+
+    def test_empty_body_400(self, server: ProbeRpcServer) -> None:
+        status, body = _raw_post(
+            server,
+            headers={
+                "Authorization": f"Bearer {_TOKEN}",
+                "Content-Type": "application/json",
+                "Content-Length": "0",
+            },
+        )
+        assert status == 400
+        assert "empty body" in body["error"].lower()
+
+    def test_oversized_body_400(self, server: ProbeRpcServer) -> None:
+        status, body = _raw_post(
+            server,
+            headers={
+                "Authorization": f"Bearer {_TOKEN}",
+                "Content-Type": "application/json",
+                "Content-Length": str(70 * 1024),
+            },
+        )
+        assert status == 400
+        assert "exceeds" in body["error"].lower()
+
+    def test_payload_must_be_object(self, server: ProbeRpcServer) -> None:
+        status, body = _post(server, body="[]")
+        assert status == 400
+        assert "json object" in body["error"].lower()
+
     def test_missing_prompt_400(self, server: ProbeRpcServer) -> None:
         status, body = _post(server, body={"method": "inject_probe", "params": {"reference": "a"}})
         assert status == 400
         assert "prompt" in body["error"].lower()
 
+    def test_params_must_be_object(self, server: ProbeRpcServer) -> None:
+        status, body = _post(server, body={"method": "inject_probe", "params": "bad"})
+        assert status == 400
+        assert "`params`" in body["error"]
+
+    def test_empty_reference_400(self, server: ProbeRpcServer) -> None:
+        status, body = _post(
+            server,
+            body={"method": "inject_probe", "params": {"prompt": "q", "reference": "   "}},
+        )
+        assert status == 400
+        assert "reference" in body["error"].lower()
+
     def test_non_string_tags_400(self, server: ProbeRpcServer) -> None:
         status, body = _post(
             server,
@@ -165,3 +256,20 @@ class TestConstruction:
     def test_empty_token_rejected(self) -> None:
         with pytest.raises(ValueError, match="bearer token"):
             ProbeRpcServer(host="127.0.0.1", port=0, token="", queue=InjectedProbeQueue())
+
+    def test_start_twice_rejected(self) -> None:
+        try:
+            srv = ProbeRpcServer(
+                host="127.0.0.1",
+                port=0,
+                token=_TOKEN,
+                queue=InjectedProbeQueue(),
+            )
+        except PermissionError as exc:
+            pytest.skip(f"loopback bind blocked on this host: {exc}")
+        srv.start()
+        try:
+            with pytest.raises(RuntimeError, match="already started"):
+                srv.start()
+        finally:
+            srv.stop()
tests/unit/train/test_state_sidecar.py (modified, 94 lines changed)
@@ -2,6 +2,7 @@
 
 from __future__ import annotations
 
+import builtins
 import hashlib
 import io
 import json
@@ -23,6 +24,8 @@ from dlm.train.state_sidecar import (
     TRAINING_RUN_FILENAME,
     VERSIONS_FILENAME,
     TrainingState,
+    _decode_python_random_state,
+    _encode_python_random_state,
     capture_runtime_versions,
     load_state,
     save_state,
@@ -280,6 +283,10 @@ class TestRngSidecar:
         # live in the JSON sidecar.
         assert "numpy_rng_state" not in payload
 
+    def test_python_random_none_helpers_round_trip(self) -> None:
+        assert _encode_python_random_state(None) is None
+        assert _decode_python_random_state(None) is None
+
 
 class TestLegacyV1Compat:
     """Audit-11 B7: one-release back-compat for pre-B7 sidecars.
@@ -334,6 +341,54 @@
         loaded = load_state(tmp_path, runtime_versions={"torch": torch.__version__})
         assert loaded["global_step"] == 10
 
+    def test_double_failed_torch_load_raises_integrity_error(
+        self, tmp_path: Path, monkeypatch
+    ) -> None:
+        save_state(tmp_path, _mock_state())
+
+        calls = {"count": 0}
+        real_load = torch.load
+
+        def fake_load(*args: Any, **kwargs: Any) -> Any:
+            calls["count"] += 1
+            if calls["count"] == 1:
+                raise RuntimeError("weights-only failed")
+            raise RuntimeError("legacy failed")
+
+        monkeypatch.setattr(torch, "load", fake_load)
+        with pytest.raises(ResumeIntegrityError, match="legacy load also failed"):
+            load_state(tmp_path, runtime_versions={"torch": torch.__version__})
+        monkeypatch.setattr(torch, "load", real_load)
+
+    def test_missing_sidecar_version_defaults_rng_to_none(
+        self, tmp_path: Path, monkeypatch
+    ) -> None:
+        save_state(tmp_path, _mock_state())
+        real_load = torch.load
+
+        def fake_load(*args: Any, **kwargs: Any) -> dict[str, Any]:
+            return {
+                "optimizer_state_dict": {"lr": 1e-4},
+                "scheduler_state_dict": {"step": 5},
+                "scaler_state_dict": None,
+                "torch_rng_state": torch.get_rng_state(),
+                "cuda_rng_state": None,
+                "global_step": 10,
+                "epoch": 0.5,
+                "best_val_loss": 0.9,
+                "dlm_manifest_hash": None,
+                "base_model_revision": "a" * 40,
+                "pinned_versions": {"torch": torch.__version__},
+                "use_qlora": False,
+            }
+
+        monkeypatch.setattr(torch, "load", fake_load)
+        loaded = load_state(tmp_path, runtime_versions={"torch": torch.__version__})
+        monkeypatch.setattr(torch, "load", real_load)
+
+        assert loaded["numpy_rng_state"] is None
+        assert loaded["python_random_state"] is None
+
 
 class TestCaptureRuntimeVersions:
     def test_torch_key_populated(self) -> None:
@@ -353,3 +408,15 @@
         reports that drove the run."""
         versions = capture_runtime_versions()
         assert "sway" in versions
+
+    def test_missing_import_returns_none(self, monkeypatch) -> None:
+        real_import = builtins.__import__
+
+        def fake_import(name: str, *args: Any, **kwargs: Any) -> Any:
+            if name == "bitsandbytes":
+                raise ImportError("forced missing package")
+            return real_import(name, *args, **kwargs)
+
+        monkeypatch.setattr(builtins, "__import__", fake_import)
+        versions = capture_runtime_versions()
+        assert versions["bitsandbytes"] is None
tests/unit/train/test_tokenization.py (modified, 33 lines changed)
@@ -12,12 +12,14 @@ from __future__ import annotations
 from pathlib import Path
 from typing import Any, cast
 
+import numpy as np
 import pytest
 from transformers import PreTrainedTokenizerBase
 
 from dlm.directives.cache import TokenizedCache
 from dlm.train.tokenization import (
     TokenizationStats,
+    _as_int_list,
     pretokenize_rows,
 )
 
@@ -232,3 +234,19 @@ class TestStatsDataclass:
         )
         with pytest.raises(dataclasses.FrozenInstanceError):
             s.total_sections = 3  # type: ignore[misc]
+
+
+class TestAsIntList:
+    def test_numpy_batch_of_one_is_flattened(self) -> None:
+        arr = np.asarray([[1, 2, 3]], dtype=np.int64)
+        assert _as_int_list(arr) == [1, 2, 3]
+
+    def test_tolist_like_object_is_flattened(self) -> None:
+        class _FakeTensor:
+            def tolist(self) -> list[list[int]]:
+                return [[4, 5, 6]]
+
+        assert _as_int_list(_FakeTensor()) == [4, 5, 6]
+
+    def test_plain_iterable_falls_back_to_iteration(self) -> None:
+        assert _as_int_list((7, 8, 9)) == [7, 8, 9]
tests/unit/train/test_trainer_helpers.pymodified
366 lines changed — click to load
@@ -8,14 +8,36 @@ testing directly.
88
 
99
 from __future__ import annotations
1010
 
11
+import logging
1112
 from pathlib import Path
12
-
13
+from types import SimpleNamespace
14
+from typing import cast
15
+from unittest.mock import MagicMock
16
+
17
+import pytest
18
+
19
+from dlm.base_models import BASE_MODELS
20
+from dlm.directives import ExpandResult, SourceProvenance
21
+from dlm.directives.discovery import DiscoveredConfig
22
+from dlm.directives.schema import DlmTrainingConfig
23
+from dlm.doc.parser import ParsedDlm
24
+from dlm.doc.schema import DlmFrontmatter, SourceDirective, TrainingConfig
25
+from dlm.doc.sections import Section, SectionType
26
+from dlm.lock import LockDecision, LockSchemaError, Severity
27
+from dlm.replay import ChangeSet
1328
 from dlm.train.trainer import (
29
+    _append_change_set_to_replay,
1430
     _append_training_run,
31
+    _attach_dlm_trainer_callback,
32
+    _build_candidate_lock,
33
+    _compute_weight_distribution,
34
+    _expand_directives,
1535
     _maybe_float,
36
+    _maybe_record_tokenization,
1637
     _next_run_id,
1738
     _sample_replay_rows,
1839
     _utc_naive,
40
+    _validate_or_abort_lock,
1941
 )
2042
 
2143
 # --- _maybe_float -----------------------------------------------------------
@@ -55,9 +77,10 @@ class TestUtcNaive:
5577
 # --- _sample_replay_rows ----------------------------------------------------
5678
 
5779
 
58
-class _FakeChangeSet:
59
-    def __init__(self, new_count: int) -> None:
60
-        self.new = [object() for _ in range(new_count)]
80
+def _fake_change_set(new_count: int) -> ChangeSet:
81
+    return ChangeSet(
82
+        new=[Section(type=SectionType.PROSE, content=f"row {i}") for i in range(new_count)]
83
+    )
6184
 
6285
 
6386
 class _EmptyReplay:
@@ -86,7 +109,7 @@ class TestSampleReplayRows:
86109
         replay = _EmptyReplay()
87110
         out = _sample_replay_rows(
88111
             replay,  # type: ignore[arg-type]
89
-            change_set=_FakeChangeSet(5),  # type: ignore[arg-type]
112
+            change_set=_fake_change_set(5),
90113
             seed=42,
91114
             adapter_version=1,
92115
         )
@@ -96,7 +119,7 @@ class TestSampleReplayRows:
96119
         replay = _WarmReplay(entries=200)
97120
         out = _sample_replay_rows(
98121
             replay,  # type: ignore[arg-type]
99
-            change_set=_FakeChangeSet(100),  # type: ignore[arg-type]
122
+            change_set=_fake_change_set(100),
100123
             seed=42,
101124
             adapter_version=1,
102125
         )
@@ -108,7 +131,7 @@ class TestSampleReplayRows:
108131
         replay = _WarmReplay(entries=100)
109132
         _sample_replay_rows(
110133
             replay,  # type: ignore[arg-type]
111
-            change_set=_FakeChangeSet(0),  # |new| = 0 → k = max(32, 0) = 32
134
+            change_set=_fake_change_set(0),  # |new| = 0 → k = max(32, 0) = 32
112135
             seed=0,
113136
             adapter_version=1,
114137
         )
@@ -123,13 +146,13 @@ class TestSampleReplayRows:
123146
         # both sample_rows calls receive an equal-state Random instance.
124147
         _sample_replay_rows(
125148
             replay1,  # type: ignore[arg-type]
126
-            change_set=_FakeChangeSet(5),  # type: ignore[arg-type]
149
+            change_set=_fake_change_set(5),
127150
             seed=7,
128151
             adapter_version=3,
129152
         )
130153
         _sample_replay_rows(
131154
             replay2,  # type: ignore[arg-type]
132
-            change_set=_FakeChangeSet(5),  # type: ignore[arg-type]
155
+            change_set=_fake_change_set(5),
133156
             seed=7,
134157
             adapter_version=3,
135158
         )
@@ -151,6 +174,34 @@ def _bootstrap_store(tmp_path: Path) -> object:
151174
     return store
152175
 
153176
 
177
+_SOURCE_PATH_SENTINEL = object()
178
+
179
+
180
+def _parsed(
181
+    tmp_path: Path,
182
+    *,
183
+    source_path: object = _SOURCE_PATH_SENTINEL,
184
+    sections: tuple[Section, ...] | None = None,
185
+    sources: tuple[SourceDirective, ...] | None = None,
186
+) -> ParsedDlm:
187
+    resolved_source_path: Path | None
188
+    if source_path is _SOURCE_PATH_SENTINEL:
189
+        resolved_source_path = tmp_path / "doc.dlm"
190
+        resolved_source_path.write_text("placeholder .dlm body\n", encoding="utf-8")
191
+    else:
192
+        assert source_path is None or isinstance(source_path, Path)
193
+        resolved_source_path = source_path
194
+    return ParsedDlm(
195
+        frontmatter=DlmFrontmatter(
196
+            dlm_id="01HZ4X7TGZM3J1A2B3C4D5E6F7",
197
+            base_model="smollm2-135m",
198
+            training=TrainingConfig(seed=42, sources=sources),
199
+        ),
200
+        sections=sections or (Section(type=SectionType.PROSE, content="x"),),
201
+        source_path=resolved_source_path,
202
+    )
203
+
204
+
154205
 class TestNextRunId:
155206
     def test_missing_manifest_returns_1(self, tmp_path: Path) -> None:
156207
         """Edge case: manifest not yet written → fresh run."""
@@ -308,3 +359,243 @@ class TestSnapshotTrainingState:
308359
         )
309360
         assert state["scaler_state_dict"] is None
310361
         assert state["use_qlora"] is True
362
+
363
+
364
+class TestAttachDlmTrainerCallback:
365
+    def test_returns_when_trainer_has_no_add_callback(self) -> None:
366
+        _attach_dlm_trainer_callback(
367
+            trainer=SimpleNamespace(),
368
+            recorder=MagicMock(),
369
+            run_id=1,
370
+            step_logger=MagicMock(),
371
+        )
372
+
373
+    def test_warns_and_swallows_callback_attachment_errors(
374
+        self,
375
+        caplog: pytest.LogCaptureFixture,
376
+    ) -> None:
377
+        caplog.set_level(logging.WARNING, logger="dlm.train.trainer")
378
+        trainer = SimpleNamespace(add_callback=MagicMock(side_effect=RuntimeError("boom")))
379
+
380
+        _attach_dlm_trainer_callback(
381
+            trainer=trainer,
382
+            recorder=MagicMock(),
383
+            run_id=1,
384
+            step_logger=MagicMock(),
385
+        )
386
+
387
+        assert "failed to attach DlmTrainerCallback" in caplog.text
388
+
389
+
390
+class TestMaybeRecordTokenization:
391
+    def test_missing_trainer_stats_is_a_no_op(self) -> None:
392
+        recorder = MagicMock()
393
+
394
+        _maybe_record_tokenization(
395
+            recorder=recorder,
396
+            run_id=1,
397
+            trainer=SimpleNamespace(),
398
+        )
399
+
400
+        recorder.record_tokenization.assert_not_called()
401
+
402
+
+class TestAppendChangeSetToReplay:
+    def test_all_media_change_set_does_not_append(self) -> None:
+        replay = MagicMock()
+        change_set = SimpleNamespace(
+            new=[
+                Section(type=SectionType.IMAGE, content="", media_path="hero.png"),
+                Section(
+                    type=SectionType.AUDIO,
+                    content="",
+                    media_path="clip.wav",
+                    media_transcript="spoken transcript",
+                ),
+            ]
+        )
+
+        _append_change_set_to_replay(
+            replay,
+            cast(ChangeSet, change_set),
+            run_id=7,
+        )
+
+        replay.append_many.assert_not_called()
+
+
+class TestBuildCandidateLock:
+    def test_requires_source_path(self, tmp_path: Path) -> None:
+        parsed = _parsed(tmp_path, source_path=None)
+
+        with pytest.raises(ValueError, match="source_path is required"):
+            _build_candidate_lock(
+                parsed=parsed,
+                spec=BASE_MODELS["smollm2-135m"],
+                seed=42,
+                run_id=1,
+                versions={"torch": "2.4.0"},
+                determinism_class="strict",
+                capabilities=None,
+            )
+
+
+class TestValidateOrAbortLock:
+    def test_default_mode_reraises_unreadable_prior_lock(self, tmp_path: Path) -> None:
+        store = _bootstrap_store(tmp_path)
+        parsed = _parsed(tmp_path)
+        (store.root / "dlm.lock").write_text("{not json", encoding="utf-8")  # type: ignore[attr-defined]
+
+        with pytest.raises(LockSchemaError):
+            _validate_or_abort_lock(
+                store=store,  # type: ignore[arg-type]
+                parsed=parsed,
+                spec=BASE_MODELS["smollm2-135m"],
+                seed=42,
+                run_id=1,
+                versions={"torch": "2.4.0"},
+                determinism_class="strict",
+                capabilities=None,
+                lock_mode="default",
+            )
+
+    def test_logs_warning_mismatches_when_validator_allows_proceed(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+        caplog: pytest.LogCaptureFixture,
+    ) -> None:
+        import dlm.train.trainer as trainer_mod
+
+        store = _bootstrap_store(tmp_path)
+        parsed = _parsed(tmp_path)
+        decision = LockDecision(
+            action="proceed_with_warnings",
+            mismatches=[(Severity.WARN, "torch minor-version drift")],
+            should_write_lock=True,
+        )
+        monkeypatch.setattr(trainer_mod, "load_lock", lambda _root: object())
+        monkeypatch.setattr(
+            trainer_mod,
+            "validate_lock",
+            lambda _prior, _candidate, mode="default": decision,
+        )
+        caplog.set_level(logging.WARNING, logger="dlm.train.trainer")
+
+        got = _validate_or_abort_lock(
+            store=store,  # type: ignore[arg-type]
+            parsed=parsed,
+            spec=BASE_MODELS["smollm2-135m"],
+            seed=42,
+            run_id=1,
+            versions={"torch": "2.4.0"},
+            determinism_class="strict",
+            capabilities=None,
+            lock_mode="default",
+        )
+
+        assert got == decision
+        assert "dlm.lock drift: torch minor-version drift" in caplog.text
+
+
+class TestComputeWeightDistribution:
+    def test_counts_rows_when_directive_weights_are_active(self, tmp_path: Path) -> None:
+        parsed = _parsed(
+            tmp_path,
+            sections=(Section(type=SectionType.PROSE, content="note", tags={"kind": "note"}),),
+        )
+        discovered = (
+            DiscoveredConfig(
+                anchor=tmp_path,
+                config=DlmTrainingConfig(weights={"kind": {"note": 2.0}}),
+                ignore_rules=(),
+            ),
+        )
+
+        dist = _compute_weight_distribution(parsed=parsed, directive_discovered=discovered)
+
+        assert dist == {"kind": {"note": 1}}
+
+
+class TestExpandDirectives:
+    def test_returns_original_parsed_when_expansion_finds_no_sections(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        parsed = _parsed(
+            tmp_path,
+            sources=(SourceDirective(path="corpus"),),
+        )
+        discovered = (
+            DiscoveredConfig(
+                anchor=tmp_path,
+                config=DlmTrainingConfig(),
+                ignore_rules=(),
+            ),
+        )
+
+        def _fake_expand_sources(
+            parsed_arg: ParsedDlm,
+            *,
+            base_path: Path,
+        ) -> ExpandResult:
+            assert parsed_arg is parsed
+            assert parsed.source_path is not None
+            assert base_path == parsed.source_path.parent
+            return ExpandResult(
+                sections=(),
+                provenance=(SourceProvenance(path="corpus", file_count=0, total_bytes=0),),
+                discovered=discovered,
+            )
+
+        monkeypatch.setattr("dlm.directives.expand_sources", _fake_expand_sources)
+
+        new_parsed, provenance, got_discovered = _expand_directives(parsed)
+
+        assert new_parsed is parsed
+        assert provenance[0].file_count == 0
+        assert got_discovered == discovered
+
+    def test_falls_back_to_cwd_and_logs_when_sections_expand(
+        self,
+        tmp_path: Path,
+        monkeypatch: pytest.MonkeyPatch,
+        caplog: pytest.LogCaptureFixture,
+    ) -> None:
+        parsed = _parsed(
+            tmp_path,
+            source_path=None,
+            sources=(SourceDirective(path="corpus"),),
+        )
+        captured: dict[str, Path] = {}
+
+        def _fake_expand_sources(
+            parsed_arg: ParsedDlm,
+            *,
+            base_path: Path,
+        ) -> ExpandResult:
+            captured["base_path"] = base_path
+            assert parsed_arg is parsed
+            return ExpandResult(
+                sections=(Section(type=SectionType.PROSE, content="expanded prose"),),
+                provenance=(SourceProvenance(path="corpus", file_count=1, total_bytes=14),),
+                discovered=(
+                    DiscoveredConfig(
+                        anchor=base_path,
+                        config=DlmTrainingConfig(),
+                        ignore_rules=(),
+                    ),
+                ),
+            )
+
+        monkeypatch.setattr("dlm.directives.expand_sources", _fake_expand_sources)
+        caplog.set_level(logging.INFO, logger="dlm.train.trainer")
+
+        new_parsed, provenance, discovered = _expand_directives(parsed)
+
+        assert captured["base_path"] == Path.cwd()
+        assert len(new_parsed.sections) == len(parsed.sections) + 1
+        assert provenance[0].path == "corpus"
+        assert len(discovered) == 1
+        assert "directives: expanded 1 file(s) across 1 source(s)" in caplog.text
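The attach-callback tests above pin down a warn-and-swallow contract: skip trainers without `add_callback`, and log (never raise) when attachment fails. A minimal sketch of that pattern, assuming a hypothetical `attach_callback_sketch` helper rather than the real `_attach_dlm_trainer_callback` in `dlm/train/trainer.py`:

```python
import logging
from types import SimpleNamespace

logger = logging.getLogger("dlm.train.trainer")


def attach_callback_sketch(trainer: object, callback: object) -> bool:
    """Attach a callback if the trainer supports it; warn instead of raising."""
    add = getattr(trainer, "add_callback", None)
    if add is None:
        # Trainer has no add_callback hook: silently skip, as the first test expects.
        return False
    try:
        add(callback)
    except Exception:
        # Never let a telemetry hook break training; log and move on.
        logger.warning("failed to attach DlmTrainerCallback", exc_info=True)
        return False
    return True
```

The shape mirrors what both tests assert: a bare `SimpleNamespace` is a no-op, and a `RuntimeError` from `add_callback` ends up in the log rather than propagating.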
tests/unit/watch/test_debounce.py (modified, 16 lines changed)
@@ -2,6 +2,8 @@
 
 from __future__ import annotations
 
+from unittest.mock import patch
+
 import pytest
 
 from dlm.watch.debounce import Debouncer
@@ -77,3 +79,8 @@ class TestDebouncerValidation:
             Debouncer(quiet_seconds=0)
         with pytest.raises(ValueError, match="quiet_seconds"):
             Debouncer(quiet_seconds=-0.1)
+
+    def test_default_clock_uses_time_monotonic(self) -> None:
+        d = Debouncer(quiet_seconds=0.4)
+        with patch("time.monotonic", return_value=12.5):
+            assert d._now() == 12.5
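The new test confirms the default clock is `time.monotonic`, and the validation tests require a positive `quiet_seconds`. A debouncer of the shape these tests assume could be sketched like this (a sketch only; the real implementation lives in `dlm/watch/debounce.py` and its method names may differ):

```python
import time


class DebouncerSketch:
    """Reports quiet only after quiet_seconds have elapsed since the last event."""

    def __init__(self, quiet_seconds: float) -> None:
        if quiet_seconds <= 0:
            raise ValueError("quiet_seconds must be positive")
        self.quiet_seconds = quiet_seconds
        self._last_event: float | None = None

    def _now(self) -> float:
        # Monotonic clock: immune to wall-clock adjustments (NTP, DST),
        # which is why the test patches time.monotonic rather than time.time.
        return time.monotonic()

    def record_event(self) -> None:
        self._last_event = self._now()

    def is_quiet(self) -> bool:
        if self._last_event is None:
            return True
        return self._now() - self._last_event >= self.quiet_seconds
```

Routing all time reads through `_now()` is what makes the patched-clock test possible: the test can pin the clock without touching the debounce logic itself.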
tests/unit/watch/test_watcher_filter.py (modified, 34 lines changed)
@@ -45,3 +45,34 @@ class TestFilterEvents:
         target = tmp_path / "gone.dlm"
         batch: set[tuple[object, str]] = {("added", str(target))}
         assert filter_events_for_path(batch, target) is True
+
+    def test_target_resolve_oserror_falls_back_to_plain_string(
+        self, tmp_path: Path, monkeypatch
+    ) -> None:
+        target = tmp_path / "doc.dlm"
+        target.write_text("x")
+        batch: set[tuple[object, str]] = {("modified", str(target))}
+
+        monkeypatch.setattr(Path, "resolve", lambda self: (_ for _ in ()).throw(OSError("boom")))
+
+        assert filter_events_for_path(batch, target) is True
+
+    def test_raw_path_resolve_oserror_falls_back_to_raw_path_string(
+        self,
+        tmp_path: Path,
+        monkeypatch,
+    ) -> None:
+        target = tmp_path / "doc.dlm"
+        target.write_text("x")
+        batch: set[tuple[object, str]] = {("modified", str(target))}
+        real_path = Path
+
+        class BrokenPath(Path):
+            _flavour = real_path()._flavour  # type: ignore[attr-defined]
+
+            def resolve(self) -> Path:
+                raise OSError("boom")
+
+        monkeypatch.setattr("dlm.watch.watcher.Path", BrokenPath)
+
+        assert filter_events_for_path(batch, target) is True
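Both new tests force `Path.resolve` to raise `OSError`, once for the watched target and once for the raw event path. The comparison they imply resolves both sides when possible and falls back to plain strings otherwise; a sketch under those assumptions (the hypothetical `filter_events_sketch` stands in for the real `filter_events_for_path`):

```python
from pathlib import Path


def filter_events_sketch(batch: set[tuple[object, str]], target: Path) -> bool:
    """Return True if any event in the batch refers to the target path."""
    try:
        target_key = str(target.resolve())
    except OSError:
        # Resolution can fail (permissions, dangling symlinks): compare as-is.
        target_key = str(target)
    for _change, raw_path in batch:
        try:
            raw_key = str(Path(raw_path).resolve())
        except OSError:
            raw_key = raw_path  # fall back to the raw event path string
        if raw_key == target_key:
            return True
    return False
```

The point of the fallback is that a transient resolution failure degrades to a cheaper string comparison instead of dropping the event, which is why both tests still expect `True`.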
tests/unit/watch/test_watcher_loop.py (added, 55 lines changed)
@@ -0,0 +1,55 @@
+"""Loop-level coverage for watch_for_changes and default stream wrapper."""
+
+from __future__ import annotations
+
+from collections.abc import Iterator
+from pathlib import Path
+from types import SimpleNamespace
+from unittest.mock import patch
+
+import pytest
+
+from dlm.watch.errors import WatchSetupError
+from dlm.watch.watcher import _default_event_stream, watch_for_changes
+
+
+def test_default_event_stream_wraps_watchfiles_iterator(tmp_path: Path) -> None:
+    seen: list[tuple[str, object | None]] = []
+    expected = [{("modified", str(tmp_path / "doc.dlm"))}]
+
+    def fake_watch(
+        path: str, *, stop_event: object | None = None
+    ) -> Iterator[set[tuple[object, str]]]:
+        seen.append((path, stop_event))
+        yield from expected
+
+    with patch.dict("sys.modules", {"watchfiles": SimpleNamespace(watch=fake_watch)}):
+        batches = list(_default_event_stream(tmp_path / "doc.dlm", stop_event="stop"))
+
+    assert batches == expected
+    assert seen == [(str(tmp_path), "stop")]
+
+
+def test_watch_for_changes_requires_existing_file(tmp_path: Path) -> None:
+    with pytest.raises(WatchSetupError, match="does not exist"):
+        watch_for_changes(tmp_path / "missing.dlm", lambda: None)
+
+
+def test_watch_for_changes_invokes_callback_for_matching_batches(tmp_path: Path) -> None:
+    target = tmp_path / "doc.dlm"
+    target.write_text("x")
+    seen: list[str] = []
+
+    def event_stream(
+        _path: Path, *, stop_event: object | None = None
+    ) -> Iterator[set[tuple[object, str]]]:
+        assert stop_event == "stop"
+        yield {("modified", str(tmp_path / "other.dlm"))}
+        yield {("modified", str(target))}
+        yield {("added", str(target))}
+
+    watch_for_changes(
+        target, lambda: seen.append("changed"), stop_event="stop", event_stream=event_stream
+    )
+
+    assert seen == ["changed", "changed"]
Diff truncated: 121 files.