style: ruff format pass + embed_warmup ARG002 ignore for HF callback protocol
SHA: b6deabb764cf7506bb56284fad6d257aa76ce586
Parent: 19f5a6c
Tree: 557a338

pyproject.toml (modified) @@ -137,6 +137,10 @@ ignore = [ | ||
| 137 | 137 | # will take so `--help` reflects the shipping surface — even though the |
| 138 | 138 | # stub body discards them. |
| 139 | 139 | "src/dlm/cli/commands.py" = ["ARG001"] |
| 140 | +# HuggingFace Trainer callbacks MUST accept `args`/`state`/`control` | |
| 141 | +# positionally even when the implementation only reads some of them — | |
| 142 | +# HF dispatches them by position. ARG002 for these wrappers is noise. | |
| 143 | +"src/dlm/train/cpt/embed_warmup.py" = ["ARG002"] | |
| 140 | 144 | |
| 141 | 145 | [tool.ruff.format] |
| 142 | 146 | quote-style = "double" |
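For context on the new ignore, here is a minimal, hypothetical HF-Trainer-style callback (not code from this repo) showing why ARG002 fires on these wrappers: the Trainer invokes each hook as `hook(args, state, control, **kwargs)` positionally, so all three parameters must stay in the signature even when the body only reads `state`.

    from typing import Any

    class StepLoggerCallback:
        """Hypothetical callback; mirrors the hook shape HF's Trainer dispatches to."""

        def on_step_end(self, args: Any, state: Any, control: Any, **kwargs: Any) -> None:
            # Only `state` is read; `args` and `control` are required by the
            # positional calling convention, so Ruff's ARG002 ("unused method
            # argument") would flag them without the per-file ignore above.
            if state.global_step % 100 == 0:
                print(f"step {state.global_step}")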
src/dlm/base_models/probes.py (modified) @@ -378,9 +378,7 @@ def probe_pretokenizer_hash( | ||
| 378 | 378 | # --- aggregate --------------------------------------------------------------- |
| 379 | 379 | |
| 380 | 380 | |
| 381 | -def run_all( | |
| 382 | - spec: BaseModelSpec, *, skip_export_probes: bool = False | |
| 383 | -) -> ProbeReport: | |
| 381 | +def run_all(spec: BaseModelSpec, *, skip_export_probes: bool = False) -> ProbeReport: | |
| 384 | 382 | """Run every probe; aggregate into a `ProbeReport`. |
| 385 | 383 | |
| 386 | 384 | `GatedModelError` from an individual probe propagates immediately — |
src/dlm/cli/commands.py (modified) @@ -139,9 +139,7 @@ def init_cmd( | ||
| 139 | 139 | from dlm.templates import TemplateError, apply_template |
| 140 | 140 | |
| 141 | 141 | try: |
| 142 | - applied_result = apply_template( | |
| 143 | - template, path, force=force, accept_license=True | |
| 144 | - ) | |
| 142 | + applied_result = apply_template(template, path, force=force, accept_license=True) | |
| 145 | 143 | except TemplateError as exc: |
| 146 | 144 | console.print(f"[red]init:[/red] {exc}") |
| 147 | 145 | raise typer.Exit(code=1) from exc |
@@ -1494,9 +1492,7 @@ def metrics_cmd( | ||
| 1494 | 1492 | parsed = parse_file(path) |
| 1495 | 1493 | store = for_dlm(parsed.frontmatter.dlm_id) |
| 1496 | 1494 | |
| 1497 | - runs = recent_runs( | |
| 1498 | - store.root, limit=limit, phase=phase, since=since_delta, run_id=run_id | |
| 1499 | - ) | |
| 1495 | + runs = recent_runs(store.root, limit=limit, phase=phase, since=since_delta, run_id=run_id) | |
| 1500 | 1496 | |
| 1501 | 1497 | if run_id is not None: |
| 1502 | 1498 | # Drill-down: show this run's steps + evals. |
@@ -1520,9 +1516,7 @@ def metrics_cmd( | ||
| 1520 | 1516 | writer.writerow(["step", "loss", "lr", "grad_norm", "val_loss"]) |
| 1521 | 1517 | eval_by_step = {e.step: e.val_loss for e in evals} |
| 1522 | 1518 | for s in steps: |
| 1523 | - writer.writerow( | |
| 1524 | - [s.step, s.loss, s.lr, s.grad_norm, eval_by_step.get(s.step)] | |
| 1525 | - ) | |
| 1519 | + writer.writerow([s.step, s.loss, s.lr, s.grad_norm, eval_by_step.get(s.step)]) | |
| 1526 | 1520 | return |
| 1527 | 1521 | console.print( |
| 1528 | 1522 | f"[green]run_id={run.run_id}[/green] phase={run.phase} " |
@@ -1545,9 +1539,7 @@ def metrics_cmd( | ||
| 1545 | 1539 | writer = csv.writer(sys.stdout) |
| 1546 | 1540 | writer.writerow(["run_id", "phase", "seed", "status", "started_at", "ended_at"]) |
| 1547 | 1541 | for r in runs: |
| 1548 | - writer.writerow( | |
| 1549 | - [r.run_id, r.phase, r.seed, r.status, r.started_at, r.ended_at] | |
| 1550 | - ) | |
| 1542 | + writer.writerow([r.run_id, r.phase, r.seed, r.status, r.started_at, r.ended_at]) | |
| 1551 | 1543 | return |
| 1552 | 1544 | |
| 1553 | 1545 | if not runs: |
@@ -1690,8 +1682,8 @@ def show_cmd( | ||
| 1690 | 1682 | raise typer.Exit(code=1) from exc |
| 1691 | 1683 | |
| 1692 | 1684 | store = for_dlm(parsed.frontmatter.dlm_id) |
| 1693 | - training_sources, discovered_configs = ( | |
| 1694 | - _summarize_training_sources_and_discovered(parsed, path.resolve().parent) | |
| 1685 | + training_sources, discovered_configs = _summarize_training_sources_and_discovered( | |
| 1686 | + parsed, path.resolve().parent | |
| 1695 | 1687 | ) |
| 1696 | 1688 | # Store may not exist yet (no `dlm train` run). Treat that as an |
| 1697 | 1689 | # informational state rather than an error — useful after `dlm init`. |
@@ -1830,9 +1822,7 @@ def _human_size(n: int) -> str: | ||
| 1830 | 1822 | return f"{n} PB" |
| 1831 | 1823 | |
| 1832 | 1824 | |
| 1833 | -def _summarize_training_sources( | |
| 1834 | - parsed: object, base_path: Path | |
| 1835 | -) -> list[dict[str, object]] | None: | |
| 1825 | +def _summarize_training_sources(parsed: object, base_path: Path) -> list[dict[str, object]] | None: | |
| 1836 | 1826 | """Best-effort resolution of `training.sources` for `dlm show`. |
| 1837 | 1827 | |
| 1838 | 1828 | Returns None when the frontmatter declares no directives; returns |
@@ -1905,9 +1895,7 @@ def _summarize_training_sources_and_discovered( | ||
| 1905 | 1895 | "has_ignore": bool(dc.ignore_rules), |
| 1906 | 1896 | "include": list(dc.config.include) if dc.config else [], |
| 1907 | 1897 | "exclude": list(dc.config.exclude) if dc.config else [], |
| 1908 | - "exclude_defaults": ( | |
| 1909 | - dc.config.exclude_defaults if dc.config else True | |
| 1910 | - ), | |
| 1898 | + "exclude_defaults": (dc.config.exclude_defaults if dc.config else True), | |
| 1911 | 1899 | "metadata": dict(dc.config.metadata) if dc.config else {}, |
| 1912 | 1900 | "ignore_rules": len(dc.ignore_rules), |
| 1913 | 1901 | } |
@@ -1915,9 +1903,7 @@ def _summarize_training_sources_and_discovered( | ||
| 1915 | 1903 | return records, discovered_records |
| 1916 | 1904 | |
| 1917 | 1905 | |
| 1918 | -def _summarize_training_cache( | |
| 1919 | - cache_dir: Path, store_root: Path | |
| 1920 | -) -> dict[str, object] | None: | |
| 1906 | +def _summarize_training_cache(cache_dir: Path, store_root: Path) -> dict[str, object] | None: | |
| 1921 | 1907 | """Return a JSON-friendly snapshot of the tokenized-section cache. |
| 1922 | 1908 | |
| 1923 | 1909 | None when the cache dir doesn't exist (store never trained with |
@@ -1956,9 +1942,7 @@ def _render_training_cache_text(console: object, snap: dict[str, object]) -> Non | ||
| 1956 | 1942 | console.print(f" last hit rate: {float(rate):.1%}") |
| 1957 | 1943 | |
| 1958 | 1944 | |
| 1959 | -def _render_training_sources_text( | |
| 1960 | - console: object, records: list[dict[str, object]] | |
| 1961 | -) -> None: | |
| 1945 | +def _render_training_sources_text(console: object, records: list[dict[str, object]]) -> None: | |
| 1962 | 1946 | from rich.console import Console |
| 1963 | 1947 | |
| 1964 | 1948 | assert isinstance(console, Console) |
@@ -2110,9 +2094,7 @@ def push_cmd( | ||
| 2110 | 2094 | bool, |
| 2111 | 2095 | typer.Option("--sign", help="Sign the pack with minisign before upload."), |
| 2112 | 2096 | ] = False, |
| 2113 | - include_exports: Annotated[ | |
| 2114 | - bool, typer.Option("--include-exports") | |
| 2115 | - ] = False, | |
| 2097 | + include_exports: Annotated[bool, typer.Option("--include-exports")] = False, | |
| 2116 | 2098 | include_base: Annotated[bool, typer.Option("--include-base")] = False, |
| 2117 | 2099 | include_logs: Annotated[bool, typer.Option("--include-logs")] = False, |
| 2118 | 2100 | licensee: Annotated[ |
@@ -2149,10 +2131,7 @@ def push_cmd( | ||
| 2149 | 2131 | raise typer.Exit(code=1) from exc |
| 2150 | 2132 | |
| 2151 | 2133 | size_mb = result.bytes_sent / (1024 * 1024) |
| 2152 | - console.print( | |
| 2153 | - f"[green]pushed:[/green] {result.destination} " | |
| 2154 | - f"({size_mb:.2f} MB)" | |
| 2155 | - ) | |
| 2134 | + console.print(f"[green]pushed:[/green] {result.destination} ({size_mb:.2f} MB)") | |
| 2156 | 2135 | if result.sink_kind.value == "hf": |
| 2157 | 2136 | console.print(f"[dim]install:[/dim] dlm pull {result.destination}") |
| 2158 | 2137 | if result.detail: |
@@ -2197,10 +2176,7 @@ def pull_cmd( | ||
| 2197 | 2176 | raise typer.Exit(code=1) from exc |
| 2198 | 2177 | |
| 2199 | 2178 | size_mb = result.bytes_received / (1024 * 1024) |
| 2200 | - console.print( | |
| 2201 | - f"[green]pulled:[/green] {result.source} → {result.dlm_path} " | |
| 2202 | - f"({size_mb:.2f} MB)" | |
| 2203 | - ) | |
| 2179 | + console.print(f"[green]pulled:[/green] {result.source} → {result.dlm_path} ({size_mb:.2f} MB)") | |
| 2204 | 2180 | |
| 2205 | 2181 | status = result.verification.status |
| 2206 | 2182 | if status == VerifyStatus.VERIFIED: |
@@ -2265,8 +2241,7 @@ def serve_cmd( | ||
| 2265 | 2241 | store = for_dlm(dlm_id) |
| 2266 | 2242 | if not store.manifest.exists(): |
| 2267 | 2243 | console.print( |
| 2268 | - f"[red]serve:[/red] no training state for {dlm_id} — run " | |
| 2269 | - "[bold]dlm train[/bold] first." | |
| 2244 | + f"[red]serve:[/red] no training state for {dlm_id} — run [bold]dlm train[/bold] first." | |
| 2270 | 2245 | ) |
| 2271 | 2246 | raise typer.Exit(code=1) |
| 2272 | 2247 | |
@@ -2387,8 +2362,7 @@ def cache_prune_cmd( | ||
| 2387 | 2362 | seconds = _parse_duration(older_than) |
| 2388 | 2363 | if seconds is None: |
| 2389 | 2364 | console.print( |
| 2390 | - f"[red]cache:[/red] invalid --older-than {older_than!r} " | |
| 2391 | - "(expected e.g. 30d, 12h, 45m)" | |
| 2365 | + f"[red]cache:[/red] invalid --older-than {older_than!r} (expected e.g. 30d, 12h, 45m)" | |
| 2392 | 2366 | ) |
| 2393 | 2367 | raise typer.Exit(code=2) |
| 2394 | 2368 | |
src/dlm/cli/scaffold.py (modified) @@ -83,9 +83,7 @@ def scaffold_train_target( | ||
| 83 | 83 | if not target.exists(): |
| 84 | 84 | raise ScaffoldError(f"target does not exist: {target}", path=target) |
| 85 | 85 | if not target.is_dir(): |
| 86 | - raise ScaffoldError( | |
| 87 | - f"scaffold expects a directory, got file: {target}", path=target | |
| 88 | - ) | |
| 86 | + raise ScaffoldError(f"scaffold expects a directory, got file: {target}", path=target) | |
| 89 | 87 | |
| 90 | 88 | dlm_dir = target / _SCAFFOLD_DIR |
| 91 | 89 | existing = sorted(dlm_dir.glob("*.dlm")) if dlm_dir.is_dir() else [] |
@@ -105,13 +103,9 @@ def scaffold_train_target( | ||
| 105 | 103 | return ScaffoldResult(dlm_path=named_match, scaffolded=False, dlm_id=dlm_id) |
| 106 | 104 | if name_is_default and len(existing) == 1: |
| 107 | 105 | dlm_id = _dlm_id_from_file(existing[0]) |
| 108 | - return ScaffoldResult( | |
| 109 | - dlm_path=existing[0], scaffolded=False, dlm_id=dlm_id | |
| 110 | - ) | |
| 106 | + return ScaffoldResult(dlm_path=existing[0], scaffolded=False, dlm_id=dlm_id) | |
| 111 | 107 | if name_is_default and len(existing) > 1: |
| 112 | - listing = "\n".join( | |
| 113 | - f" dlm train {target} --name {c.stem}" for c in existing | |
| 114 | - ) | |
| 108 | + listing = "\n".join(f" dlm train {target} --name {c.stem}" for c in existing) | |
| 115 | 109 | raise ScaffoldError( |
| 116 | 110 | f"multiple .dlm files found under {target / _SCAFFOLD_DIR}; " |
| 117 | 111 | f"pass --name to pick one:\n{listing}", |
@@ -128,11 +122,7 @@ def scaffold_train_target( | ||
| 128 | 122 | ) |
| 129 | 123 | |
| 130 | 124 | dlm_path = dlm_dir / f"{name}.dlm" |
| 131 | - existing_id = ( | |
| 132 | - _dlm_id_from_file(dlm_path) | |
| 133 | - if rescaffold and dlm_path.is_file() | |
| 134 | - else None | |
| 135 | - ) | |
| 125 | + existing_id = _dlm_id_from_file(dlm_path) if rescaffold and dlm_path.is_file() else None | |
| 136 | 126 | |
| 137 | 127 | dlm_id = existing_id or mint_ulid() |
| 138 | 128 | dlm_dir.mkdir(parents=True, exist_ok=True) |
@@ -146,9 +136,7 @@ def scaffold_train_target( | ||
| 146 | 136 | policy=policy, |
| 147 | 137 | target=target, |
| 148 | 138 | ) |
| 149 | - _LOG.info( | |
| 150 | - "scaffold: wrote %s (dlm_id=%s, base=%s)", dlm_path, dlm_id, base | |
| 151 | - ) | |
| 139 | + _LOG.info("scaffold: wrote %s (dlm_id=%s, base=%s)", dlm_path, dlm_id, base) | |
| 152 | 140 | return ScaffoldResult(dlm_path=dlm_path, scaffolded=True, dlm_id=dlm_id) |
| 153 | 141 | |
| 154 | 142 | |
@@ -205,17 +193,14 @@ def _write_scaffold( | ||
| 205 | 193 | [ |
| 206 | 194 | "---", |
| 207 | 195 | "", |
| 208 | - "# Auto-scaffolded by `dlm train`. Edit the frontmatter above " | |
| 209 | - "to refine training.", | |
| 196 | + "# Auto-scaffolded by `dlm train`. Edit the frontmatter above to refine training.", | |
| 210 | 197 | "", |
| 211 | 198 | ] |
| 212 | 199 | ) |
| 213 | 200 | atomic_write_text(dlm_path, "\n".join(lines)) |
| 214 | 201 | |
| 215 | 202 | |
| 216 | -def _build_include_globs( | |
| 217 | - include: tuple[str, ...], *, recursive: bool | |
| 218 | -) -> tuple[str, ...]: | |
| 203 | +def _build_include_globs(include: tuple[str, ...], *, recursive: bool) -> tuple[str, ...]: | |
| 219 | 204 | """Map `--include` flags + `--recursive` to frontmatter globs. |
| 220 | 205 | |
| 221 | 206 | Empty `--include` + `--recursive` → `["**/*"]`: train on every |
src/dlm/data/formatter.py (modified) @@ -57,7 +57,11 @@ def make_formatting_func(tokenizer: PreTrainedTokenizerBase) -> FormattingFunc: | ||
| 57 | 57 | if not isinstance(text, str): |
| 58 | 58 | raise DataFormatError(f"`text` field must be str, got {type(text).__name__}") |
| 59 | 59 | return text |
| 60 | - if row.get("prompt") is not None and row.get("chosen") is not None and row.get("rejected") is not None: | |
| 60 | + if ( | |
| 61 | + row.get("prompt") is not None | |
| 62 | + and row.get("chosen") is not None | |
| 63 | + and row.get("rejected") is not None | |
| 64 | + ): | |
| 61 | 65 | raise DataFormatError( |
| 62 | 66 | "preference rows (prompt/chosen/rejected) must be routed to DPOTrainer, " |
| 63 | 67 | "not SFTTrainer's formatting_func" |
src/dlm/directives/cache.py (modified) @@ -132,9 +132,7 @@ class TokenizedCache: | ||
| 132 | 132 | # ---- Open / construct -------------------------------------------- |
| 133 | 133 | |
| 134 | 134 | @classmethod |
| 135 | - def open( | |
| 136 | - cls, root: Path, *, max_bytes: int = _DEFAULT_MAX_BYTES | |
| 137 | - ) -> TokenizedCache: | |
| 135 | + def open(cls, root: Path, *, max_bytes: int = _DEFAULT_MAX_BYTES) -> TokenizedCache: | |
| 138 | 136 | """Open (or create) a cache at `root`. |
| 139 | 137 | |
| 140 | 138 | Creates the directory layout idempotently. Missing manifest → |
@@ -343,17 +341,15 @@ class TokenizedCache: | ||
| 343 | 341 | mid-put fallback. |
| 344 | 342 | """ |
| 345 | 343 | cutoff = time.time() - older_than_seconds |
| 346 | - stale_keys = [ | |
| 347 | - e.key_str | |
| 348 | - for e in self._manifest.values() | |
| 349 | - if e.last_access_ts < cutoff | |
| 350 | - ] | |
| 344 | + stale_keys = [e.key_str for e in self._manifest.values() if e.last_access_ts < cutoff] | |
| 351 | 345 | for key_str in stale_keys: |
| 352 | 346 | entry = self._manifest[key_str] |
| 353 | 347 | self._entry_path(entry).unlink(missing_ok=True) |
| 354 | 348 | del self._manifest[key_str] |
| 355 | 349 | if stale_keys: |
| 356 | - _LOG.info("cache: pruned %d entries older than %ds", len(stale_keys), older_than_seconds) | |
| 350 | + _LOG.info( | |
| 351 | + "cache: pruned %d entries older than %ds", len(stale_keys), older_than_seconds | |
| 352 | + ) | |
| 357 | 353 | return len(stale_keys) |
| 358 | 354 | |
| 359 | 355 | def clear(self) -> int: |
src/dlm/directives/cache_key.py (modified) @@ -50,9 +50,7 @@ class CacheKey: | ||
| 50 | 50 | birthday threshold. The full sha is persisted in the manifest |
| 51 | 51 | for verification if a collision ever occurs in practice. |
| 52 | 52 | """ |
| 53 | - return ( | |
| 54 | - f"{self.section_id}.{self.tokenizer_sha[:12]}.seq{self.sequence_len}.npz" | |
| 55 | - ) | |
| 53 | + return f"{self.section_id}.{self.tokenizer_sha[:12]}.seq{self.sequence_len}.npz" | |
| 56 | 54 | |
| 57 | 55 | def shard(self) -> str: |
| 58 | 56 | """First 2 hex chars of section_id — the directory shard.""" |
src/dlm/directives/discovery.py (modified) @@ -76,11 +76,7 @@ def discover_configs(root: Path) -> tuple[DiscoveredConfig, ...]: | ||
| 76 | 76 | anchor = dlm_dir.parent |
| 77 | 77 | config = _load_training_yaml(dlm_dir / _CONFIG_FILENAME) |
| 78 | 78 | ignore_rules = _load_ignore(dlm_dir / _IGNORE_FILENAME) |
| 79 | - discovered.append( | |
| 80 | - DiscoveredConfig( | |
| 81 | - anchor=anchor, config=config, ignore_rules=ignore_rules | |
| 82 | - ) | |
| 83 | - ) | |
| 79 | + discovered.append(DiscoveredConfig(anchor=anchor, config=config, ignore_rules=ignore_rules)) | |
| 84 | 80 | |
| 85 | 81 | discovered.sort(key=lambda d: len(d.anchor.as_posix())) |
| 86 | 82 | return tuple(discovered) |
@@ -121,9 +117,7 @@ def _load_training_yaml(path: Path) -> DlmTrainingConfig | None: | ||
| 121 | 117 | try: |
| 122 | 118 | return DlmTrainingConfig.model_validate(raw) |
| 123 | 119 | except ValidationError as exc: |
| 124 | - _LOG.warning( | |
| 125 | - "discovery: %s: schema violation (%s); skipping config", path, exc | |
| 126 | - ) | |
| 120 | + _LOG.warning("discovery: %s: schema violation (%s); skipping config", path, exc) | |
| 127 | 121 | return None |
| 128 | 122 | |
| 129 | 123 | |
src/dlm/directives/expand.py (modified) @@ -100,9 +100,7 @@ def expand_sources(parsed: ParsedDlm, *, base_path: Path) -> ExpandResult: | ||
| 100 | 100 | if not directives: |
| 101 | 101 | return ExpandResult(sections=(), provenance=(), discovered=()) |
| 102 | 102 | |
| 103 | - effective_base = ( | |
| 104 | - base_path.parent if base_path.name == ".dlm" else base_path | |
| 105 | - ) | |
| 103 | + effective_base = base_path.parent if base_path.name == ".dlm" else base_path | |
| 106 | 104 | strict = training.sources_policy == "strict" |
| 107 | 105 | sections: list[Section] = [] |
| 108 | 106 | provenance: list[SourceProvenance] = [] |
@@ -159,10 +157,7 @@ def _expand_one( | ||
| 159 | 157 | header_root = resolved_root if resolved_root.is_dir() else resolved_root.parent |
| 160 | 158 | |
| 161 | 159 | for file_path in _iter_candidates(resolved_root): |
| 162 | - if ( | |
| 163 | - directive.max_files is not None | |
| 164 | - and len(sections) >= directive.max_files | |
| 165 | - ): | |
| 160 | + if directive.max_files is not None and len(sections) >= directive.max_files: | |
| 166 | 161 | _LOG.info( |
| 167 | 162 | "directive: hit max_files=%d for %s; truncating deterministically", |
| 168 | 163 | directive.max_files, |
@@ -190,10 +185,7 @@ def _expand_one( | ||
| 190 | 185 | _LOG.warning("directive: stat failed for %s: %s; skipping", file_path, exc) |
| 191 | 186 | continue |
| 192 | 187 | |
| 193 | - if ( | |
| 194 | - directive.max_bytes_per_file is not None | |
| 195 | - and size > directive.max_bytes_per_file | |
| 196 | - ): | |
| 188 | + if directive.max_bytes_per_file is not None and size > directive.max_bytes_per_file: | |
| 197 | 189 | _LOG.info( |
| 198 | 190 | "directive: %s (%d bytes) exceeds max_bytes_per_file=%d; skipping", |
| 199 | 191 | file_path, |
@@ -210,9 +202,7 @@ def _expand_one( | ||
| 210 | 202 | continue |
| 211 | 203 | |
| 212 | 204 | if is_probably_binary(raw): |
| 213 | - _LOG.info( | |
| 214 | - "directive: %s looks binary (NUL in first KiB); skipping", file_path | |
| 215 | - ) | |
| 205 | + _LOG.info("directive: %s looks binary (NUL in first KiB); skipping", file_path) | |
| 216 | 206 | skipped_binary += 1 |
| 217 | 207 | continue |
| 218 | 208 | |
@@ -225,9 +215,7 @@ def _expand_one( | ||
| 225 | 215 | |
| 226 | 216 | relpath = file_path.relative_to(header_root).as_posix() |
| 227 | 217 | content = f"# source: {relpath}\n\n{text}" |
| 228 | - sections.append( | |
| 229 | - Section(type=SectionType.PROSE, content=content, tags=effective.tags) | |
| 230 | - ) | |
| 218 | + sections.append(Section(type=SectionType.PROSE, content=content, tags=effective.tags)) | |
| 231 | 219 | total_bytes += len(raw) |
| 232 | 220 | |
| 233 | 221 | return sections, SourceProvenance( |
src/dlm/directives/merge.py (modified) @@ -52,11 +52,7 @@ def ancestors_of( | ||
| 52 | 52 | """Return DiscoveredConfigs whose anchor is an ancestor of file_path, |
| 53 | 53 | sorted shallowest → deepest. Includes the direct-parent anchor.""" |
| 54 | 54 | abs_file = file_path.resolve() |
| 55 | - result = [ | |
| 56 | - d | |
| 57 | - for d in discovered | |
| 58 | - if _is_ancestor(d.anchor.resolve(), abs_file) | |
| 59 | - ] | |
| 55 | + result = [d for d in discovered if _is_ancestor(d.anchor.resolve(), abs_file)] | |
| 60 | 56 | result.sort(key=lambda d: len(d.anchor.as_posix())) |
| 61 | 57 | return tuple(result) |
| 62 | 58 | |
src/dlm/directives/safety.py (modified) @@ -158,9 +158,7 @@ def enumerate_matching_files( | ||
| 158 | 158 | yield candidate |
| 159 | 159 | |
| 160 | 160 | |
| 161 | -def _matches_filters( | |
| 162 | - rel_path: str, include: Iterable[str], exclude: Iterable[str] | |
| 163 | -) -> bool: | |
| 161 | +def _matches_filters(rel_path: str, include: Iterable[str], exclude: Iterable[str]) -> bool: | |
| 164 | 162 | """Match rel_path against include (any) and exclude (none).""" |
| 165 | 163 | if any(_compile_glob(pat).fullmatch(rel_path) for pat in exclude): |
| 166 | 164 | return False |
src/dlm/doc/parser.py (modified) @@ -210,9 +210,7 @@ def _tokenize_body(body: str, *, body_start_line: int, path: Path | None) -> lis | ||
| 210 | 210 | match = _FENCE_RE.match(line) |
| 211 | 211 | if match: |
| 212 | 212 | fence_name = match.group(1) |
| 213 | - fence_type, fence_adapter = _resolve_fence_type( | |
| 214 | - fence_name, source_line, path | |
| 215 | - ) | |
| 213 | + fence_type, fence_adapter = _resolve_fence_type(fence_name, source_line, path) | |
| 216 | 214 | flush() |
| 217 | 215 | current_type = fence_type |
| 218 | 216 | current_adapter = fence_adapter |
@@ -233,9 +231,7 @@ def _tokenize_body(body: str, *, body_start_line: int, path: Path | None) -> lis | ||
| 233 | 231 | return sections |
| 234 | 232 | |
| 235 | 233 | |
| 236 | -def _resolve_fence_type( | |
| 237 | - name: str, line: int, path: Path | None | |
| 238 | -) -> tuple[SectionType, str | None]: | |
| 234 | +def _resolve_fence_type(name: str, line: int, path: Path | None) -> tuple[SectionType, str | None]: | |
| 239 | 235 | """Map a fence name to `(SectionType, adapter_name|None)` or raise. |
| 240 | 236 | |
| 241 | 237 | Multi-adapter fences carry a `#<adapter>` suffix; the adapter part is |
@@ -267,8 +263,7 @@ def _resolve_fence_type( | ||
| 267 | 263 | section_type = SectionType(base) |
| 268 | 264 | except ValueError as exc: |
| 269 | 265 | raise FenceError( |
| 270 | - f"unknown section fence '::{name}::'; valid types are " | |
| 271 | - f"{[t.value for t in SectionType]}", | |
| 266 | + f"unknown section fence '::{name}::'; valid types are {[t.value for t in SectionType]}", | |
| 272 | 267 | path=path, |
| 273 | 268 | line=line, |
| 274 | 269 | col=1, |
src/dlm/doc/schema.py (modified) @@ -69,9 +69,7 @@ class PreferenceConfig(BaseModel): | ||
| 69 | 69 | |
| 70 | 70 | enabled: bool = False |
| 71 | 71 | method: Literal["dpo", "orpo"] = "dpo" |
| 72 | - hyperparams: PreferenceHyperparams = Field( | |
| 73 | - default_factory=lambda: PreferenceHyperparams() | |
| 74 | - ) | |
| 72 | + hyperparams: PreferenceHyperparams = Field(default_factory=lambda: PreferenceHyperparams()) | |
| 75 | 73 | # DPO-only fields — ignored for ORPO but kept on the config so a |
| 76 | 74 | # user switching methods doesn't have to delete them. |
| 77 | 75 | loss_type: Literal["sigmoid", "hinge", "ipo"] = "sigmoid" |
@@ -247,11 +245,7 @@ class TrainingConfig(BaseModel): | ||
| 247 | 245 | "target_modules": "auto", |
| 248 | 246 | "learning_rate": 2e-4, |
| 249 | 247 | } |
| 250 | - drift = [ | |
| 251 | - key | |
| 252 | - for key, default in flat_defaults.items() | |
| 253 | - if getattr(self, key) != default | |
| 254 | - ] | |
| 248 | + drift = [key for key, default in flat_defaults.items() if getattr(self, key) != default] | |
| 255 | 249 | if drift: |
| 256 | 250 | raise ValueError( |
| 257 | 251 | "training.adapters is declared; flat per-adapter fields " |
src/dlm/doc/serializer.py (modified) @@ -104,8 +104,10 @@ def _emit_nested_mapping(model: BaseModel, *, indent: int) -> list[str]: | ||
| 104 | 104 | lines.append(f"{pad}{field_name}:") |
| 105 | 105 | lines.extend(nested) |
| 106 | 106 | continue |
| 107 | - if isinstance(value, dict) and value and all( | |
| 108 | - isinstance(v, BaseModel) for v in value.values() | |
| 107 | + if ( | |
| 108 | + isinstance(value, dict) | |
| 109 | + and value | |
| 110 | + and all(isinstance(v, BaseModel) for v in value.values()) | |
| 109 | 111 | ): |
| 110 | 112 | # `dict[str, BaseModel]` (e.g. training.adapters) — emit |
| 111 | 113 | # each entry as a nested mapping. The key is the dict |
src/dlm/export/runner.py (modified) @@ -186,9 +186,7 @@ def run_export( | ||
| 186 | 186 | if not adapter_path.exists(): |
| 187 | 187 | from dlm.export.errors import ExportError |
| 188 | 188 | |
| 189 | - raise ExportError( | |
| 190 | - f"adapter_path_override {adapter_path} does not exist" | |
| 191 | - ) | |
| 189 | + raise ExportError(f"adapter_path_override {adapter_path} does not exist") | |
| 192 | 190 | elif adapter_name is None: |
| 193 | 191 | resolved = store.resolve_current_adapter() |
| 194 | 192 | pointer = store.adapter_current_pointer |
@@ -196,8 +194,7 @@ def run_export( | ||
| 196 | 194 | from dlm.export.errors import ExportError |
| 197 | 195 | |
| 198 | 196 | raise ExportError( |
| 199 | - f"no current adapter under {pointer}; " | |
| 200 | - "run `dlm train` before exporting." | |
| 197 | + f"no current adapter under {pointer}; run `dlm train` before exporting." | |
| 201 | 198 | ) |
| 202 | 199 | adapter_path = resolved |
| 203 | 200 | else: |
src/dlm/export/weighted_merge.py (modified) @@ -77,47 +77,37 @@ def parse_mix_spec(spec_str: str) -> list[MixEntry]: | ||
| 77 | 77 | for piece in raw.split(","): |
| 78 | 78 | token = piece.strip() |
| 79 | 79 | if not token: |
| 80 | - raise InvalidMixSpecError( | |
| 81 | - f"--adapter-mix: empty entry in spec {spec_str!r}" | |
| 82 | - ) | |
| 80 | + raise InvalidMixSpecError(f"--adapter-mix: empty entry in spec {spec_str!r}") | |
| 83 | 81 | if ":" not in token: |
| 84 | 82 | raise InvalidMixSpecError( |
| 85 | - f"--adapter-mix: entry {token!r} is missing a weight " | |
| 86 | - "(shape: `name:weight`)" | |
| 83 | + f"--adapter-mix: entry {token!r} is missing a weight (shape: `name:weight`)" | |
| 87 | 84 | ) |
| 88 | 85 | name, _, weight_str = token.rpartition(":") |
| 89 | 86 | name = name.strip() |
| 90 | 87 | weight_str = weight_str.strip() |
| 91 | 88 | if not _NAME_RE.fullmatch(name): |
| 92 | 89 | raise InvalidMixSpecError( |
| 93 | - f"--adapter-mix: adapter name {name!r} is not valid " | |
| 94 | - f"(must match {_NAME_RE.pattern})" | |
| 90 | + f"--adapter-mix: adapter name {name!r} is not valid (must match {_NAME_RE.pattern})" | |
| 95 | 91 | ) |
| 96 | 92 | if name in seen: |
| 97 | - raise InvalidMixSpecError( | |
| 98 | - f"--adapter-mix: adapter {name!r} appears twice" | |
| 99 | - ) | |
| 93 | + raise InvalidMixSpecError(f"--adapter-mix: adapter {name!r} appears twice") | |
| 100 | 94 | seen.add(name) |
| 101 | 95 | try: |
| 102 | 96 | weight = float(weight_str) |
| 103 | 97 | except ValueError as exc: |
| 104 | 98 | raise InvalidMixSpecError( |
| 105 | - f"--adapter-mix: weight {weight_str!r} for adapter " | |
| 106 | - f"{name!r} is not a number" | |
| 99 | + f"--adapter-mix: weight {weight_str!r} for adapter {name!r} is not a number" | |
| 107 | 100 | ) from exc |
| 108 | 101 | if weight < 0: |
| 109 | 102 | raise InvalidMixSpecError( |
| 110 | - f"--adapter-mix: weight {weight} for adapter {name!r} " | |
| 111 | - "is negative (must be >= 0)" | |
| 103 | + f"--adapter-mix: weight {weight} for adapter {name!r} is negative (must be >= 0)" | |
| 112 | 104 | ) |
| 113 | 105 | entries.append(MixEntry(name=name, weight=weight)) |
| 114 | 106 | |
| 115 | 107 | return entries |
| 116 | 108 | |
| 117 | 109 | |
| 118 | -def validate_mix_against_declared( | |
| 119 | - entries: list[MixEntry], declared: set[str] | |
| 120 | -) -> None: | |
| 110 | +def validate_mix_against_declared(entries: list[MixEntry], declared: set[str]) -> None: | |
| 121 | 111 | """Refuse mix entries that reference adapters not in `training.adapters`. |
| 122 | 112 | |
| 123 | 113 | Single source of error messaging so the CLI and the runner both |
@@ -170,9 +160,7 @@ def build_weighted_merged( # pragma: no cover - heavy path | ||
| 170 | 160 | |
| 171 | 161 | first = entries[0] |
| 172 | 162 | first_path = _resolve_or_raise(store, first.name) |
| 173 | - model = PeftModel.from_pretrained( | |
| 174 | - base_model, str(first_path), adapter_name=first.name | |
| 175 | - ) | |
| 163 | + model = PeftModel.from_pretrained(base_model, str(first_path), adapter_name=first.name) | |
| 176 | 164 | for extra in entries[1:]: |
| 177 | 165 | path = _resolve_or_raise(store, extra.name) |
| 178 | 166 | model.load_adapter(str(path), adapter_name=extra.name) |
@@ -208,9 +196,7 @@ def resolve_first_source_path(store: StorePath, entries: list[MixEntry]) -> Path | ||
| 208 | 196 | single-valued), so any source is interchangeable — we pick the first. |
| 209 | 197 | """ |
| 210 | 198 | if not entries: |
| 211 | - raise InvalidMixSpecError( | |
| 212 | - "resolve_first_source_path: empty mix" | |
| 213 | - ) | |
| 199 | + raise InvalidMixSpecError("resolve_first_source_path: empty mix") | |
| 214 | 200 | return _resolve_or_raise(store, entries[0].name) |
| 215 | 201 | |
| 216 | 202 | |
@@ -257,9 +243,7 @@ def save_merged_to_tmp( # pragma: no cover - heavy path | ||
| 257 | 243 | import shutil |
| 258 | 244 | |
| 259 | 245 | tmp_dir.mkdir(parents=True, exist_ok=True) |
| 260 | - merged_model.save_pretrained( | |
| 261 | - str(tmp_dir), selected_adapters=[_MERGED_ADAPTER_NAME] | |
| 262 | - ) | |
| 246 | + merged_model.save_pretrained(str(tmp_dir), selected_adapters=[_MERGED_ADAPTER_NAME]) | |
| 263 | 247 | |
| 264 | 248 | # PEFT nests under the adapter name; that's where run_export |
| 265 | 249 | # expects to find adapter_config.json + safetensors. |
src/dlm/hardware/capabilities.py (modified) @@ -156,9 +156,7 @@ def _get_unified_memory_gb(backend: Backend) -> float | None: | ||
| 156 | 156 | return psutil.virtual_memory().total / (1024**3) |
| 157 | 157 | |
| 158 | 158 | |
| 159 | -def _supports_bf16( | |
| 160 | - backend: Backend, sm: tuple[int, int] | None, rocm_arch: str | None | |
| 161 | -) -> bool: | |
| 159 | +def _supports_bf16(backend: Backend, sm: tuple[int, int] | None, rocm_arch: str | None) -> bool: | |
| 162 | 160 | if backend == Backend.CUDA: |
| 163 | 161 | return sm is not None and sm >= (8, 0) |
| 164 | 162 | if backend == Backend.ROCM: |
src/dlm/hardware/plan.py (modified) @@ -104,9 +104,7 @@ def resolve( | ||
| 104 | 104 | raise ValueError(f"world_size must be >= 1, got {world_size}") |
| 105 | 105 | if world_size > 1: |
| 106 | 106 | check_multi_gpu_refusals(caps, world_size) |
| 107 | - check_refusals( | |
| 108 | - training, caps, base_params, force=force, num_adapters=num_adapters | |
| 109 | - ) | |
| 107 | + check_refusals(training, caps, base_params, force=force, num_adapters=num_adapters) | |
| 110 | 108 | |
| 111 | 109 | use_qlora = _should_qlora(training, caps) |
| 112 | 110 | precision = _pick_precision(caps, override=training.precision) |
src/dlm/hardware/refusals.py (modified) @@ -83,15 +83,11 @@ def check_refusals( | ||
| 83 | 83 | per_adapter_gb = max(0.1, base_params * avg_lora_r / (1e9 * 64)) |
| 84 | 84 | activations_gb = base_params * 2.0 / 1e9 * 0.25 |
| 85 | 85 | qlora_adapter_count = _qlora_adapter_count(training, num_adapters) |
| 86 | - est_peak = ( | |
| 87 | - base_gb + per_adapter_gb * qlora_adapter_count + activations_gb | |
| 88 | - ) | |
| 86 | + est_peak = base_gb + per_adapter_gb * qlora_adapter_count + activations_gb | |
| 89 | 87 | budget = caps.vram_gb * 0.85 |
| 90 | 88 | if est_peak > budget: |
| 91 | 89 | offenders = _qlora_adapter_names(training) |
| 92 | - offender_note = ( | |
| 93 | - f" (offending adapters: {sorted(offenders)})" if offenders else "" | |
| 94 | - ) | |
| 90 | + offender_note = f" (offending adapters: {sorted(offenders)})" if offenders else "" | |
| 95 | 91 | raise ResolutionError( |
| 96 | 92 | "Multi-adapter QLoRA would exceed VRAM " |
| 97 | 93 | f"(~{est_peak:.1f} GB estimated vs {budget:.1f} GB budget " |
@@ -130,8 +126,7 @@ def check_multi_gpu_refusals(caps: Capabilities, world_size: int) -> None: | ||
| 130 | 126 | ) |
| 131 | 127 | if caps.backend == Backend.CPU: |
| 132 | 128 | raise ResolutionError( |
| 133 | - "Multi-GPU training on CPU is not supported. " | |
| 134 | - "Drop `--gpus` or run single-process.", | |
| 129 | + "Multi-GPU training on CPU is not supported. Drop `--gpus` or run single-process.", | |
| 135 | 130 | ) |
| 136 | 131 | if caps.backend == Backend.ROCM: |
| 137 | 132 | raise ResolutionError( |
@@ -181,9 +176,7 @@ def _avg_lora_r(training: TrainingConfig) -> float: | ||
| 181 | 176 | """Average LoRA rank across declared adapters (fallback: flat lora_r).""" |
| 182 | 177 | if training.adapters is None or not training.adapters: |
| 183 | 178 | return float(training.lora_r) |
| 184 | - return sum(a.lora_r for a in training.adapters.values()) / len( | |
| 185 | - training.adapters | |
| 186 | - ) | |
| 179 | + return sum(a.lora_r for a in training.adapters.values()) / len(training.adapters) | |
| 187 | 180 | |
| 188 | 181 | |
| 189 | 182 | def _qlora_adapter_count(training: TrainingConfig, fallback: int) -> int: |
src/dlm/inference/backends/mlx_backend.py (modified) @@ -54,8 +54,7 @@ def stage_mlx_adapter_dir(peft_adapter_dir: Path, dst_dir: Path) -> Path: | ||
| 54 | 54 | src_config = peft_adapter_dir / _ADAPTER_CONFIG_FILENAME |
| 55 | 55 | if not src_config.exists(): |
| 56 | 56 | raise MlxConversionError( |
| 57 | - f"{peft_adapter_dir} is not a PEFT adapter dir " | |
| 58 | - f"({_ADAPTER_CONFIG_FILENAME} is missing)" | |
| 57 | + f"{peft_adapter_dir} is not a PEFT adapter dir ({_ADAPTER_CONFIG_FILENAME} is missing)" | |
| 59 | 58 | ) |
| 60 | 59 | if not (peft_adapter_dir / "adapter_model.safetensors").exists(): |
| 61 | 60 | raise MlxConversionError( |
src/dlm/inference/loader.py (modified) @@ -105,9 +105,7 @@ def _torch_dtype_for(precision: str) -> Any: | ||
| 105 | 105 | return lookup.get(precision, torch.float16) |
| 106 | 106 | |
| 107 | 107 | |
| 108 | -def resolve_adapter_path( | |
| 109 | - store: StorePath, *, adapter_name: str | None | |
| 110 | -) -> Path: | |
| 108 | +def resolve_adapter_path(store: StorePath, *, adapter_name: str | None) -> Path: | |
| 111 | 109 | """Return the on-disk adapter version dir for inference. |
| 112 | 110 | |
| 113 | 111 | Single entry point for both the flat (unnamed) and named-adapter |
src/dlm/metrics/queries.py (modified) @@ -132,9 +132,7 @@ def evals_for_run(store_root: Path, run_id: int, *, since_step: int = 0) -> lis | ||
| 132 | 132 | return [EvalRow(*row) for row in rows] |
| 133 | 133 | |
| 134 | 134 | |
| 135 | -def tokenization_for_run( | |
| 136 | - store_root: Path, run_id: int | |
| 137 | -) -> TokenizationRow | None: | |
| 135 | +def tokenization_for_run(store_root: Path, run_id: int) -> TokenizationRow | None: | |
| 138 | 136 | """The tokenization row for `run_id`, or None when absent. |
| 139 | 137 | |
| 140 | 138 | Returns None when the table is empty for this run (i.e. the run |
src/dlm/metrics/sinks/wandb.py (modified) @@ -45,8 +45,7 @@ class WandbSink: | ||
| 45 | 45 | import wandb # type: ignore[import-not-found] |
| 46 | 46 | except ImportError as exc: # pragma: no cover - depends on install |
| 47 | 47 | raise RuntimeError( |
| 48 | - "W&B sink requires `wandb`; " | |
| 49 | - "run `uv sync --extra observability` to install it." | |
| 48 | + "W&B sink requires `wandb`; run `uv sync --extra observability` to install it." | |
| 50 | 49 | ) from exc |
| 51 | 50 | |
| 52 | 51 | wandb_dir = store_root / "wandb" |
src/dlm/store/inspect.py (modified) @@ -202,7 +202,7 @@ def _max_version(versions_dir: Path) -> int: | ||
| 202 | 202 | if not name.startswith(_VERSION_DIR_PREFIX): |
| 203 | 203 | continue |
| 204 | 204 | try: |
| 205 | - n = int(name[len(_VERSION_DIR_PREFIX):]) | |
| 205 | + n = int(name[len(_VERSION_DIR_PREFIX) :]) | |
| 206 | 206 | except ValueError: |
| 207 | 207 | continue |
| 208 | 208 | highest = max(highest, n) |
src/dlm/store/paths.py (modified) @@ -52,8 +52,7 @@ _ADAPTER_NAME_RE: Final[re.Pattern[str]] = re.compile(r"^[a-z][a-z0-9_]{0,31}$") | ||
| 52 | 52 | def _validate_adapter_name(name: str) -> None: |
| 53 | 53 | if not _ADAPTER_NAME_RE.fullmatch(name): |
| 54 | 54 | raise ValueError( |
| 55 | - f"adapter name {name!r} is not valid " | |
| 56 | - f"(must match {_ADAPTER_NAME_RE.pattern})" | |
| 55 | + f"adapter name {name!r} is not valid (must match {_ADAPTER_NAME_RE.pattern})" | |
| 57 | 56 | ) |
| 58 | 57 | |
| 59 | 58 | |
@@ -235,9 +234,7 @@ class StorePath: | ||
| 235 | 234 | ) from exc |
| 236 | 235 | from dlm.io.atomic import write_text as _atomic_write_text |
| 237 | 236 | |
| 238 | - _atomic_write_text( | |
| 239 | - self.adapter_current_pointer_for(name), f"{relative}\n" | |
| 240 | - ) | |
| 237 | + _atomic_write_text(self.adapter_current_pointer_for(name), f"{relative}\n") | |
| 241 | 238 | |
| 242 | 239 | def export_quant_dir(self, quant: str) -> Path: |
| 243 | 240 | """Return `exports/<quant>/` (does NOT create it).""" |
src/dlm/templates/init.py (modified) @@ -95,8 +95,7 @@ def apply_template( | ||
| 95 | 95 | ) from exc |
| 96 | 96 | if is_gated(spec) and not accept_license: |
| 97 | 97 | raise TemplateApplyError( |
| 98 | - f"template {name!r} uses gated base {spec.key!r}; " | |
| 99 | - "pass accept_license=True" | |
| 98 | + f"template {name!r} uses gated base {spec.key!r}; pass accept_license=True" | |
| 100 | 99 | ) |
| 101 | 100 | |
| 102 | 101 | parsed = parse_text(template.dlm_text) |
src/dlm/train/checkpoint_commit.py (modified) @@ -43,9 +43,7 @@ _LOG = logging.getLogger(__name__) | ||
| 43 | 43 | _VERSION_PREFIX = "v" |
| 44 | 44 | |
| 45 | 45 | |
| 46 | -def allocate_next_version( | |
| 47 | - store: StorePath, *, adapter_name: str | None = None | |
| 48 | -) -> Path: | |
| 46 | +def allocate_next_version(store: StorePath, *, adapter_name: str | None = None) -> Path: | |
| 49 | 47 | """Return the next empty `adapter/[<name>/]versions/vNNNN/` path. |
| 50 | 48 | |
| 51 | 49 | Creates the directory (and any missing parents). When `adapter_name` |
@@ -99,8 +97,7 @@ def commit_version( | ||
| 99 | 97 | ) |
| 100 | 98 | except OSError: |
| 101 | 99 | _LOG.exception( |
| 102 | - "non-finite adapter weights + rejected-dir rename failed; " | |
| 103 | - "leaving %s in place", | |
| 100 | + "non-finite adapter weights + rejected-dir rename failed; leaving %s in place", | |
| 104 | 101 | pending, |
| 105 | 102 | ) |
| 106 | 103 | raise |
@@ -156,9 +153,7 @@ def fsync_dir(path: Path) -> None: | ||
| 156 | 153 | os.close(fd) |
| 157 | 154 | |
| 158 | 155 | |
| 159 | -def list_pending_versions( | |
| 160 | - store: StorePath, *, adapter_name: str | None = None | |
| 161 | -) -> list[Path]: | |
| 156 | +def list_pending_versions(store: StorePath, *, adapter_name: str | None = None) -> list[Path]: | |
| 162 | 157 | """Return version dirs that exist on disk but aren't the current pointer. |
| 163 | 158 | |
| 164 | 159 | Used by the trainer's startup routine to detect crash-before-flip |
@@ -182,13 +177,9 @@ def list_pending_versions( | ||
| 182 | 177 | return [version_for(n) for n in sorted(existing) if n != current_n] |
| 183 | 178 | |
| 184 | 179 | |
| 185 | -def _existing_versions( | |
| 186 | - store: StorePath, *, adapter_name: str | None = None | |
| 187 | -) -> list[int]: | |
| 180 | +def _existing_versions(store: StorePath, *, adapter_name: str | None = None) -> list[int]: | |
| 188 | 181 | base = ( |
| 189 | - store.adapter_versions | |
| 190 | - if adapter_name is None | |
| 191 | - else store.adapter_versions_for(adapter_name) | |
| 182 | + store.adapter_versions if adapter_name is None else store.adapter_versions_for(adapter_name) | |
| 192 | 183 | ) |
| 193 | 184 | if not base.is_dir(): |
| 194 | 185 | return [] |
src/dlm/train/cpt/embed_warmup.py (modified) @@ -127,7 +127,11 @@ class EmbedWarmupCallback: # pragma: no cover - exercised by slow integration | ||
| 127 | 127 | self._active: bool = False |
| 128 | 128 | |
| 129 | 129 | def on_train_begin( |
| 130 | - self, args: Any, state: Any, control: Any, **kwargs: Any # noqa: ARG002 | |
| 130 | + self, | |
| 131 | + args: Any, | |
| 132 | + state: Any, | |
| 133 | + control: Any, | |
| 134 | + **kwargs: Any, # noqa: ARG002 | |
| 131 | 135 | ) -> None: |
| 132 | 136 | if self.n_steps <= 0: |
| 133 | 137 | return |
@@ -145,12 +149,20 @@ class EmbedWarmupCallback: # pragma: no cover - exercised by slow integration | ||
| 145 | 149 | self._active = False |
| 146 | 150 | |
| 147 | 151 | def on_step_end( |
| 148 | - self, args: Any, state: Any, control: Any, **kwargs: Any # noqa: ARG002 | |
| 152 | + self, | |
| 153 | + args: Any, | |
| 154 | + state: Any, | |
| 155 | + control: Any, | |
| 156 | + **kwargs: Any, # noqa: ARG002 | |
| 149 | 157 | ) -> None: |
| 150 | 158 | if self._active and state.global_step >= self.n_steps: |
| 151 | 159 | self._restore() |
| 152 | 160 | |
| 153 | 161 | def on_train_end( |
| 154 | - self, args: Any, state: Any, control: Any, **kwargs: Any # noqa: ARG002 | |
| 162 | + self, | |
| 163 | + args: Any, | |
| 164 | + state: Any, | |
| 165 | + control: Any, | |
| 166 | + **kwargs: Any, # noqa: ARG002 | |
| 155 | 167 | ) -> None: |
| 156 | 168 | self._restore() |
src/dlm/train/cpt/schedule.py (modified) @@ -50,13 +50,9 @@ def cosine_with_floor_lr( | ||
| 50 | 50 | if warmup_steps < 0: |
| 51 | 51 | raise ValueError(f"warmup_steps must be non-negative, got {warmup_steps}") |
| 52 | 52 | if warmup_steps >= total_steps: |
| 53 | - raise ValueError( | |
| 54 | - f"warmup_steps ({warmup_steps}) must be < total_steps ({total_steps})" | |
| 55 | - ) | |
| 53 | + raise ValueError(f"warmup_steps ({warmup_steps}) must be < total_steps ({total_steps})") | |
| 56 | 54 | if not 0.0 <= floor_ratio <= 1.0: |
| 57 | - raise ValueError( | |
| 58 | - f"floor_ratio must be in [0.0, 1.0], got {floor_ratio}" | |
| 59 | - ) | |
| 55 | + raise ValueError(f"floor_ratio must be in [0.0, 1.0], got {floor_ratio}") | |
| 60 | 56 | if step < 0: |
| 61 | 57 | raise ValueError(f"step must be non-negative, got {step}") |
| 62 | 58 | |
src/dlm/train/cpt/vocab_gap.py (modified) @@ -85,8 +85,7 @@ def compute_vocab_gap( | ||
| 85 | 85 | """ |
| 86 | 86 | if len(token_ids) != len(decoded_tokens): |
| 87 | 87 | raise ValueError( |
| 88 | - f"token_ids/decoded_tokens length mismatch: " | |
| 89 | - f"{len(token_ids)} vs {len(decoded_tokens)}" | |
| 88 | + f"token_ids/decoded_tokens length mismatch: {len(token_ids)} vs {len(decoded_tokens)}" | |
| 90 | 89 | ) |
| 91 | 90 | if top_n < 0: |
| 92 | 91 | raise ValueError(f"top_n must be non-negative, got {top_n}") |
@@ -95,11 +94,7 @@ def compute_vocab_gap( | ||
| 95 | 94 | total_words = _count_words(text) |
| 96 | 95 | tpw = total_tokens / total_words if total_words else 0.0 |
| 97 | 96 | |
| 98 | - unk_hits = ( | |
| 99 | - sum(1 for tid in token_ids if tid == unk_token_id) | |
| 100 | - if unk_token_id is not None | |
| 101 | - else 0 | |
| 102 | - ) | |
| 97 | + unk_hits = sum(1 for tid in token_ids if tid == unk_token_id) if unk_token_id is not None else 0 | |
| 103 | 98 | |
| 104 | 99 | counts: Counter[str] = Counter(decoded_tokens) |
| 105 | 100 | top_tokens = counts.most_common(top_n) |
@@ -113,7 +108,9 @@ def compute_vocab_gap( | ||
| 113 | 108 | ) |
| 114 | 109 | |
| 115 | 110 | |
| 116 | -def report(text: str, tokenizer: Any, *, top_n: int = 10) -> VocabGapReport: # pragma: no cover - network/heavy | |
| 111 | +def report( | |
| 112 | + text: str, tokenizer: Any, *, top_n: int = 10 | |
| 113 | +) -> VocabGapReport: # pragma: no cover - network/heavy | |
| 117 | 114 | """Run the base tokenizer over `text` and compute the fit report. |
| 118 | 115 | |
| 119 | 116 | Heavy-import shell around `compute_vocab_gap` — covered by the slow |
@@ -147,12 +144,8 @@ def render_report(r: VocabGapReport) -> str: | ||
| 147 | 144 | f" <unk> hits : {r.unk_hits}", |
| 148 | 145 | ] |
| 149 | 146 | if r.has_unk: |
| 150 | - lines.append( | |
| 151 | - " WARNING: non-zero <unk> count — tokenizer has rare-character" | |
| 152 | - ) | |
| 153 | - lines.append( | |
| 154 | - " holes for this domain. Consider a different base model." | |
| 155 | - ) | |
| 147 | + lines.append(" WARNING: non-zero <unk> count — tokenizer has rare-character") | |
| 148 | + lines.append(" holes for this domain. Consider a different base model.") | |
| 156 | 149 | if r.top_tokens: |
| 157 | 150 | lines.append(" top tokens:") |
| 158 | 151 | width = max(len(t) for t, _ in r.top_tokens) |
src/dlm/train/distributed/rank_env.py (modified) @@ -31,9 +31,7 @@ def detect_world_size() -> int: | ||
| 31 | 31 | try: |
| 32 | 32 | value = int(raw) |
| 33 | 33 | except ValueError as exc: |
| 34 | - raise ValueError( | |
| 35 | - f"WORLD_SIZE env var is not an integer: {raw!r}" | |
| 36 | - ) from exc | |
| 34 | + raise ValueError(f"WORLD_SIZE env var is not an integer: {raw!r}") from exc | |
| 37 | 35 | if value < 1: |
| 38 | 36 | return 1 |
| 39 | 37 | return value |
@@ -53,9 +51,7 @@ def detect_rank() -> int: | ||
| 53 | 51 | try: |
| 54 | 52 | value = int(raw) |
| 55 | 53 | except ValueError as exc: |
| 56 | - raise ValueError( | |
| 57 | - f"{key} env var is not an integer: {raw!r}" | |
| 58 | - ) from exc | |
| 54 | + raise ValueError(f"{key} env var is not an integer: {raw!r}") from exc | |
| 59 | 55 | if value < 0: |
| 60 | 56 | return 0 |
| 61 | 57 | return value |
src/dlm/train/multi_adapter/router.py (modified) @@ -107,7 +107,6 @@ def sections_for(parsed: ParsedDlm, adapter_name: str) -> list[Section]: | ||
| 107 | 107 | plan = build_plan(parsed) |
| 108 | 108 | if adapter_name not in plan.by_adapter: |
| 109 | 109 | raise UnknownAdapterError( |
| 110 | - f"adapter {adapter_name!r} not declared " | |
| 111 | - f"(declared: {sorted(plan.by_adapter)})" | |
| 110 | + f"adapter {adapter_name!r} not declared (declared: {sorted(plan.by_adapter)})" | |
| 112 | 111 | ) |
| 113 | 112 | return plan.by_adapter[adapter_name] |
src/dlm/train/preference/dpo_phase.py (modified) @@ -351,9 +351,7 @@ def _build_real_dpo_trainer( # pragma: no cover | ||
| 351 | 351 | # Policy: base + the SFT-trained adapter as trainable. |
| 352 | 352 | base_model = load_base_model(spec, plan) |
| 353 | 353 | adapter_dir = store.adapter_version(reference_adapter_version) |
| 354 | - policy_model = PeftModel.from_pretrained( | |
| 355 | - base_model, str(adapter_dir), is_trainable=True | |
| 356 | - ) | |
| 354 | + policy_model = PeftModel.from_pretrained(base_model, str(adapter_dir), is_trainable=True) | |
| 357 | 355 | |
| 358 | 356 | # Reference: frozen per preference.reference mode. We reload a |
| 359 | 357 | # clean base for the reference rather than sharing `base_model` so |
@@ -376,9 +374,7 @@ def _build_real_dpo_trainer( # pragma: no cover | ||
| 376 | 374 | doc_ds = build_dpo_dataset(list(parsed.sections)) |
| 377 | 375 | rng = _random.Random(seed + reference_adapter_version) |
| 378 | 376 | now = datetime.now(UTC).replace(tzinfo=None, microsecond=0) |
| 379 | - replay_rows = replay.sample_preference_rows( | |
| 380 | - k=max(8, 2 * len(doc_ds)), now=now, rng=rng | |
| 381 | - ) | |
| 377 | + replay_rows = replay.sample_preference_rows(k=max(8, 2 * len(doc_ds)), now=now, rng=rng) | |
| 382 | 378 | if replay_rows: |
| 383 | 379 | replay_ds = Dataset.from_list(replay_rows) |
| 384 | 380 | train_ds = concatenate_datasets([doc_ds, replay_ds]) |
src/dlm/train/preference/dpo_trainer.py (modified) @@ -119,9 +119,7 @@ def load_reference_model( # pragma: no cover | ||
| 119 | 119 | try: |
| 120 | 120 | ref = PeftModel.from_pretrained(model, str(adapter_path), is_trainable=False) |
| 121 | 121 | except Exception as exc: |
| 122 | - raise DpoReferenceLoadError( | |
| 123 | - adapter_path=str(adapter_path), cause=str(exc) | |
| 124 | - ) from exc | |
| 122 | + raise DpoReferenceLoadError(adapter_path=str(adapter_path), cause=str(exc)) from exc | |
| 125 | 123 | _freeze(ref) |
| 126 | 124 | return ref |
| 127 | 125 | |
src/dlm/train/preference/errors.py (modified) @@ -36,8 +36,6 @@ class DpoReferenceLoadError(DpoPhaseError): | ||
| 36 | 36 | adapter-version path that couldn't be opened.""" |
| 37 | 37 | |
| 38 | 38 | def __init__(self, *, adapter_path: str, cause: str) -> None: |
| 39 | - super().__init__( | |
| 40 | - f"could not load DPO reference model from {adapter_path}: {cause}" | |
| 41 | - ) | |
| 39 | + super().__init__(f"could not load DPO reference model from {adapter_path}: {cause}") | |
| 42 | 40 | self.adapter_path = adapter_path |
| 43 | 41 | self.cause = cause |
src/dlm/train/preference/orpo_phase.py (modified) @@ -42,7 +42,6 @@ from dlm.train.trainer import ( | ||
| 42 | 42 | ) |
| 43 | 43 | |
| 44 | 44 | if TYPE_CHECKING: |
| 45 | - | |
| 46 | 45 | from dlm.base_models import BaseModelSpec |
| 47 | 46 | from dlm.doc.parser import ParsedDlm |
| 48 | 47 | from dlm.hardware.capabilities import Capabilities |
@@ -294,9 +293,7 @@ def _build_real_orpo_trainer( # pragma: no cover | ||
| 294 | 293 | |
| 295 | 294 | base_model = load_base_model(spec, plan) |
| 296 | 295 | adapter_dir = store.adapter_version(reference_adapter_version) |
| 297 | - policy_model = PeftModel.from_pretrained( | |
| 298 | - base_model, str(adapter_dir), is_trainable=True | |
| 299 | - ) | |
| 296 | + policy_model = PeftModel.from_pretrained(base_model, str(adapter_dir), is_trainable=True) | |
| 300 | 297 | |
| 301 | 298 | tok_bringup = prepare_tokenizer(spec.hf_id, spec.revision) |
| 302 | 299 | |
@@ -305,9 +302,7 @@ def _build_real_orpo_trainer( # pragma: no cover | ||
| 305 | 302 | doc_ds = build_dpo_dataset(list(parsed.sections)) |
| 306 | 303 | rng = _random.Random(seed + reference_adapter_version) |
| 307 | 304 | now = datetime.now(UTC).replace(tzinfo=None, microsecond=0) |
| 308 | - replay_rows = replay.sample_preference_rows( | |
| 309 | - k=max(8, 2 * len(doc_ds)), now=now, rng=rng | |
| 310 | - ) | |
| 305 | + replay_rows = replay.sample_preference_rows(k=max(8, 2 * len(doc_ds)), now=now, rng=rng) | |
| 311 | 306 | if replay_rows: |
| 312 | 307 | replay_ds = Dataset.from_list(replay_rows) |
| 313 | 308 | train_ds = concatenate_datasets([doc_ds, replay_ds]) |
src/dlm/train/preference/phase_orchestrator.py (modified) @@ -116,9 +116,7 @@ def run_phases( | ||
| 116 | 116 | explicitly request DPO, skip with a warning instead of raising. |
| 117 | 117 | """ |
| 118 | 118 | sections = list(parsed.sections) |
| 119 | - pref_cfg = resolve_preference_enabled( | |
| 120 | - parsed.frontmatter.training.preference, sections | |
| 121 | - ) | |
| 119 | + pref_cfg = resolve_preference_enabled(parsed.frontmatter.training.preference, sections) | |
| 122 | 120 | results: list[PhaseResult] = [] |
| 123 | 121 | |
| 124 | 122 | sft_fn = sft_runner or _real_sft_runner() |
@@ -137,9 +135,7 @@ def run_phases( | ||
| 137 | 135 | sft_result = sft_fn(store, parsed, spec, plan, **sft_kwargs) |
| 138 | 136 | results.append(PhaseResult(phase="sft", result=sft_result)) |
| 139 | 137 | |
| 140 | - should_run_pref = phase == "preference" or ( | |
| 141 | - phase == "all" and pref_cfg.enabled | |
| 142 | - ) | |
| 138 | + should_run_pref = phase == "preference" or (phase == "all" and pref_cfg.enabled) | |
| 143 | 139 | if should_run_pref: |
| 144 | 140 | if not has_preference_content(sections): |
| 145 | 141 | if phase == "preference": |
src/dlm/train/trainer.py (modified) @@ -1257,9 +1257,7 @@ def _expand_directives( | ||
| 1257 | 1257 | if parsed.frontmatter.training.sources is None: |
| 1258 | 1258 | return parsed, () |
| 1259 | 1259 | |
| 1260 | - base_path = ( | |
| 1261 | - parsed.source_path.parent if parsed.source_path is not None else Path.cwd() | |
| 1262 | - ) | |
| 1260 | + base_path = parsed.source_path.parent if parsed.source_path is not None else Path.cwd() | |
| 1263 | 1261 | result = expand_sources(parsed, base_path=base_path) |
| 1264 | 1262 | if not result.sections: |
| 1265 | 1263 | return parsed, result.provenance |
tests/integration/directives/test_auto_scaffold_cycle.py (modified) @@ -96,9 +96,7 @@ def test_auto_scaffold_train_resume_cycle( | ||
| 96 | 96 | ), |
| 97 | 97 | ) |
| 98 | 98 | |
| 99 | - run1 = run_training( | |
| 100 | - store, parsed, spec, plan, mode="fresh", seed=42, max_steps=6 | |
| 101 | - ) | |
| 99 | + run1 = run_training(store, parsed, spec, plan, mode="fresh", seed=42, max_steps=6) | |
| 102 | 100 | assert run1.adapter_version == 1 |
| 103 | 101 | |
| 104 | 102 | # --- Second invocation: reuse scaffolded .dlm --------------------- |
@@ -118,9 +116,7 @@ def test_auto_scaffold_train_resume_cycle( | ||
| 118 | 116 | |
| 119 | 117 | # Train again — should produce adapter v0002 in the same store. |
| 120 | 118 | parsed2 = parse_file(result2.dlm_path) |
| 121 | - run2 = run_training( | |
| 122 | - store, parsed2, spec, plan, mode="fresh", seed=42, max_steps=6 | |
| 123 | - ) | |
| 119 | + run2 = run_training(store, parsed2, spec, plan, mode="fresh", seed=42, max_steps=6) | |
| 124 | 120 | assert run2.adapter_version == 2 |
| 125 | 121 | |
| 126 | 122 | manifest = load_manifest(store.manifest) |
tests/integration/directives/test_dlm_dir_descent.py (modified) @@ -23,31 +23,31 @@ _VALID_ULID = "01HZ4X7TGZM3J1A2B3C4D5E6F7" | ||
| 23 | 23 | def _build_tree(root: Path) -> None: |
| 24 | 24 | """Build a repo fixture: |
| 25 | 25 | |
| 26 | - root/ | |
| 26 | + root/ | |
| 27 | + .dlm/ | |
| 28 | + training.yaml include: ['src/**/*.py', 'docs/**/*.md'] | |
| 29 | + exclude: ['**/test_*.py'] | |
| 30 | + metadata: {language: python} | |
| 31 | + ignore *.log | |
| 32 | + src/ | |
| 33 | + main.py | |
| 34 | + test_main.py | |
| 35 | + vendor/ | |
| 27 | 36 | .dlm/ |
| 28 | - training.yaml include: ['src/**/*.py', 'docs/**/*.md'] | |
| 29 | - exclude: ['**/test_*.py'] | |
| 30 | - metadata: {language: python} | |
| 31 | - ignore *.log | |
| 32 | - src/ | |
| 33 | - main.py | |
| 34 | - test_main.py | |
| 35 | - vendor/ | |
| 36 | - .dlm/ | |
| 37 | - training.yaml exclude_defaults: false | |
| 38 | - metadata: {vendor: true_yes} | |
| 39 | - .git_shim/ (bare dir w/ file to prove defaults off) | |
| 40 | - HEAD | |
| 41 | - dep.py | |
| 42 | - docs/ | |
| 43 | - guide.md | |
| 44 | - .dlm/ | |
| 45 | - ignore !draft.md (re-include what parent excluded? N/A) | |
| 46 | - draft.md | |
| 47 | - debug.log | |
| 48 | - .env.local | |
| 49 | - build/ | |
| 50 | - output.py | |
| 37 | + training.yaml exclude_defaults: false | |
| 38 | + metadata: {vendor: true_yes} | |
| 39 | + .git_shim/ (bare dir w/ file to prove defaults off) | |
| 40 | + HEAD | |
| 41 | + dep.py | |
| 42 | + docs/ | |
| 43 | + guide.md | |
| 44 | + .dlm/ | |
| 45 | + ignore !draft.md (re-include what parent excluded? N/A) | |
| 46 | + draft.md | |
| 47 | + debug.log | |
| 48 | + .env.local | |
| 49 | + build/ | |
| 50 | + output.py | |
| 51 | 51 | """ |
| 52 | 52 | (root / ".dlm").mkdir() |
| 53 | 53 | (root / ".dlm" / "training.yaml").write_text( |
@@ -66,9 +66,7 @@ def _build_tree(root: Path) -> None: | ||
| 66 | 66 | (root / "src" / "vendor").mkdir() |
| 67 | 67 | (root / "src" / "vendor" / ".dlm").mkdir() |
| 68 | 68 | (root / "src" / "vendor" / ".dlm" / "training.yaml").write_text( |
| 69 | - "dlm_training_version: 1\n" | |
| 70 | - "exclude_defaults: false\n" | |
| 71 | - "metadata:\n vendor: true_yes\n", | |
| 69 | + "dlm_training_version: 1\nexclude_defaults: false\nmetadata:\n vendor: true_yes\n", | |
| 72 | 70 | encoding="utf-8", |
| 73 | 71 | ) |
| 74 | 72 | (root / "src" / "vendor" / "dep.py").write_text("def dep(): pass\n") |
tests/integration/directives/test_full_cycle.py (modified) @@ -60,8 +60,7 @@ def test_directive_tree_trains_and_summarizes( | ||
| 60 | 60 | tree = home / "src" |
| 61 | 61 | tree.mkdir() |
| 62 | 62 | (tree / "a.py").write_text( |
| 63 | - "def add(x, y):\n return x + y\n\n" | |
| 64 | - "def sub(x, y):\n return x - y\n", | |
| 63 | + "def add(x, y):\n return x + y\n\ndef sub(x, y):\n return x - y\n", | |
| 65 | 64 | encoding="utf-8", |
| 66 | 65 | ) |
| 67 | 66 | (tree / "b.py").write_text( |
tests/integration/metrics/test_full_cycle.py (modified) @@ -33,9 +33,7 @@ def test_trained_store_has_metrics_rows( # pragma: no cover - slow path | ||
| 33 | 33 | runs = recent_runs(trained_store.store.root, limit=10) |
| 34 | 34 | assert runs, "trainer.run() did not record any runs" |
| 35 | 35 | latest = runs[0] |
| 36 | - assert latest.status in ("ok", "running"), ( | |
| 37 | - f"expected 'ok' or 'running', got {latest.status!r}" | |
| 38 | - ) | |
| 36 | + assert latest.status in ("ok", "running"), f"expected 'ok' or 'running', got {latest.status!r}" | |
| 39 | 37 | |
| 40 | 38 | steps = steps_for_run(trained_store.store.root, latest.run_id) |
| 41 | 39 | # The tiny-model fixture runs at least one step. |
tests/integration/train/multi_adapter/test_two_adapters.py (modified) @@ -148,12 +148,12 @@ def test_two_adapters_each_get_their_own_version_history( | ||
| 148 | 148 | import json |
| 149 | 149 | |
| 150 | 150 | k_cfg = json.loads( |
| 151 | - (store.adapter_version_for("knowledge", 1) / "adapter_config.json") | |
| 152 | - .read_text(encoding="utf-8") | |
| 151 | + (store.adapter_version_for("knowledge", 1) / "adapter_config.json").read_text( | |
| 152 | + encoding="utf-8" | |
| 153 | + ) | |
| 153 | 154 | ) |
| 154 | 155 | t_cfg = json.loads( |
| 155 | - (store.adapter_version_for("tone", 1) / "adapter_config.json") | |
| 156 | - .read_text(encoding="utf-8") | |
| 156 | + (store.adapter_version_for("tone", 1) / "adapter_config.json").read_text(encoding="utf-8") | |
| 157 | 157 | ) |
| 158 | 158 | assert k_cfg["r"] == 8, f"knowledge lora_r: {k_cfg['r']}" |
| 159 | 159 | assert t_cfg["r"] == 4, f"tone lora_r: {t_cfg['r']}" |
tests/integration/train/multi_adapter/test_weighted_merge.py modified @@ -79,9 +79,7 @@ def _train_two_adapters( | ||
| 79 | 79 | make_dlm( |
| 80 | 80 | sections=[prose(_PROSE)], |
| 81 | 81 | base_model="smollm2-135m", |
| 82 | - training_overrides={ | |
| 83 | - "adapters": {"knowledge": {}, "tone": {}} | |
| 84 | - }, | |
| 82 | + training_overrides={"adapters": {"knowledge": {}, "tone": {}}}, | |
| 85 | 83 | ), |
| 86 | 84 | encoding="utf-8", |
| 87 | 85 | ) |
@@ -134,9 +132,7 @@ def test_weighted_merge_saves_tokenizer_files( | ||
| 134 | 132 | |
| 135 | 133 | spec = resolve_base_model(parsed.frontmatter.base_model, accept_license=True) |
| 136 | 134 | cached = download_spec(spec, local_files_only=True) |
| 137 | - base_model = AutoModelForCausalLM.from_pretrained( | |
| 138 | - str(cached.path), revision=spec.revision | |
| 139 | - ) | |
| 135 | + base_model = AutoModelForCausalLM.from_pretrained(str(cached.path), revision=spec.revision) | |
| 140 | 136 | |
| 141 | 137 | entries = [ |
| 142 | 138 | MixEntry(name="knowledge", weight=1.0), |
@@ -194,9 +190,7 @@ def test_weighted_merge_passes_preflight_tokenizer_vocab( | ||
| 194 | 190 | |
| 195 | 191 | spec = resolve_base_model(parsed.frontmatter.base_model, accept_license=True) |
| 196 | 192 | cached = download_spec(spec, local_files_only=True) |
| 197 | - base_model = AutoModelForCausalLM.from_pretrained( | |
| 198 | - str(cached.path), revision=spec.revision | |
| 199 | - ) | |
| 193 | + base_model = AutoModelForCausalLM.from_pretrained(str(cached.path), revision=spec.revision) | |
| 200 | 194 | |
| 201 | 195 | entries = [ |
| 202 | 196 | MixEntry(name="knowledge", weight=0.7), |
tests/integration/train/preference/test_dpo_tinymodel.py modified @@ -67,9 +67,17 @@ def _five_terse_preference_triples() -> str: | ||
| 67 | 67 | the rejected one — the direction DPO should push completions.""" |
| 68 | 68 | pairs = [ |
| 69 | 69 | ("What is 2 + 2?", "4.", "The sum of two and two is four, a basic arithmetic fact."), |
| 70 | - ("What color is grass?", "Green.", "Grass is typically a vibrant shade of green most of the year."), | |
| 70 | + ( | |
| 71 | + "What color is grass?", | |
| 72 | + "Green.", | |
| 73 | + "Grass is typically a vibrant shade of green most of the year.", | |
| 74 | + ), | |
| 71 | 75 | ("Is water wet?", "Yes.", "Water is generally considered wet in most everyday contexts."), |
| 72 | - ("Do birds fly?", "Most do.", "The majority of bird species can indeed fly, though a few cannot."), | |
| 76 | + ( | |
| 77 | + "Do birds fly?", | |
| 78 | + "Most do.", | |
| 79 | + "The majority of bird species can indeed fly, though a few cannot.", | |
| 80 | + ), | |
| 73 | 81 | ("What's 10 - 3?", "7.", "Ten minus three equals seven in standard arithmetic."), |
| 74 | 82 | ] |
| 75 | 83 | parts: list[str] = [] |
tests/integration/train/preference/test_orpo_tinymodel.py modified @@ -77,9 +77,17 @@ def test_orpo_phase_writes_second_adapter_version(trained_store) -> None: # typ | ||
| 77 | 77 | def _five_terse_preference_triples() -> str: |
| 78 | 78 | pairs = [ |
| 79 | 79 | ("What is 2 + 2?", "4.", "The sum of two and two is four, a basic arithmetic fact."), |
| 80 | - ("What color is grass?", "Green.", "Grass is typically a vibrant shade of green most of the year."), | |
| 80 | + ( | |
| 81 | + "What color is grass?", | |
| 82 | + "Green.", | |
| 83 | + "Grass is typically a vibrant shade of green most of the year.", | |
| 84 | + ), | |
| 81 | 85 | ("Is water wet?", "Yes.", "Water is generally considered wet in most everyday contexts."), |
| 82 | - ("Do birds fly?", "Most do.", "The majority of bird species can indeed fly, though a few cannot."), | |
| 86 | + ( | |
| 87 | + "Do birds fly?", | |
| 88 | + "Most do.", | |
| 89 | + "The majority of bird species can indeed fly, though a few cannot.", | |
| 90 | + ), | |
| 83 | 91 | ("What's 10 - 3?", "7.", "Ten minus three equals seven in standard arithmetic."), |
| 84 | 92 | ] |
| 85 | 93 | parts: list[str] = [] |
tests/unit/cli/test_prompt_adapter_flag.py modified @@ -48,9 +48,7 @@ def _scaffold_multi_doc(tmp_path: Path) -> Path: | ||
| 48 | 48 | |
| 49 | 49 | |
| 50 | 50 | class TestFlatDocRejectsAdapter: |
| 51 | - def test_single_adapter_doc_with_adapter_flag_exits_2( | |
| 52 | - self, tmp_path: Path | |
| 53 | - ) -> None: | |
| 51 | + def test_single_adapter_doc_with_adapter_flag_exits_2(self, tmp_path: Path) -> None: | |
| 54 | 52 | doc = _scaffold_flat_doc(tmp_path) |
| 55 | 53 | runner = CliRunner() |
| 56 | 54 | result = runner.invoke( |
tests/unit/cli/test_serve_guard.py modified @@ -18,12 +18,7 @@ from dlm.cli.app import app | ||
| 18 | 18 | |
| 19 | 19 | def _write_minimal_dlm(path: Path, dlm_id: str = "01KPQ9M3" + "0" * 18) -> None: |
| 20 | 20 | path.write_text( |
| 21 | - "---\n" | |
| 22 | - f"dlm_id: {dlm_id}\n" | |
| 23 | - "dlm_version: 6\n" | |
| 24 | - "base_model: smollm2-135m\n" | |
| 25 | - "---\n" | |
| 26 | - "body\n", | |
| 21 | + f"---\ndlm_id: {dlm_id}\ndlm_version: 6\nbase_model: smollm2-135m\n---\nbody\n", | |
| 27 | 22 | encoding="utf-8", |
| 28 | 23 | ) |
| 29 | 24 | |
@@ -40,8 +35,10 @@ class TestServeUntrainedGuard: | ||
| 40 | 35 | result = runner.invoke( |
| 41 | 36 | app, |
| 42 | 37 | [ |
| 43 | - "--home", str(tmp_path / "home"), | |
| 44 | - "serve", str(doc), | |
| 38 | + "--home", | |
| 39 | + str(tmp_path / "home"), | |
| 40 | + "serve", | |
| 41 | + str(doc), | |
| 45 | 42 | ], |
| 46 | 43 | ) |
| 47 | 44 | assert result.exit_code == 1, result.output |
tests/unit/cli/test_train_scaffold_cli.py modified @@ -32,9 +32,7 @@ def _captured() -> dict[str, Any]: | ||
| 32 | 32 | return {} |
| 33 | 33 | |
| 34 | 34 | |
| 35 | -def _install_capturing_fake( | |
| 36 | - monkeypatch: pytest.MonkeyPatch, captured: dict[str, Any] | |
| 37 | -) -> None: | |
| 35 | +def _install_capturing_fake(monkeypatch: pytest.MonkeyPatch, captured: dict[str, Any]) -> None: | |
| 38 | 36 | """Replace `run_phases` with a stub that records call args and |
| 39 | 37 | returns `[]` (triggering the CLI's "no-op: nothing to train" path |
| 40 | 38 | with exit code 0). The scaffold + manifest + expand_sources pipeline |
@@ -80,10 +78,14 @@ class TestDlmTrainDirScaffold: | ||
| 80 | 78 | result = runner.invoke( |
| 81 | 79 | app, |
| 82 | 80 | [ |
| 83 | - "--home", str(tmp_path / "home"), | |
| 84 | - "train", str(corpus), | |
| 85 | - "--base", "smollm2-135m", | |
| 86 | - "--include", "**/*.md", | |
| 81 | + "--home", | |
| 82 | + str(tmp_path / "home"), | |
| 83 | + "train", | |
| 84 | + str(corpus), | |
| 85 | + "--base", | |
| 86 | + "smollm2-135m", | |
| 87 | + "--include", | |
| 88 | + "**/*.md", | |
| 87 | 89 | ], |
| 88 | 90 | ) |
| 89 | 91 | |
@@ -105,12 +107,8 @@ class TestDlmTrainDirScaffold: | ||
| 105 | 107 | always 0.""" |
| 106 | 108 | corpus = tmp_path / "corpus" |
| 107 | 109 | corpus.mkdir() |
| 108 | - (corpus / "alpha.md").write_text( | |
| 109 | - "# Alpha\nalpha-unique-token\n", encoding="utf-8" | |
| 110 | - ) | |
| 111 | - (corpus / "beta.md").write_text( | |
| 112 | - "# Beta\nbeta-unique-token\n", encoding="utf-8" | |
| 113 | - ) | |
| 110 | + (corpus / "alpha.md").write_text("# Alpha\nalpha-unique-token\n", encoding="utf-8") | |
| 111 | + (corpus / "beta.md").write_text("# Beta\nbeta-unique-token\n", encoding="utf-8") | |
| 114 | 112 | |
| 115 | 113 | captured = _captured() |
| 116 | 114 | _install_capturing_fake(monkeypatch, captured) |
@@ -120,10 +118,14 @@ class TestDlmTrainDirScaffold: | ||
| 120 | 118 | result = runner.invoke( |
| 121 | 119 | app, |
| 122 | 120 | [ |
| 123 | - "--home", str(tmp_path / "home"), | |
| 124 | - "train", str(corpus), | |
| 125 | - "--base", "smollm2-135m", | |
| 126 | - "--include", "**/*.md", | |
| 121 | + "--home", | |
| 122 | + str(tmp_path / "home"), | |
| 123 | + "train", | |
| 124 | + str(corpus), | |
| 125 | + "--base", | |
| 126 | + "smollm2-135m", | |
| 127 | + "--include", | |
| 128 | + "**/*.md", | |
| 127 | 129 | ], |
| 128 | 130 | ) |
| 129 | 131 | |
@@ -146,12 +148,8 @@ class TestDlmTrainDirScaffold: | ||
| 146 | 148 | ) |
| 147 | 149 | combined = _section_texts(expanded.sections) |
| 148 | 150 | rendered = "\n".join(f" {s.content[:80]!r}" for s in expanded.sections) |
| 149 | - assert "alpha-unique-token" in combined, ( | |
| 150 | - "B2: alpha.md not ingested. got:\n" + rendered | |
| 151 | - ) | |
| 152 | - assert "beta-unique-token" in combined, ( | |
| 153 | - "B2: beta.md not ingested. got:\n" + rendered | |
| 154 | - ) | |
| 151 | + assert "alpha-unique-token" in combined, "B2: alpha.md not ingested. got:\n" + rendered | |
| 152 | + assert "beta-unique-token" in combined, "B2: beta.md not ingested. got:\n" + rendered | |
| 155 | 153 | assert expanded.provenance[0].file_count == 2 |
| 156 | 154 | assert expanded.provenance[0].total_bytes > 0 |
| 157 | 155 | |
@@ -173,10 +171,14 @@ class TestDlmTrainDirScaffold: | ||
| 173 | 171 | result = runner.invoke( |
| 174 | 172 | app, |
| 175 | 173 | [ |
| 176 | - "--home", str(tmp_path / "home"), | |
| 177 | - "train", str(corpus), | |
| 178 | - "--base", "smollm2-135m", | |
| 179 | - "--include", "**/*.md", | |
| 174 | + "--home", | |
| 175 | + str(tmp_path / "home"), | |
| 176 | + "train", | |
| 177 | + str(corpus), | |
| 178 | + "--base", | |
| 179 | + "smollm2-135m", | |
| 180 | + "--include", | |
| 181 | + "**/*.md", | |
| 180 | 182 | ], |
| 181 | 183 | ) |
| 182 | 184 | |
@@ -217,10 +219,14 @@ class TestDlmTrainDirScaffold: | ||
| 217 | 219 | r1 = runner.invoke( |
| 218 | 220 | app, |
| 219 | 221 | [ |
| 220 | - "--home", str(tmp_path / "home"), | |
| 221 | - "train", str(corpus), | |
| 222 | - "--base", "smollm2-135m", | |
| 223 | - "--include", "**/*.md", | |
| 222 | + "--home", | |
| 223 | + str(tmp_path / "home"), | |
| 224 | + "train", | |
| 225 | + str(corpus), | |
| 226 | + "--base", | |
| 227 | + "smollm2-135m", | |
| 228 | + "--include", | |
| 229 | + "**/*.md", | |
| 224 | 230 | ], |
| 225 | 231 | ) |
| 226 | 232 | assert r1.exit_code == 0, r1.output |
@@ -235,13 +241,14 @@ class TestDlmTrainDirScaffold: | ||
| 235 | 241 | r2 = runner.invoke( |
| 236 | 242 | app, |
| 237 | 243 | [ |
| 238 | - "--home", str(tmp_path / "home"), | |
| 239 | - "train", str(corpus), | |
| 244 | + "--home", | |
| 245 | + str(tmp_path / "home"), | |
| 246 | + "train", | |
| 247 | + str(corpus), | |
| 240 | 248 | ], |
| 241 | 249 | ) |
| 242 | 250 | |
| 243 | 251 | assert r2.exit_code == 0, r2.output |
| 244 | 252 | assert manifest_path.stat().st_mtime_ns == first_mtime, ( |
| 245 | - "manifest was rewritten on the resume path; " | |
| 246 | - "training history could be lost" | |
| 253 | + "manifest was rewritten on the resume path; training history could be lost" | |
| 247 | 254 | ) |
tests/unit/directives/test_cache.py modified @@ -98,9 +98,7 @@ class TestInvalidation: | ||
| 98 | 98 | cache.put(key_a, _tokens(4)) |
| 99 | 99 | assert cache.get(key_b) is None |
| 100 | 100 | |
| 101 | - def test_missing_file_recovers( | |
| 102 | - self, tmp_path: Path, caplog: pytest.LogCaptureFixture | |
| 103 | - ) -> None: | |
| 101 | + def test_missing_file_recovers(self, tmp_path: Path, caplog: pytest.LogCaptureFixture) -> None: | |
| 104 | 102 | """If the on-disk entry vanishes under us, get() should treat |
| 105 | 103 | it as a miss and clean up the stale manifest row.""" |
| 106 | 104 | import logging |
tests/unit/directives/test_defaults.py modified @@ -93,6 +93,4 @@ def test_default_excludes_catch_known_traps(path: str) -> None: | ||
| 93 | 93 | ], |
| 94 | 94 | ) |
| 95 | 95 | def test_default_excludes_leave_source_alone(path: str) -> None: |
| 96 | - assert not _matches_any_default(path), ( | |
| 97 | - f"DEFAULT_EXCLUDES wrongly caught: {path}" | |
| 98 | - ) | |
| 96 | + assert not _matches_any_default(path), f"DEFAULT_EXCLUDES wrongly caught: {path}" | |
tests/unit/directives/test_discovery.py modified @@ -79,9 +79,7 @@ def test_schema_violation_logs_and_continues( | ||
| 79 | 79 | tmp_path: Path, caplog: pytest.LogCaptureFixture |
| 80 | 80 | ) -> None: |
| 81 | 81 | (tmp_path / ".dlm").mkdir() |
| 82 | - (tmp_path / ".dlm" / "training.yaml").write_text( | |
| 83 | - "dlm_training_version: 1\nunknown_key: bad\n" | |
| 84 | - ) | |
| 82 | + (tmp_path / ".dlm" / "training.yaml").write_text("dlm_training_version: 1\nunknown_key: bad\n") | |
| 85 | 83 | caplog.set_level(logging.WARNING, logger="dlm.directives.discovery") |
| 86 | 84 | configs = discover_configs(tmp_path) |
| 87 | 85 | assert configs[0].config is None |
@@ -101,9 +99,7 @@ def test_training_yaml_non_mapping_top_level( | ||
| 101 | 99 | |
| 102 | 100 | def test_both_files_coexist(tmp_path: Path) -> None: |
| 103 | 101 | (tmp_path / ".dlm").mkdir() |
| 104 | - (tmp_path / ".dlm" / "training.yaml").write_text( | |
| 105 | - "dlm_training_version: 1\nexclude: ['a']\n" | |
| 106 | - ) | |
| 102 | + (tmp_path / ".dlm" / "training.yaml").write_text("dlm_training_version: 1\nexclude: ['a']\n") | |
| 107 | 103 | (tmp_path / ".dlm" / "ignore").write_text("*.tmp\n") |
| 108 | 104 | (c,) = discover_configs(tmp_path) |
| 109 | 105 | assert c.config is not None |
tests/unit/directives/test_expand.py modified @@ -81,12 +81,7 @@ def test_max_files_truncates_deterministically(tmp_path: Path) -> None: | ||
| 81 | 81 | src.mkdir() |
| 82 | 82 | for i in range(5): |
| 83 | 83 | (src / f"{i}.py").write_text(f"# {i}\n") |
| 84 | - body = ( | |
| 85 | - " sources:\n" | |
| 86 | - " - path: src\n" | |
| 87 | - " include: ['**/*.py']\n" | |
| 88 | - " max_files: 2\n" | |
| 89 | - ) | |
| 84 | + body = " sources:\n - path: src\n include: ['**/*.py']\n max_files: 2\n" | |
| 90 | 85 | parsed, _ = _make_parsed(body, tmp_path) |
| 91 | 86 | result = expand_sources(parsed, base_path=tmp_path) # type: ignore[arg-type] |
| 92 | 87 | # Sorted: 0.py, 1.py land; 2/3/4 get dropped |
@@ -101,12 +96,7 @@ def test_max_bytes_per_file_skips_oversize(tmp_path: Path) -> None: | ||
| 101 | 96 | src.mkdir() |
| 102 | 97 | (src / "small.py").write_text("x\n") # 2 bytes |
| 103 | 98 | (src / "big.py").write_text("x" * 100) |
| 104 | - body = ( | |
| 105 | - " sources:\n" | |
| 106 | - " - path: src\n" | |
| 107 | - " include: ['**/*.py']\n" | |
| 108 | - " max_bytes_per_file: 10\n" | |
| 109 | - ) | |
| 99 | + body = " sources:\n - path: src\n include: ['**/*.py']\n max_bytes_per_file: 10\n" | |
| 110 | 100 | parsed, _ = _make_parsed(body, tmp_path) |
| 111 | 101 | result = expand_sources(parsed, base_path=tmp_path) # type: ignore[arg-type] |
| 112 | 102 | assert len(result.sections) == 1 |
@@ -157,11 +147,7 @@ def test_strict_policy_refuses_external_path(tmp_path: Path) -> None: | ||
| 157 | 147 | outside.mkdir(exist_ok=True) |
| 158 | 148 | try: |
| 159 | 149 | (outside / "a.py").write_text("x") |
| 160 | - body = ( | |
| 161 | - " sources_policy: strict\n" | |
| 162 | - " sources:\n" | |
| 163 | - f" - path: {outside}\n" | |
| 164 | - ) | |
| 150 | + body = f" sources_policy: strict\n sources:\n - path: {outside}\n" | |
| 165 | 151 | parsed, _ = _make_parsed(body, tmp_path) |
| 166 | 152 | with pytest.raises(DirectivePolicyError): |
| 167 | 153 | expand_sources(parsed, base_path=tmp_path) # type: ignore[arg-type] |
@@ -176,7 +162,7 @@ def test_permissive_policy_allows_external_path(tmp_path: Path) -> None: | ||
| 176 | 162 | outside.mkdir(exist_ok=True) |
| 177 | 163 | try: |
| 178 | 164 | (outside / "a.py").write_text("ok\n") |
| 179 | - body = " sources:\n" f" - path: {outside}\n include: ['**/*.py']\n" | |
| 165 | + body = f" sources:\n - path: {outside}\n include: ['**/*.py']\n" | |
| 180 | 166 | parsed, _ = _make_parsed(body, tmp_path) |
| 181 | 167 | result = expand_sources(parsed, base_path=tmp_path) # type: ignore[arg-type] |
| 182 | 168 | assert len(result.sections) == 1 |
tests/unit/directives/test_merge.py modified @@ -99,18 +99,24 @@ def test_training_yaml_exclude_blocks_file(tmp_path: Path) -> None: | ||
| 99 | 99 | ) |
| 100 | 100 | directive = _directive(tmp_path, include=("**/*.py",)) |
| 101 | 101 | configs = discover_configs(tmp_path) |
| 102 | - assert effective_config_for( | |
| 103 | - tmp_path / "src" / "main.py", | |
| 104 | - source_root=tmp_path, | |
| 105 | - discovered=configs, | |
| 106 | - parent_directive=directive, | |
| 107 | - ).included is True | |
| 108 | - assert effective_config_for( | |
| 109 | - tmp_path / "src" / "test_main.py", | |
| 110 | - source_root=tmp_path, | |
| 111 | - discovered=configs, | |
| 112 | - parent_directive=directive, | |
| 113 | - ).included is False | |
| 102 | + assert ( | |
| 103 | + effective_config_for( | |
| 104 | + tmp_path / "src" / "main.py", | |
| 105 | + source_root=tmp_path, | |
| 106 | + discovered=configs, | |
| 107 | + parent_directive=directive, | |
| 108 | + ).included | |
| 109 | + is True | |
| 110 | + ) | |
| 111 | + assert ( | |
| 112 | + effective_config_for( | |
| 113 | + tmp_path / "src" / "test_main.py", | |
| 114 | + source_root=tmp_path, | |
| 115 | + discovered=configs, | |
| 116 | + parent_directive=directive, | |
| 117 | + ).included | |
| 118 | + is False | |
| 119 | + ) | |
| 114 | 120 | |
| 115 | 121 | |
| 116 | 122 | # ---- .dlm/ignore negation -------------------------------------------------- |
@@ -136,18 +142,24 @@ def test_ignore_negation_re_includes_file(tmp_path: Path) -> None: | ||
| 136 | 142 | _write(tmp_path / ".dlm" / "ignore", "*.log\n!special.log\n") |
| 137 | 143 | directive = _directive(tmp_path) |
| 138 | 144 | configs = discover_configs(tmp_path) |
| 139 | - assert effective_config_for( | |
| 140 | - tmp_path / "debug.log", | |
| 141 | - source_root=tmp_path, | |
| 142 | - discovered=configs, | |
| 143 | - parent_directive=directive, | |
| 144 | - ).included is False | |
| 145 | - assert effective_config_for( | |
| 146 | - tmp_path / "special.log", | |
| 147 | - source_root=tmp_path, | |
| 148 | - discovered=configs, | |
| 149 | - parent_directive=directive, | |
| 150 | - ).included is True | |
| 145 | + assert ( | |
| 146 | + effective_config_for( | |
| 147 | + tmp_path / "debug.log", | |
| 148 | + source_root=tmp_path, | |
| 149 | + discovered=configs, | |
| 150 | + parent_directive=directive, | |
| 151 | + ).included | |
| 152 | + is False | |
| 153 | + ) | |
| 154 | + assert ( | |
| 155 | + effective_config_for( | |
| 156 | + tmp_path / "special.log", | |
| 157 | + source_root=tmp_path, | |
| 158 | + discovered=configs, | |
| 159 | + parent_directive=directive, | |
| 160 | + ).included | |
| 161 | + is True | |
| 162 | + ) | |
| 151 | 163 | |
| 152 | 164 | |
| 153 | 165 | def test_deeper_ignore_negation_unblocks_parent_exclude(tmp_path: Path) -> None: |
@@ -176,18 +188,24 @@ def test_default_excludes_apply_by_default(tmp_path: Path) -> None: | ||
| 176 | 188 | _write(tmp_path / "src" / "main.py", "x") |
| 177 | 189 | directive = _directive(tmp_path) |
| 178 | 190 | configs = discover_configs(tmp_path) |
| 179 | - assert effective_config_for( | |
| 180 | - tmp_path / ".git" / "HEAD", | |
| 181 | - source_root=tmp_path, | |
| 182 | - discovered=configs, | |
| 183 | - parent_directive=directive, | |
| 184 | - ).included is False | |
| 185 | - assert effective_config_for( | |
| 186 | - tmp_path / "src" / "main.py", | |
| 187 | - source_root=tmp_path, | |
| 188 | - discovered=configs, | |
| 189 | - parent_directive=directive, | |
| 190 | - ).included is True | |
| 191 | + assert ( | |
| 192 | + effective_config_for( | |
| 193 | + tmp_path / ".git" / "HEAD", | |
| 194 | + source_root=tmp_path, | |
| 195 | + discovered=configs, | |
| 196 | + parent_directive=directive, | |
| 197 | + ).included | |
| 198 | + is False | |
| 199 | + ) | |
| 200 | + assert ( | |
| 201 | + effective_config_for( | |
| 202 | + tmp_path / "src" / "main.py", | |
| 203 | + source_root=tmp_path, | |
| 204 | + discovered=configs, | |
| 205 | + parent_directive=directive, | |
| 206 | + ).included | |
| 207 | + is True | |
| 208 | + ) | |
| 191 | 209 | |
| 192 | 210 | |
| 193 | 211 | def test_exclude_defaults_false_disables_default_set(tmp_path: Path) -> None: |
@@ -230,9 +248,9 @@ def test_metadata_shallow_to_deep_merge(tmp_path: Path) -> None: | ||
| 230 | 248 | parent_directive=directive, |
| 231 | 249 | ) |
| 232 | 250 | assert eff.tags == { |
| 233 | - "language": "python", # from shallower | |
| 251 | + "language": "python", # from shallower | |
| 234 | 252 | "domain": "vendor_override", # deeper overrides shallower |
| 235 | - "source": "third_party", # from deeper only | |
| 253 | + "source": "third_party", # from deeper only | |
| 236 | 254 | } |
| 237 | 255 | |
| 238 | 256 | |
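For context on the metadata hunk just above: the shallow-to-deep precedence the inline comments describe amounts to a key-by-key dict update in which the deeper `.dlm/training.yaml` wins. A minimal sketch with illustrative values — only the merged result mirrors the test; the shallower `domain: app` entry is invented for the example:

```python
def merge_tags(shallow_to_deep: list[dict[str, str]]) -> dict[str, str]:
    # Entries are ordered root -> deepest directory; later (deeper) metadata overrides key-by-key.
    merged: dict[str, str] = {}
    for tags in shallow_to_deep:
        merged.update(tags or {})
    return merged

merge_tags(
    [
        {"language": "python", "domain": "app"},                   # root .dlm/training.yaml (illustrative)
        {"domain": "vendor_override", "source": "third_party"},    # deeper, vendored subtree
    ]
)
# -> {"language": "python", "domain": "vendor_override", "source": "third_party"}
```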
tests/unit/directives/test_safety.py modified @@ -130,11 +130,7 @@ def test_enumerate_is_deterministic(tmp_path: Path) -> None: | ||
| 130 | 130 | def test_enumerate_exclude_wins(tmp_path: Path) -> None: |
| 131 | 131 | (tmp_path / "keep.py").write_text("x") |
| 132 | 132 | (tmp_path / "skip.py").write_text("x") |
| 133 | - got = list( | |
| 134 | - enumerate_matching_files( | |
| 135 | - tmp_path, include=("**/*.py",), exclude=("skip.py",) | |
| 136 | - ) | |
| 137 | - ) | |
| 133 | + got = list(enumerate_matching_files(tmp_path, include=("**/*.py",), exclude=("skip.py",))) | |
| 138 | 134 | assert [p.name for p in got] == ["keep.py"] |
| 139 | 135 | |
| 140 | 136 | |
tests/unit/doc/test_fence_adapter_suffix.py modified @@ -43,9 +43,7 @@ class TestParseFenceSuffix: | ||
| 43 | 43 | assert instr[0].adapter == "tone" |
| 44 | 44 | |
| 45 | 45 | def test_preference_fence_adapter(self) -> None: |
| 46 | - parsed = _parse( | |
| 47 | - "::preference#knowledge::\n### Prompt\nq\n### Chosen\nc\n### Rejected\nr\n" | |
| 48 | - ) | |
| 46 | + parsed = _parse("::preference#knowledge::\n### Prompt\nq\n### Chosen\nc\n### Rejected\nr\n") | |
| 49 | 47 | pref = [s for s in parsed.sections if s.type == SectionType.PREFERENCE] |
| 50 | 48 | assert pref |
| 51 | 49 | assert pref[0].adapter == "knowledge" |
@@ -97,9 +95,7 @@ class TestSectionIdentityUnchanged: | ||
| 97 | 95 | """Routing is structural, not content — same content with and |
| 98 | 96 | without a `#adapter` suffix must produce the same section_id |
| 99 | 97 | so replay snapshots don't duplicate rows on routing edits.""" |
| 100 | - s_plain = Section( | |
| 101 | - type=SectionType.INSTRUCTION, content="### Q\nhi\n### A\nbye" | |
| 102 | - ) | |
| 98 | + s_plain = Section(type=SectionType.INSTRUCTION, content="### Q\nhi\n### A\nbye") | |
| 103 | 99 | s_routed = Section( |
| 104 | 100 | type=SectionType.INSTRUCTION, |
| 105 | 101 | content="### Q\nhi\n### A\nbye", |
tests/unit/doc/test_migration_v1_to_v2.py modified @@ -87,9 +87,7 @@ class TestPartialDpoBlock: | ||
| 87 | 87 | |
| 88 | 88 | class TestReferenceRename: |
| 89 | 89 | def test_pre_dpo_adapter_becomes_pre_adapter(self) -> None: |
| 90 | - raw: dict[str, Any] = { | |
| 91 | - "training": {"dpo": {"reference": "pre_dpo_adapter"}} | |
| 92 | - } | |
| 90 | + raw: dict[str, Any] = {"training": {"dpo": {"reference": "pre_dpo_adapter"}}} | |
| 93 | 91 | out = migrate(raw) |
| 94 | 92 | assert out["training"]["preference"]["reference"] == "pre_adapter" |
| 95 | 93 | |
tests/unit/doc/test_round_trip_v4_adapters.py modified @@ -51,9 +51,7 @@ def test_round_trip_v4_multi_adapter_doc_is_idempotent() -> None: | ||
| 51 | 51 | |
| 52 | 52 | once = serialize(parse_text(original)) |
| 53 | 53 | twice = serialize(parse_text(once)) |
| 54 | - assert once == twice, ( | |
| 55 | - "v4 adapters doc not idempotent under serialize round-trip" | |
| 56 | - ) | |
| 54 | + assert once == twice, "v4 adapters doc not idempotent under serialize round-trip" | |
| 57 | 55 | |
| 58 | 56 | |
| 59 | 57 | def test_round_trip_preserves_fence_suffixes() -> None: |
tests/unit/doc/test_schema.py modified @@ -192,9 +192,7 @@ class TestTrainingConfigPreferenceSubfield: | ||
| 192 | 192 | |
| 193 | 193 | def test_rejects_unknown_field_inside_preference(self) -> None: |
| 194 | 194 | with pytest.raises(ValidationError): |
| 195 | - TrainingConfig.model_validate( | |
| 196 | - {"preference": {"enabled": True, "rubbish": 1}} | |
| 197 | - ) | |
| 195 | + TrainingConfig.model_validate({"preference": {"enabled": True, "rubbish": 1}}) | |
| 198 | 196 | |
| 199 | 197 | |
| 200 | 198 | class TestCptConfig: |
@@ -233,17 +231,13 @@ class TestTrainingConfigCptSubfield: | ||
| 233 | 231 | assert t.cpt.embed_warmup_steps == 0 |
| 234 | 232 | |
| 235 | 233 | def test_accepts_nested_dict_for_cpt(self) -> None: |
| 236 | - t = TrainingConfig.model_validate( | |
| 237 | - {"cpt": {"schedule": "dapt", "embed_warmup_steps": 200}} | |
| 238 | - ) | |
| 234 | + t = TrainingConfig.model_validate({"cpt": {"schedule": "dapt", "embed_warmup_steps": 200}}) | |
| 239 | 235 | assert t.cpt.schedule == "dapt" |
| 240 | 236 | assert t.cpt.embed_warmup_steps == 200 |
| 241 | 237 | |
| 242 | 238 | def test_rejects_unknown_field_inside_cpt(self) -> None: |
| 243 | 239 | with pytest.raises(ValidationError): |
| 244 | - TrainingConfig.model_validate( | |
| 245 | - {"cpt": {"schedule": "dapt", "rubbish": 1}} | |
| 246 | - ) | |
| 240 | + TrainingConfig.model_validate({"cpt": {"schedule": "dapt", "rubbish": 1}}) | |
| 247 | 241 | |
| 248 | 242 | |
| 249 | 243 | class TestAdapterConfig: |
@@ -317,15 +311,11 @@ class TestNamedAdapters: | ||
| 317 | 311 | |
| 318 | 312 | def test_flat_lora_r_with_block_rejected(self) -> None: |
| 319 | 313 | with pytest.raises(ValidationError, match="flat per-adapter fields"): |
| 320 | - TrainingConfig.model_validate( | |
| 321 | - {"lora_r": 32, "adapters": {"knowledge": {}}} | |
| 322 | - ) | |
| 314 | + TrainingConfig.model_validate({"lora_r": 32, "adapters": {"knowledge": {}}}) | |
| 323 | 315 | |
| 324 | 316 | def test_flat_learning_rate_with_block_rejected(self) -> None: |
| 325 | 317 | with pytest.raises(ValidationError, match="flat per-adapter fields"): |
| 326 | - TrainingConfig.model_validate( | |
| 327 | - {"learning_rate": 1e-3, "adapters": {"tone": {}}} | |
| 328 | - ) | |
| 318 | + TrainingConfig.model_validate({"learning_rate": 1e-3, "adapters": {"tone": {}}}) | |
| 329 | 319 | |
| 330 | 320 | def test_top_level_shared_knobs_allowed_alongside_block(self) -> None: |
| 331 | 321 | # seed, num_epochs, sequence_len, etc. are explicitly shared |
tests/unit/eval/test_summary.py modified @@ -130,9 +130,7 @@ class TestMixedModeFields: | ||
| 130 | 130 | |
| 131 | 131 | class TestSplitLossByMode: |
| 132 | 132 | def test_mixed_rows(self) -> None: |
| 133 | - out = split_loss_by_mode( | |
| 134 | - [(1.0, "cpt"), (2.0, "cpt"), (0.5, "sft"), (1.5, "sft")] | |
| 135 | - ) | |
| 133 | + out = split_loss_by_mode([(1.0, "cpt"), (2.0, "cpt"), (0.5, "sft"), (1.5, "sft")]) | |
| 136 | 134 | assert out == LossByMode(cpt=1.5, sft=1.0) |
| 137 | 135 | |
| 138 | 136 | def test_all_cpt(self) -> None: |
@@ -151,9 +149,7 @@ class TestSplitLossByMode: | ||
| 151 | 149 | assert out.sft is None |
| 152 | 150 | |
| 153 | 151 | def test_unknown_modes_ignored(self) -> None: |
| 154 | - out = split_loss_by_mode( | |
| 155 | - [(1.0, "cpt"), (2.0, "preference"), (3.0, "other")] | |
| 156 | - ) | |
| 152 | + out = split_loss_by_mode([(1.0, "cpt"), (2.0, "preference"), (3.0, "other")]) | |
| 157 | 153 | assert out.cpt == pytest.approx(1.0) |
| 158 | 154 | assert out.sft is None |
| 159 | 155 | |
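The `split_loss_by_mode` assertions reflowed above pin down its contract: per-mode mean loss, `None` where a mode has no rows, and modes other than `cpt`/`sft` silently ignored. A self-contained sketch consistent with those assertions — `LossByMode` is re-declared here only so the example runs standalone; the real definition is whatever the eval summary module ships:

```python
from dataclasses import dataclass


@dataclass
class LossByMode:
    cpt: float | None = None
    sft: float | None = None


def split_loss_by_mode(rows: list[tuple[float, str]]) -> LossByMode:
    # Mean loss per recognised mode; unknown modes ("preference", "other", ...) are dropped.
    buckets: dict[str, list[float]] = {"cpt": [], "sft": []}
    for loss, mode in rows:
        if mode in buckets:
            buckets[mode].append(loss)

    def _mean(values: list[float]) -> float | None:
        return sum(values) / len(values) if values else None

    return LossByMode(cpt=_mean(buckets["cpt"]), sft=_mean(buckets["sft"]))


assert split_loss_by_mode([(1.0, "cpt"), (2.0, "cpt"), (0.5, "sft"), (1.5, "sft")]) == LossByMode(1.5, 1.0)
```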
tests/unit/export/test_vendoring.py modified @@ -73,9 +73,7 @@ class TestLlamaQuantizeBin: | ||
| 73 | 73 | assert path.is_file() |
| 74 | 74 | assert path.name == "llama-quantize" |
| 75 | 75 | |
| 76 | - def test_missing_binary_raises( | |
| 77 | - self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch | |
| 78 | - ) -> None: | |
| 76 | + def test_missing_binary_raises(self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> None: | |
| 79 | 77 | # Clear PATH so the `shutil.which` fallback can't find a |
| 80 | 78 | # brew-installed llama-quantize on the developer's machine. |
| 81 | 79 | monkeypatch.setenv("PATH", str(tmp_path / "empty")) |
tests/unit/export/test_weighted_merge.py modified @@ -128,9 +128,7 @@ class TestResolveFirstSourcePath: | ||
| 128 | 128 | with pytest.raises(InvalidMixSpecError, match="empty mix"): |
| 129 | 129 | resolve_first_source_path(store, []) |
| 130 | 130 | |
| 131 | - def test_missing_adapter_raises_export_error( | |
| 132 | - self, tmp_path | |
| 133 | - ) -> None: # type: ignore[no-untyped-def] | |
| 131 | + def test_missing_adapter_raises_export_error(self, tmp_path) -> None: # type: ignore[no-untyped-def] | |
| 134 | 132 | from dlm.export.errors import ExportError |
| 135 | 133 | from dlm.export.weighted_merge import resolve_first_source_path |
| 136 | 134 | from dlm.store.paths import StorePath |
tests/unit/hardware/test_capabilities.py modified @@ -84,9 +84,7 @@ class TestMlxAvailability: | ||
| 84 | 84 | caps = probe() |
| 85 | 85 | assert caps.has_mlx is True |
| 86 | 86 | |
| 87 | - def test_mps_reports_no_mlx_when_mlx_lm_missing( | |
| 88 | - self, monkeypatch: pytest.MonkeyPatch | |
| 89 | - ) -> None: | |
| 87 | + def test_mps_reports_no_mlx_when_mlx_lm_missing(self, monkeypatch: pytest.MonkeyPatch) -> None: | |
| 90 | 88 | from dlm.hardware import capabilities as caps_mod |
| 91 | 89 | |
| 92 | 90 | real_avail = caps_mod._module_available |
tests/unit/hardware/test_f28_multi_adapter_qlora.py modified @@ -14,17 +14,13 @@ from tests.fixtures.hardware_mocks import force_cuda | ||
| 14 | 14 | |
| 15 | 15 | def _qlora_multi_doc(num: int) -> TrainingConfig: |
| 16 | 16 | """TrainingConfig with `num` QLoRA adapters declared.""" |
| 17 | - adapters = { | |
| 18 | - f"a{i}": AdapterConfig(adapter="qlora") for i in range(num) | |
| 19 | - } | |
| 17 | + adapters = {f"a{i}": AdapterConfig(adapter="qlora") for i in range(num)} | |
| 20 | 18 | return TrainingConfig.model_validate({"adapters": adapters}) |
| 21 | 19 | |
| 22 | 20 | |
| 23 | 21 | def _qlora_multi_doc_with_rank(num: int, lora_r: int) -> TrainingConfig: |
| 24 | 22 | """Multi-adapter doc with `num` QLoRA adapters at the given lora_r.""" |
| 25 | - adapters = { | |
| 26 | - f"a{i}": AdapterConfig(adapter="qlora", lora_r=lora_r) for i in range(num) | |
| 27 | - } | |
| 23 | + adapters = {f"a{i}": AdapterConfig(adapter="qlora", lora_r=lora_r) for i in range(num)} | |
| 28 | 24 | return TrainingConfig.model_validate({"adapters": adapters}) |
| 29 | 25 | |
| 30 | 26 | |
@@ -85,9 +81,7 @@ class TestF28MultiAdapterQLoraRefusal: | ||
| 85 | 81 | adapters = {"a0": AdapterConfig(), "a1": AdapterConfig()} |
| 86 | 82 | lora_multi = TrainingConfig.model_validate({"adapters": adapters}) |
| 87 | 83 | # LoRA bypasses QLoRA refusals entirely. |
| 88 | - check_refusals( | |
| 89 | - lora_multi, caps, base_params=1_500_000_000, num_adapters=2 | |
| 90 | - ) | |
| 84 | + check_refusals(lora_multi, caps, base_params=1_500_000_000, num_adapters=2) | |
| 91 | 85 | |
| 92 | 86 | def test_small_base_low_rank_multi_qlora_passes(self) -> None: |
| 93 | 87 | """The old formula falsely refused small-base multi-QLoRA. |
@@ -136,9 +130,7 @@ class TestEffectiveAdapter: | ||
| 136 | 130 | } |
| 137 | 131 | ) |
| 138 | 132 | with pytest.raises(ResolutionError, match="Multi-adapter QLoRA"): |
| 139 | - check_refusals( | |
| 140 | - mixed, caps, base_params=7_000_000_000, num_adapters=3 | |
| 141 | - ) | |
| 133 | + check_refusals(mixed, caps, base_params=7_000_000_000, num_adapters=3) | |
| 142 | 134 | |
| 143 | 135 | def test_mixed_adapter_error_names_only_qlora_offenders(self) -> None: |
| 144 | 136 | with force_cuda(vram_gb=12.0): |
@@ -153,9 +145,7 @@ class TestEffectiveAdapter: | ||
| 153 | 145 | } |
| 154 | 146 | ) |
| 155 | 147 | with pytest.raises(ResolutionError) as exc_info: |
| 156 | - check_refusals( | |
| 157 | - mixed, caps, base_params=7_000_000_000, num_adapters=3 | |
| 158 | - ) | |
| 148 | + check_refusals(mixed, caps, base_params=7_000_000_000, num_adapters=3) | |
| 159 | 149 | message = str(exc_info.value) |
| 160 | 150 | assert "qlora_one" in message |
| 161 | 151 | assert "lora_a" not in message |
tests/unit/hardware/test_plan.py modified @@ -45,9 +45,7 @@ class TestPrecisionPicker: | ||
| 45 | 45 | with force_mps(): |
| 46 | 46 | caps = probe() |
| 47 | 47 | with caplog.at_level(logging.WARNING, logger="dlm.hardware.plan"): # type: ignore[attr-defined] |
| 48 | - plan = resolve( | |
| 49 | - _cfg(precision="fp16"), caps, base_params=8_000_000_000, seq_len=2048 | |
| 50 | - ) | |
| 48 | + plan = resolve(_cfg(precision="fp16"), caps, base_params=8_000_000_000, seq_len=2048) | |
| 51 | 49 | assert plan.precision == "fp16" |
| 52 | 50 | # The caller must see the risk explicitly — silent fp16 on MPS |
| 53 | 51 | # is what caused the original bug. |
@@ -63,9 +61,7 @@ class TestPrecisionPicker: | ||
| 63 | 61 | with force_mps(): |
| 64 | 62 | caps = probe() |
| 65 | 63 | with caplog.at_level(logging.WARNING, logger="dlm.hardware.plan"): # type: ignore[attr-defined] |
| 66 | - plan = resolve( | |
| 67 | - _cfg(precision="bf16"), caps, base_params=1_500_000_000, seq_len=2048 | |
| 68 | - ) | |
| 64 | + plan = resolve(_cfg(precision="bf16"), caps, base_params=1_500_000_000, seq_len=2048) | |
| 69 | 65 | assert plan.precision == "bf16" |
| 70 | 66 | assert caplog.records == [] # type: ignore[attr-defined] |
| 71 | 67 | |
@@ -73,9 +69,7 @@ class TestPrecisionPicker: | ||
| 73 | 69 | # CUDA default is bf16 (Ampere+) — override to fp32 honored. |
| 74 | 70 | with force_cuda(sm=(8, 0)): |
| 75 | 71 | caps = probe() |
| 76 | - plan = resolve( | |
| 77 | - _cfg(precision="fp32"), caps, base_params=1_500_000_000, seq_len=2048 | |
| 78 | - ) | |
| 72 | + plan = resolve(_cfg(precision="fp32"), caps, base_params=1_500_000_000, seq_len=2048) | |
| 79 | 73 | assert plan.precision == "fp32" |
| 80 | 74 | |
| 81 | 75 | |
@@ -204,9 +198,7 @@ class TestDpoPhaseAdjustments: | ||
| 204 | 198 | # at 1, not round to 0. |
| 205 | 199 | with force_cuda(sm=(8, 9), vram_gb=4.0): |
| 206 | 200 | caps = probe() |
| 207 | - dpo = resolve( | |
| 208 | - _cfg(), caps, base_params=1_500_000_000, seq_len=2048, phase="dpo" | |
| 209 | - ) | |
| 201 | + dpo = resolve(_cfg(), caps, base_params=1_500_000_000, seq_len=2048, phase="dpo") | |
| 210 | 202 | assert dpo.micro_batch_size >= 1 |
| 211 | 203 | |
| 212 | 204 | def test_dpo_peak_vram_exceeds_sft(self) -> None: |
@@ -228,12 +220,8 @@ class TestDpoPhaseAdjustments: | ||
| 228 | 220 | def test_dpo_reason_mentions_phase(self) -> None: |
| 229 | 221 | with force_cuda(sm=(8, 9), vram_gb=24.0): |
| 230 | 222 | caps = probe() |
| 231 | - dpo = resolve( | |
| 232 | - _cfg(), caps, base_params=1_500_000_000, seq_len=2048, phase="dpo" | |
| 233 | - ) | |
| 234 | - sft = resolve( | |
| 235 | - _cfg(), caps, base_params=1_500_000_000, seq_len=2048, phase="sft" | |
| 236 | - ) | |
| 223 | + dpo = resolve(_cfg(), caps, base_params=1_500_000_000, seq_len=2048, phase="dpo") | |
| 224 | + sft = resolve(_cfg(), caps, base_params=1_500_000_000, seq_len=2048, phase="sft") | |
| 237 | 225 | assert "phase=dpo" in dpo.reason |
| 238 | 226 | assert "phase=dpo" not in sft.reason |
| 239 | 227 | |
tests/unit/inference/test_resolve_adapter_path.py modified @@ -49,13 +49,9 @@ class TestNamedLayout: | ||
| 49 | 49 | v1 = s.adapter_version_for("knowledge", 1) |
| 50 | 50 | v1.mkdir(parents=True) |
| 51 | 51 | s.set_current_adapter_for("knowledge", v1) |
| 52 | - assert ( | |
| 53 | - resolve_adapter_path(s, adapter_name="knowledge") == v1.resolve() | |
| 54 | - ) | |
| 52 | + assert resolve_adapter_path(s, adapter_name="knowledge") == v1.resolve() | |
| 55 | 53 | |
| 56 | - def test_missing_named_pointer_mentions_adapter_name( | |
| 57 | - self, tmp_path: Path | |
| 58 | - ) -> None: | |
| 54 | + def test_missing_named_pointer_mentions_adapter_name(self, tmp_path: Path) -> None: | |
| 59 | 55 | s = _store(tmp_path) |
| 60 | 56 | s.ensure_adapter_layout("knowledge") |
| 61 | 57 | with pytest.raises(AdapterNotFoundError, match="'knowledge'"): |
tests/unit/lock/test_mismatch_policy.py modified @@ -49,9 +49,9 @@ class TestAccelerateUninstall: | ||
| 49 | 49 | current = _lock(pinned_versions={"torch": "2.5.1"}) |
| 50 | 50 | msgs = [m for _s, m in classify_mismatches(prior, current)] |
| 51 | 51 | # `_rule_minor_peers` fires on peer disappear with "no longer pinned". |
| 52 | - assert any( | |
| 53 | - "accelerate" in m and "no longer pinned" in m for m in msgs | |
| 54 | - ), f"expected accelerate-removal warning, got {msgs!r}" | |
| 52 | + assert any("accelerate" in m and "no longer pinned" in m for m in msgs), ( | |
| 53 | + f"expected accelerate-removal warning, got {msgs!r}" | |
| 54 | + ) | |
| 55 | 55 | |
| 56 | 56 | |
| 57 | 57 | class TestWorldSize: |
tests/unit/metrics/test_db_schema.py modified @@ -20,10 +20,7 @@ class TestConnect: | ||
| 20 | 20 | def test_creates_schema(self, tmp_path: Path) -> None: |
| 21 | 21 | with connect(tmp_path) as conn: |
| 22 | 22 | tables = { |
| 23 | - row[0] | |
| 24 | - for row in conn.execute( | |
| 25 | - "SELECT name FROM sqlite_master WHERE type='table'" | |
| 26 | - ) | |
| 23 | + row[0] for row in conn.execute("SELECT name FROM sqlite_master WHERE type='table'") | |
| 27 | 24 | } |
| 28 | 25 | assert tables == {"runs", "steps", "evals", "exports", "tokenization"} |
| 29 | 26 | |
@@ -65,14 +62,10 @@ class TestEnsureSchema: | ||
| 65 | 62 | conn.execute( |
| 66 | 63 | "INSERT INTO runs (run_id, started_at, status) VALUES (1, 'now', 'running')" |
| 67 | 64 | ) |
| 68 | - conn.execute( | |
| 69 | - "INSERT INTO steps (run_id, step, loss, at) VALUES (1, 1, 0.5, 'now')" | |
| 70 | - ) | |
| 65 | + conn.execute("INSERT INTO steps (run_id, step, loss, at) VALUES (1, 1, 0.5, 'now')") | |
| 71 | 66 | # Duplicate (1, 1) should violate PK unless we upsert. |
| 72 | 67 | try: |
| 73 | - conn.execute( | |
| 74 | - "INSERT INTO steps (run_id, step, loss, at) VALUES (1, 1, 0.4, 'now')" | |
| 75 | - ) | |
| 68 | + conn.execute("INSERT INTO steps (run_id, step, loss, at) VALUES (1, 1, 0.4, 'now')") | |
| 76 | 69 | raise AssertionError("duplicate PK accepted") |
| 77 | 70 | except sqlite3.IntegrityError: |
| 78 | 71 | pass |
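The `try`/`except sqlite3.IntegrityError` above is checking that `(run_id, step)` really is a composite primary key; the comment's point is that re-recording the same step must go through an upsert rather than a plain `INSERT`. A reduced sketch of that upsert — the column set is taken from the test, the real schema may carry more fields and foreign keys:

```python
import sqlite3

conn = sqlite3.connect(":memory:")
conn.execute(
    "CREATE TABLE steps (run_id INTEGER, step INTEGER, loss REAL, at TEXT, "
    "PRIMARY KEY (run_id, step))"
)
conn.execute("INSERT INTO steps (run_id, step, loss, at) VALUES (1, 1, 0.5, 'now')")
# A second plain INSERT for (1, 1) raises sqlite3.IntegrityError; an upsert replaces the row instead.
conn.execute(
    "INSERT INTO steps (run_id, step, loss, at) VALUES (1, 1, 0.4, 'later') "
    "ON CONFLICT(run_id, step) DO UPDATE SET loss = excluded.loss, at = excluded.at"
)
assert conn.execute("SELECT loss FROM steps WHERE run_id = 1 AND step = 1").fetchone()[0] == 0.4
```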
tests/unit/metrics/test_queries.py modified @@ -22,9 +22,7 @@ def _seed(store_root: Path) -> None: | ||
| 22 | 22 | """Populate a DB with three runs and a handful of steps/evals.""" |
| 23 | 23 | rec = MetricsRecorder(store_root) |
| 24 | 24 | for run_id in (1, 2, 3): |
| 25 | - rec.record_run_start( | |
| 26 | - RunStart(run_id=run_id, adapter_version=run_id, phase="sft", seed=42) | |
| 27 | - ) | |
| 25 | + rec.record_run_start(RunStart(run_id=run_id, adapter_version=run_id, phase="sft", seed=42)) | |
| 28 | 26 | for step in (10, 20, 30): |
| 29 | 27 | rec.record_step(StepEvent(run_id=run_id, step=step, loss=2.0 - 0.1 * step)) |
| 30 | 28 | rec.record_eval(EvalEvent(run_id=run_id, step=30, val_loss=1.5)) |
tests/unit/replay/test_store.py modified @@ -90,29 +90,21 @@ class TestSampleRows: | ||
| 90 | 90 | assert raw_sid in rows[0]["_dlm_section_id"] |
| 91 | 91 | |
| 92 | 92 | |
| 93 | -_PREF_BODY_A = ( | |
| 94 | - "### Prompt\nqA\n### Chosen\ncA\n### Rejected\nrA" | |
| 95 | -) | |
| 96 | -_PREF_BODY_B = ( | |
| 97 | - "### Prompt\nqB\n### Chosen\ncB\n### Rejected\nrB" | |
| 98 | -) | |
| 93 | +_PREF_BODY_A = "### Prompt\nqA\n### Chosen\ncA\n### Rejected\nrA" | |
| 94 | +_PREF_BODY_B = "### Prompt\nqB\n### Chosen\ncB\n### Rejected\nrB" | |
| 99 | 95 | |
| 100 | 96 | |
| 101 | 97 | class TestSamplePreferenceRows: |
| 102 | 98 | def test_empty_corpus_returns_empty(self, tmp_path: Path) -> None: |
| 103 | 99 | s = _store(tmp_path) |
| 104 | - rows = s.sample_preference_rows( | |
| 105 | - k=5, now=datetime(2026, 4, 1), rng=random.Random(0) | |
| 106 | - ) | |
| 100 | + rows = s.sample_preference_rows(k=5, now=datetime(2026, 4, 1), rng=random.Random(0)) | |
| 107 | 101 | assert rows == [] |
| 108 | 102 | |
| 109 | 103 | def test_corpus_with_no_preferences_returns_empty(self, tmp_path: Path) -> None: |
| 110 | 104 | s = _store(tmp_path) |
| 111 | 105 | s.append(_snap("a" * 16, "prose", "hello", added=datetime(2026, 1, 1))) |
| 112 | 106 | s.append(_snap("b" * 16, "instruction", "### Q\nq\n### A\na", added=datetime(2026, 1, 1))) |
| 113 | - rows = s.sample_preference_rows( | |
| 114 | - k=2, now=datetime(2026, 4, 1), rng=random.Random(0) | |
| 115 | - ) | |
| 107 | + rows = s.sample_preference_rows(k=2, now=datetime(2026, 4, 1), rng=random.Random(0)) | |
| 116 | 108 | assert rows == [] |
| 117 | 109 | |
| 118 | 110 | def test_filters_to_preferences_only(self, tmp_path: Path) -> None: |
@@ -120,9 +112,7 @@ class TestSamplePreferenceRows: | ||
| 120 | 112 | s.append(_snap("a" * 16, "prose", "prose body", added=datetime(2026, 1, 1))) |
| 121 | 113 | s.append(_snap("b" * 16, "preference", _PREF_BODY_A, added=datetime(2026, 1, 1))) |
| 122 | 114 | s.append(_snap("c" * 16, "preference", _PREF_BODY_B, added=datetime(2026, 1, 2))) |
| 123 | - rows = s.sample_preference_rows( | |
| 124 | - k=10, now=datetime(2026, 4, 1), rng=random.Random(0) | |
| 125 | - ) | |
| 115 | + rows = s.sample_preference_rows(k=10, now=datetime(2026, 4, 1), rng=random.Random(0)) | |
| 126 | 116 | assert len(rows) == 2 |
| 127 | 117 | assert {r["prompt"] for r in rows} == {"qA", "qB"} |
| 128 | 118 | assert all("chosen" in r and "rejected" in r for r in rows) |
@@ -133,15 +123,11 @@ class TestSamplePreferenceRows: | ||
| 133 | 123 | sid = f"{i:016x}" |
| 134 | 124 | body = f"### Prompt\nq{i}\n### Chosen\nc{i}\n### Rejected\nr{i}" |
| 135 | 125 | s.append(_snap(sid, "preference", body, added=datetime(2026, 1, 1))) |
| 136 | - rows = s.sample_preference_rows( | |
| 137 | - k=2, now=datetime(2026, 4, 1), rng=random.Random(0) | |
| 138 | - ) | |
| 126 | + rows = s.sample_preference_rows(k=2, now=datetime(2026, 4, 1), rng=random.Random(0)) | |
| 139 | 127 | assert len(rows) == 2 |
| 140 | 128 | |
| 141 | 129 | def test_replay_sid_prefix_applied(self, tmp_path: Path) -> None: |
| 142 | 130 | s = _store(tmp_path) |
| 143 | 131 | s.append(_snap("a" * 16, "preference", _PREF_BODY_A, added=datetime(2026, 1, 1))) |
| 144 | - rows = s.sample_preference_rows( | |
| 145 | - k=1, now=datetime(2026, 4, 1), rng=random.Random(0) | |
| 146 | - ) | |
| 132 | + rows = s.sample_preference_rows(k=1, now=datetime(2026, 4, 1), rng=random.Random(0)) | |
| 147 | 133 | assert rows[0]["_dlm_section_id"].startswith("replay:") |
tests/unit/store/test_inspect_named_adapters.py modified @@ -72,9 +72,7 @@ class TestMultiAdapterDiscovery: | ||
| 72 | 72 | |
| 73 | 73 | inspection = inspect_store(store) |
| 74 | 74 | assert inspection.named_adapters == [ |
| 75 | - NamedAdapterState( | |
| 76 | - name="knowledge", has_current=False, latest_version=1 | |
| 77 | - ) | |
| 75 | + NamedAdapterState(name="knowledge", has_current=False, latest_version=1) | |
| 78 | 76 | ] |
| 79 | 77 | |
| 80 | 78 | def test_empty_adapter_dir_without_versions_skipped(self, tmp_path: Path) -> None: |
tests/unit/store/test_paths_named_adapters.py modified @@ -26,17 +26,11 @@ class TestNamedAdapterPaths: | ||
| 26 | 26 | |
| 27 | 27 | def test_adapter_version_for_name_pads_four_digits(self, tmp_path: Path) -> None: |
| 28 | 28 | s = _store(tmp_path) |
| 29 | - assert ( | |
| 30 | - s.adapter_version_for("tone", 7) | |
| 31 | - == s.adapter / "tone" / "versions" / "v0007" | |
| 32 | - ) | |
| 29 | + assert s.adapter_version_for("tone", 7) == s.adapter / "tone" / "versions" / "v0007" | |
| 33 | 30 | |
| 34 | 31 | def test_pointer_path_for_name(self, tmp_path: Path) -> None: |
| 35 | 32 | s = _store(tmp_path) |
| 36 | - assert ( | |
| 37 | - s.adapter_current_pointer_for("knowledge") | |
| 38 | - == s.adapter / "knowledge" / "current.txt" | |
| 39 | - ) | |
| 33 | + assert s.adapter_current_pointer_for("knowledge") == s.adapter / "knowledge" / "current.txt" | |
| 40 | 34 | |
| 41 | 35 | |
| 42 | 36 | class TestNamedAdapterValidation: |
tests/unit/templates/test_registry.py modified @@ -25,8 +25,7 @@ def test_bundled_templates_dir_exists() -> None: | ||
| 25 | 25 | def test_list_bundled_returns_eight_templates() -> None: |
| 26 | 26 | templates = list_bundled() |
| 27 | 27 | assert len(templates) >= 8, ( |
| 28 | - f"expected at least 8 templates, got {len(templates)}: " | |
| 29 | - f"{[t.name for t in templates]}" | |
| 28 | + f"expected at least 8 templates, got {len(templates)}: {[t.name for t in templates]}" | |
| 30 | 29 | ) |
| 31 | 30 | names = {t.name for t in templates} |
| 32 | 31 | required = { |
@@ -69,17 +68,13 @@ def test_registry_drops_template_missing_sidecar(tmp_path: Path) -> None: | ||
| 69 | 68 | |
| 70 | 69 | |
| 71 | 70 | def test_registry_drops_template_with_malformed_meta(tmp_path: Path) -> None: |
| 72 | - (tmp_path / "broken.dlm").write_text( | |
| 73 | - "---\ndlm_id: 01AAAA\nbase_model: foo\n---\n# body\n" | |
| 74 | - ) | |
| 71 | + (tmp_path / "broken.dlm").write_text("---\ndlm_id: 01AAAA\nbase_model: foo\n---\n# body\n") | |
| 75 | 72 | (tmp_path / "broken.meta.yaml").write_text("not: a: valid: yaml: mapping\n") |
| 76 | 73 | assert list_bundled(gallery_dir=tmp_path) == [] |
| 77 | 74 | |
| 78 | 75 | |
| 79 | 76 | def test_load_template_with_mismatched_name_raises(tmp_path: Path) -> None: |
| 80 | - (tmp_path / "fine.dlm").write_text( | |
| 81 | - "---\ndlm_id: 01AAAA\nbase_model: foo\n---\n# body\n" | |
| 82 | - ) | |
| 77 | + (tmp_path / "fine.dlm").write_text("---\ndlm_id: 01AAAA\nbase_model: foo\n---\n# body\n") | |
| 83 | 78 | # meta.name doesn't match the filename stem. |
| 84 | 79 | (tmp_path / "fine.meta.yaml").write_text( |
| 85 | 80 | "name: different\ntitle: X\nrecommended_base: qwen2.5-1.5b\nsummary: hi\n" |
tests/unit/test_templates_parse.py modified @@ -23,8 +23,7 @@ def test_templates_dir_is_populated() -> None: | ||
| 23 | 23 | # Guard against a silent deletion of the bundled gallery. |
| 24 | 24 | paths = _template_paths() |
| 25 | 25 | assert len(paths) >= 8, ( |
| 26 | - f"expected at least 8 gallery templates under {bundled_templates_dir()}, " | |
| 27 | - f"got {len(paths)}" | |
| 26 | + f"expected at least 8 gallery templates under {bundled_templates_dir()}, got {len(paths)}" | |
| 28 | 27 | ) |
| 29 | 28 | |
| 30 | 29 | |
tests/unit/train/cpt/test_embed_warmup.py modified @@ -23,9 +23,7 @@ class _FakeParam: | ||
| 23 | 23 | self.requires_grad = requires_grad |
| 24 | 24 | |
| 25 | 25 | |
| 26 | -def _model( | |
| 27 | - *, embed_frozen: bool = True, head_frozen: bool = True, tied: bool = False | |
| 28 | -) -> Any: | |
| 26 | +def _model(*, embed_frozen: bool = True, head_frozen: bool = True, tied: bool = False) -> Any: | |
| 29 | 27 | embed_param = _FakeParam(requires_grad=not embed_frozen) |
| 30 | 28 | head_param = embed_param if tied else _FakeParam(requires_grad=not head_frozen) |
| 31 | 29 | embed_module = SimpleNamespace(weight=embed_param) |
@@ -77,9 +75,9 @@ class TestExtendModulesToSave: | ||
| 77 | 75 | assert extend_modules_to_save_for_embed_warmup(None, embed_warmup_steps=0) is None |
| 78 | 76 | |
| 79 | 77 | def test_zero_warmup_passes_through_list(self) -> None: |
| 80 | - assert extend_modules_to_save_for_embed_warmup( | |
| 81 | - ["embed_tokens"], embed_warmup_steps=0 | |
| 82 | - ) == ["embed_tokens"] | |
| 78 | + assert extend_modules_to_save_for_embed_warmup(["embed_tokens"], embed_warmup_steps=0) == [ | |
| 79 | + "embed_tokens" | |
| 80 | + ] | |
| 83 | 81 | |
| 84 | 82 | def test_warmup_on_with_no_existing(self) -> None: |
| 85 | 83 | out = extend_modules_to_save_for_embed_warmup(None, embed_warmup_steps=50) |
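For context on the reflowed calls above: the behaviour these tests pin down is that `embed_warmup_steps=0` is a strict pass-through (including `None`), while a positive warmup extends `modules_to_save` with the embedding modules. A sketch under that assumption — the truncated hunk does not show what the positive-warmup case returns, so the module names added here (`embed_tokens`) are illustrative only:

```python
def extend_modules_to_save_for_embed_warmup(
    existing: list[str] | None, *, embed_warmup_steps: int
) -> list[str] | None:
    if embed_warmup_steps <= 0:
        return existing  # pass-through, including None
    modules = list(existing or [])
    for name in ("embed_tokens",):  # assumed; the real list may also cover a tied/untied lm_head
        if name not in modules:
            modules.append(name)
    return modules
```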
tests/unit/train/cpt/test_schedule.py modified @@ -19,29 +19,20 @@ class TestWarmupRamp: | ||
| 19 | 19 | assert cosine_with_floor_lr(0, total_steps=100, warmup_steps=20) == 0.0 |
| 20 | 20 | |
| 21 | 21 | def test_half_warmup_is_half(self) -> None: |
| 22 | - assert cosine_with_floor_lr( | |
| 23 | - 10, total_steps=100, warmup_steps=20 | |
| 24 | - ) == pytest.approx(0.5) | |
| 22 | + assert cosine_with_floor_lr(10, total_steps=100, warmup_steps=20) == pytest.approx(0.5) | |
| 25 | 23 | |
| 26 | 24 | def test_warmup_end_is_peak(self) -> None: |
| 27 | 25 | # step == warmup_steps: first step of decay phase; cosine is 1.0 |
| 28 | 26 | # at decay_progress=0, so we're at peak. |
| 29 | - assert cosine_with_floor_lr( | |
| 30 | - 20, total_steps=100, warmup_steps=20 | |
| 31 | - ) == pytest.approx(1.0) | |
| 27 | + assert cosine_with_floor_lr(20, total_steps=100, warmup_steps=20) == pytest.approx(1.0) | |
| 32 | 28 | |
| 33 | 29 | def test_zero_warmup_jumps_to_peak(self) -> None: |
| 34 | - assert cosine_with_floor_lr( | |
| 35 | - 0, total_steps=100, warmup_steps=0 | |
| 36 | - ) == pytest.approx(1.0) | |
| 30 | + assert cosine_with_floor_lr(0, total_steps=100, warmup_steps=0) == pytest.approx(1.0) | |
| 37 | 31 | |
| 38 | 32 | |
| 39 | 33 | class TestCosineDecay: |
| 40 | 34 | def test_monotone_decrease_through_decay(self) -> None: |
| 41 | - lrs = [ | |
| 42 | - cosine_with_floor_lr(s, total_steps=100, warmup_steps=20) | |
| 43 | - for s in range(20, 100, 5) | |
| 44 | - ] | |
| 35 | + lrs = [cosine_with_floor_lr(s, total_steps=100, warmup_steps=20) for s in range(20, 100, 5)] | |
| 45 | 36 | for a, b in zip(lrs, lrs[1:], strict=False): |
| 46 | 37 | assert a > b |
| 47 | 38 | |
@@ -66,9 +57,7 @@ class TestCosineDecay: | ||
| 66 | 57 | # Midpoint of cosine decay (decay_progress=0.5) gives cos(pi/2)=0, |
| 67 | 58 | # so cosine multiplier = 0.5 → LR = floor + (1-floor)*0.5 |
| 68 | 59 | floor = 0.1 |
| 69 | - mid = cosine_with_floor_lr( | |
| 70 | - 60, total_steps=100, warmup_steps=20, floor_ratio=floor | |
| 71 | - ) | |
| 60 | + mid = cosine_with_floor_lr(60, total_steps=100, warmup_steps=20, floor_ratio=floor) | |
| 72 | 61 | expected = floor + (1.0 - floor) * 0.5 |
| 73 | 62 | assert mid == pytest.approx(expected) |
| 74 | 63 | |
@@ -97,9 +86,7 @@ class TestInputValidation: | ||
| 97 | 86 | @pytest.mark.parametrize("bad", [-0.01, 1.01, 2.0]) |
| 98 | 87 | def test_floor_ratio_out_of_range(self, bad: float) -> None: |
| 99 | 88 | with pytest.raises(ValueError, match="floor_ratio must be in"): |
| 100 | - cosine_with_floor_lr( | |
| 101 | - 0, total_steps=100, warmup_steps=10, floor_ratio=bad | |
| 102 | - ) | |
| 89 | + cosine_with_floor_lr(0, total_steps=100, warmup_steps=10, floor_ratio=bad) | |
| 103 | 90 | |
| 104 | 91 | |
| 105 | 92 | class TestDefaultConstants: |
@@ -130,11 +117,7 @@ class TestContinuityAcrossWarmup: | ||
| 130 | 117 | # At warmup_steps, cosine is exactly 1. They should differ by |
| 131 | 118 | # ~1/warmup_steps (the ramp's last sub-peak increment). |
| 132 | 119 | warmup = 50 |
| 133 | - last_ramp = cosine_with_floor_lr( | |
| 134 | - warmup - 1, total_steps=200, warmup_steps=warmup | |
| 135 | - ) | |
| 136 | - first_decay = cosine_with_floor_lr( | |
| 137 | - warmup, total_steps=200, warmup_steps=warmup | |
| 138 | - ) | |
| 120 | + last_ramp = cosine_with_floor_lr(warmup - 1, total_steps=200, warmup_steps=warmup) | |
| 121 | + first_decay = cosine_with_floor_lr(warmup, total_steps=200, warmup_steps=warmup) | |
| 139 | 122 | assert first_decay == pytest.approx(1.0) |
| 140 | 123 | assert math.isclose(first_decay - last_ramp, 1 / warmup, abs_tol=1e-9) |
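The reflowed assertions above fully determine the shape of `cosine_with_floor_lr`: a linear ramp from 0 to the peak over `warmup_steps`, then a cosine decay from 1.0 down to `floor_ratio`. A sketch that satisfies every assertion visible in this file — the `floor_ratio` default and any validation beyond the `floor_ratio must be in` check are assumptions:

```python
import math


def cosine_with_floor_lr(
    step: int, *, total_steps: int, warmup_steps: int, floor_ratio: float = 0.1
) -> float:
    """LR multiplier: linear ramp during warmup, then cosine decay to floor_ratio."""
    if not 0.0 <= floor_ratio <= 1.0:
        raise ValueError("floor_ratio must be in [0, 1]")
    if warmup_steps and step < warmup_steps:
        return step / warmup_steps  # 0.0 at step 0, 0.5 halfway, peak reached at warmup_steps
    decay_progress = (step - warmup_steps) / max(1, total_steps - warmup_steps)
    cosine = 0.5 * (1.0 + math.cos(math.pi * decay_progress))  # 1.0 at the peak, 0.0 at the end
    return floor_ratio + (1.0 - floor_ratio) * cosine


# Midpoint of the decay (step 60 of 100 with 20 warmup steps): cos(pi/2) = 0, so the
# multiplier is floor + (1 - floor) * 0.5 — exactly what the mid-decay test expects.
assert math.isclose(
    cosine_with_floor_lr(60, total_steps=100, warmup_steps=20, floor_ratio=0.1), 0.1 + 0.9 * 0.5
)
```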
tests/unit/train/cpt/test_vocab_gap.py modified @@ -17,9 +17,7 @@ from dlm.train.cpt.vocab_gap import ( | ||
| 17 | 17 | |
| 18 | 18 | class TestComputeVocabGap: |
| 19 | 19 | def test_empty_inputs(self) -> None: |
| 20 | - r = compute_vocab_gap( | |
| 21 | - [], text="", unk_token_id=None, decoded_tokens=[] | |
| 22 | - ) | |
| 20 | + r = compute_vocab_gap([], text="", unk_token_id=None, decoded_tokens=[]) | |
| 23 | 21 | assert r.total_tokens == 0 |
| 24 | 22 | assert r.total_words == 0 |
| 25 | 23 | assert r.tokens_per_word == 0.0 |
@@ -113,9 +111,7 @@ class TestComputeVocabGapValidation: | ||
| 113 | 111 | |
| 114 | 112 | def test_negative_top_n_rejected(self) -> None: |
| 115 | 113 | with pytest.raises(ValueError, match="top_n must be non-negative"): |
| 116 | - compute_vocab_gap( | |
| 117 | - [], text="", unk_token_id=None, decoded_tokens=[], top_n=-1 | |
| 118 | - ) | |
| 114 | + compute_vocab_gap([], text="", unk_token_id=None, decoded_tokens=[], top_n=-1) | |
| 119 | 115 | |
| 120 | 116 | |
| 121 | 117 | class TestRenderReport: |
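The vocab-gap probe's headline ratio follows from the empty-input test above: token and word totals plus tokens-per-word, returning 0.0 rather than dividing by zero on empty input. A reduced sketch of just that ratio — the real `compute_vocab_gap` also takes `unk_token_id`, `decoded_tokens`, and a `top_n` report of the worst-split words, all omitted here:

```python
def tokens_per_word(token_ids: list[int], text: str) -> float:
    # How many sub-tokens the tokenizer spends per whitespace-separated word; a high
    # ratio on domain text suggests the base vocabulary splits that jargon heavily.
    total_tokens = len(token_ids)
    total_words = len(text.split())
    return total_tokens / total_words if total_words else 0.0


assert tokens_per_word([], "") == 0.0  # matches the empty-input expectations above
assert tokens_per_word([101, 7, 993, 42], "two words") == 2.0
```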
tests/unit/train/distributed/test_rank_env.py modified @@ -40,9 +40,7 @@ class TestDetectRank: | ||
| 40 | 40 | monkeypatch.delenv("LOCAL_RANK", raising=False) |
| 41 | 41 | assert detect_rank() == 0 |
| 42 | 42 | |
| 43 | - def test_rank_takes_precedence_over_local_rank( | |
| 44 | - self, monkeypatch: pytest.MonkeyPatch | |
| 45 | - ) -> None: | |
| 43 | + def test_rank_takes_precedence_over_local_rank(self, monkeypatch: pytest.MonkeyPatch) -> None: | |
| 46 | 44 | monkeypatch.setenv("RANK", "3") |
| 47 | 45 | monkeypatch.setenv("LOCAL_RANK", "1") |
| 48 | 46 | assert detect_rank() == 3 |
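The precedence these tests encode — `RANK` beats `LOCAL_RANK`, and an unset environment means rank 0 — fits in a few lines. A sketch consistent with the visible assertions; handling of non-numeric values is not covered by these tests and is left out:

```python
import os


def detect_rank() -> int:
    # torchrun-style launchers export RANK (global) and LOCAL_RANK (per-node);
    # the global rank wins, and a plain single-process run defaults to rank 0.
    for var in ("RANK", "LOCAL_RANK"):
        value = os.environ.get(var)
        if value is not None:
            return int(value)
    return 0
```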
tests/unit/train/multi_adapter/test_orchestrator.py modified @@ -92,18 +92,14 @@ def _single_adapter_parsed(dlm_id: str) -> ParsedDlm: | ||
| 92 | 92 | base_model="smollm2-135m", |
| 93 | 93 | training=TrainingConfig(seed=42), |
| 94 | 94 | ), |
| 95 | - sections=( | |
| 96 | - Section(type=SectionType.PROSE, content="Single-adapter prose."), | |
| 97 | - ), | |
| 95 | + sections=(Section(type=SectionType.PROSE, content="Single-adapter prose."),), | |
| 98 | 96 | ) |
| 99 | 97 | |
| 100 | 98 | |
| 101 | 99 | def _seed_store(tmp_path: Path, dlm_id: str) -> Any: |
| 102 | 100 | store = for_dlm(dlm_id, home=tmp_path) |
| 103 | 101 | store.ensure_layout() |
| 104 | - save_manifest( | |
| 105 | - store.manifest, Manifest(dlm_id=dlm_id, base_model="smollm2-135m") | |
| 106 | - ) | |
| 102 | + save_manifest(store.manifest, Manifest(dlm_id=dlm_id, base_model="smollm2-135m")) | |
| 107 | 103 | return store |
| 108 | 104 | |
| 109 | 105 | |
@@ -220,9 +216,7 @@ class TestMultiAdapterOrchestration: | ||
| 220 | 216 | # Flat field stays at 0 (untouched) for multi-adapter stores. |
| 221 | 217 | assert manifest.adapter_version == 0 |
| 222 | 218 | |
| 223 | - def test_training_run_summaries_carry_adapter_name( | |
| 224 | - self, tmp_path: Path | |
| 225 | - ) -> None: | |
| 219 | + def test_training_run_summaries_carry_adapter_name(self, tmp_path: Path) -> None: | |
| 226 | 220 | """Audit-07 M1: each TrainingRunSummary is tagged with the name.""" |
| 227 | 221 | dlm_id = "01HZ4X7TGZM3J1A2B3C4D5E6FB" |
| 228 | 222 | store = _seed_store(tmp_path, dlm_id) |
tests/unit/train/multi_adapter/test_router.py modified @@ -60,9 +60,7 @@ class TestProseFansOut: | ||
| 60 | 60 | prose_in_knowledge = [ |
| 61 | 61 | s for s in plan.by_adapter["knowledge"] if s.type is SectionType.PROSE |
| 62 | 62 | ] |
| 63 | - prose_in_tone = [ | |
| 64 | - s for s in plan.by_adapter["tone"] if s.type is SectionType.PROSE | |
| 65 | - ] | |
| 63 | + prose_in_tone = [s for s in plan.by_adapter["tone"] if s.type is SectionType.PROSE] | |
| 66 | 64 | assert len(prose_in_knowledge) == 1 |
| 67 | 65 | assert len(prose_in_tone) == 1 |
| 68 | 66 | |
@@ -80,38 +78,23 @@ class TestInstructionRouting: | ||
| 80 | 78 | parsed = parse_text(_doc(body, multi_adapter=True)) |
| 81 | 79 | plan = build_plan(parsed) |
| 82 | 80 | # First-declared is "knowledge". |
| 83 | - assert any( | |
| 84 | - s.type is SectionType.INSTRUCTION | |
| 85 | - for s in plan.by_adapter["knowledge"] | |
| 86 | - ) | |
| 87 | - assert not any( | |
| 88 | - s.type is SectionType.INSTRUCTION for s in plan.by_adapter["tone"] | |
| 89 | - ) | |
| 81 | + assert any(s.type is SectionType.INSTRUCTION for s in plan.by_adapter["knowledge"]) | |
| 82 | + assert not any(s.type is SectionType.INSTRUCTION for s in plan.by_adapter["tone"]) | |
| 90 | 83 | |
| 91 | 84 | def test_tagged_instruction_goes_to_named_adapter(self) -> None: |
| 92 | 85 | body = "::instruction#tone::\n### Q\nhi\n### A\nbye\n" |
| 93 | 86 | parsed = parse_text(_doc(body, multi_adapter=True)) |
| 94 | 87 | plan = build_plan(parsed) |
| 95 | - assert not any( | |
| 96 | - s.type is SectionType.INSTRUCTION | |
| 97 | - for s in plan.by_adapter["knowledge"] | |
| 98 | - ) | |
| 99 | - assert any( | |
| 100 | - s.type is SectionType.INSTRUCTION for s in plan.by_adapter["tone"] | |
| 101 | - ) | |
| 88 | + assert not any(s.type is SectionType.INSTRUCTION for s in plan.by_adapter["knowledge"]) | |
| 89 | + assert any(s.type is SectionType.INSTRUCTION for s in plan.by_adapter["tone"]) | |
| 102 | 90 | |
| 103 | 91 | |
| 104 | 92 | class TestPreferenceRouting: |
| 105 | 93 | def test_tagged_preference_goes_to_named_adapter(self) -> None: |
| 106 | - body = ( | |
| 107 | - "::preference#tone::\n" | |
| 108 | - "### Prompt\nq\n### Chosen\nc\n### Rejected\nr\n" | |
| 109 | - ) | |
| 94 | + body = "::preference#tone::\n### Prompt\nq\n### Chosen\nc\n### Rejected\nr\n" | |
| 110 | 95 | parsed = parse_text(_doc(body, multi_adapter=True)) |
| 111 | 96 | plan = build_plan(parsed) |
| 112 | - assert any( | |
| 113 | - s.type is SectionType.PREFERENCE for s in plan.by_adapter["tone"] | |
| 114 | - ) | |
| 97 | + assert any(s.type is SectionType.PREFERENCE for s in plan.by_adapter["tone"]) | |
| 115 | 98 | |
| 116 | 99 | |
| 117 | 100 | class TestUnknownAdapter: |
@@ -129,10 +112,7 @@ class TestUnknownAdapter:
| 129 | 112 | |
| 130 | 113 | class TestSingleAdapterDoc: |
| 131 | 114 | def test_single_adapter_doc_routes_all_to_default(self) -> None: |
| 132 | - body = ( | |
| 133 | - "# Prose\n\nShared.\n\n" | |
| 134 | - "::instruction::\n### Q\nh\n### A\nb\n" | |
| 135 | - ) | |
| 115 | + body = "# Prose\n\nShared.\n\n::instruction::\n### Q\nh\n### A\nb\n" | |
| 136 | 116 | parsed = parse_text(_doc(body, multi_adapter=False)) |
| 137 | 117 | plan = build_plan(parsed) |
| 138 | 118 | assert set(plan.by_adapter) == {"default"} |
@@ -149,10 +129,7 @@ class TestSingleAdapterDoc:
| 149 | 129 | |
| 150 | 130 | class TestSectionsForShortcut: |
| 151 | 131 | def test_returns_same_as_plan_entry(self) -> None: |
| 152 | - body = ( | |
| 153 | - "shared prose\n\n" | |
| 154 | - "::instruction#tone::\n### Q\nh\n### A\nb\n" | |
| 155 | - ) | |
| 132 | + body = "shared prose\n\n::instruction#tone::\n### Q\nh\n### A\nb\n" | |
| 156 | 133 | parsed = parse_text(_doc(body, multi_adapter=True)) |
| 157 | 134 | plan = build_plan(parsed) |
| 158 | 135 | assert sections_for(parsed, "tone") == plan.by_adapter["tone"] |
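The router tests above pin down three dispatch rules: prose sections fan out to every declared adapter, an untagged `::instruction::` block goes to the first-declared adapter, and a `#name`-tagged section goes only to the named adapter. A minimal, self-contained sketch of that dispatch logic — not the project's `build_plan` implementation; the `Section` type and field names here are illustrative only — could look like:

```python
from dataclasses import dataclass


@dataclass(frozen=True)
class Section:
    type: str                    # "prose", "instruction", "preference", ...
    content: str
    adapter: str | None = None   # parsed from "::instruction#tone::"; None when untagged


def route(sections: list[Section], adapters: list[str]) -> dict[str, list[Section]]:
    """Toy router mirroring the rules the tests above assert."""
    plan: dict[str, list[Section]] = {name: [] for name in adapters}
    first = adapters[0]  # first-declared adapter receives untagged non-prose sections
    for s in sections:
        if s.type == "prose":
            for name in adapters:        # prose fans out to every adapter
                plan[name].append(s)
        elif s.adapter is not None:
            plan[s.adapter].append(s)    # tagged sections go only to the named adapter
        else:
            plan[first].append(s)        # untagged sections default to first-declared
    return plan


plan = route(
    [Section("prose", "Shared."), Section("instruction", "Q/A", adapter="tone")],
    adapters=["knowledge", "tone"],
)
assert [s.type for s in plan["tone"]] == ["prose", "instruction"]
assert [s.type for s in plan["knowledge"]] == ["prose"]
```

The sketch skips the unknown-adapter error path exercised by `TestUnknownAdapter`; it only illustrates the happy-path routing.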
tests/unit/train/preference/test_determinism_plumbing.py (modified) @@ -90,9 +90,7 @@ def _seed_store(tmp_path: Path, dlm_id: str) -> Any:
| 90 | 90 | |
| 91 | 91 | |
| 92 | 92 | class TestDpoSeedsRngBeforeTraining: |
| 93 | - def test_explicit_seed_flows_through_to_seed_everything( | |
| 94 | - self, tmp_path: Path | |
| 95 | - ) -> None: | |
| 93 | + def test_explicit_seed_flows_through_to_seed_everything(self, tmp_path: Path) -> None: | |
| 96 | 94 | from dlm.train.preference.dpo_phase import run |
| 97 | 95 | |
| 98 | 96 | store = _seed_store(tmp_path, "01KDPOSEED" + "0" * 16) |
@@ -100,9 +98,7 @@ class TestDpoSeedsRngBeforeTraining:
| 100 | 98 | |
| 101 | 99 | with patch( |
| 102 | 100 | "dlm.train.preference.dpo_phase.seed_everything", |
| 103 | - wraps=__import__( | |
| 104 | - "dlm.train.determinism", fromlist=["seed_everything"] | |
| 105 | - ).seed_everything, | |
| 101 | + wraps=__import__("dlm.train.determinism", fromlist=["seed_everything"]).seed_everything, | |
| 106 | 102 | ) as spy: |
| 107 | 103 | run( |
| 108 | 104 | store, |
@@ -123,9 +119,7 @@ class TestDpoSeedsRngBeforeTraining:
| 123 | 119 | |
| 124 | 120 | with patch( |
| 125 | 121 | "dlm.train.preference.dpo_phase.seed_everything", |
| 126 | - wraps=__import__( | |
| 127 | - "dlm.train.determinism", fromlist=["seed_everything"] | |
| 128 | - ).seed_everything, | |
| 122 | + wraps=__import__("dlm.train.determinism", fromlist=["seed_everything"]).seed_everything, | |
| 129 | 123 | ) as spy: |
| 130 | 124 | run( |
| 131 | 125 | store, |
@@ -148,9 +142,7 @@ class TestOrpoSeedsRngBeforeTraining:
| 148 | 142 | |
| 149 | 143 | with patch( |
| 150 | 144 | "dlm.train.preference.orpo_phase.seed_everything", |
| 151 | - wraps=__import__( | |
| 152 | - "dlm.train.determinism", fromlist=["seed_everything"] | |
| 153 | - ).seed_everything, | |
| 145 | + wraps=__import__("dlm.train.determinism", fromlist=["seed_everything"]).seed_everything, | |
| 154 | 146 | ) as spy: |
| 155 | 147 | run( |
| 156 | 148 | store, |
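These determinism tests use `unittest.mock.patch(..., wraps=...)` as a behavior-preserving spy: the name is replaced inside the phase module, the resulting mock records every call, and `wraps=` makes it delegate to the real `seed_everything`, so the RNG is genuinely seeded while the test asserts on the arguments. A standalone illustration of that pattern — the seeding helper below is a stand-in, not the project's function:

```python
import random
from unittest.mock import patch


def seed_everything(seed: int) -> None:
    """Stand-in for a real seeding helper."""
    random.seed(seed)


# The real tests patch the name as seen by the phase module
# (e.g. "dlm.train.preference.dpo_phase.seed_everything"); here we patch it
# in this module's own namespace purely to show the wraps= spy behaviour.
with patch(f"{__name__}.seed_everything", wraps=seed_everything) as spy:
    seed_everything(42)               # the real function still runs (RNG is seeded)...
    spy.assert_called_once_with(42)   # ...and the spy recorded the call
```

Extra keyword arguments to `patch()` are forwarded to the `MagicMock` it constructs, which is why `wraps=` works here without building the mock by hand.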
tests/unit/train/preference/test_dpo_dataset.py (modified) @@ -12,9 +12,7 @@ from dlm.train.preference.dpo_dataset import (
| 12 | 12 | ) |
| 13 | 13 | |
| 14 | 14 | _PREF_BODY_ONE = ( |
| 15 | - "### Prompt\nWhat time is it?\n" | |
| 16 | - "### Chosen\nIt is 3 PM.\n" | |
| 17 | - "### Rejected\nTime is an illusion.\n" | |
| 15 | + "### Prompt\nWhat time is it?\n### Chosen\nIt is 3 PM.\n### Rejected\nTime is an illusion.\n" | |
| 18 | 16 | ) |
| 19 | 17 | |
| 20 | 18 | _PREF_BODY_TWO = ( |
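The `### Prompt` / `### Chosen` / `### Rejected` bodies above are the on-disk shape of one preference pair. A minimal, self-contained parser for that shape — illustrative only; the project's actual parsing lives in `dlm.train.preference.dpo_dataset` and may differ — might look like:

```python
import re


def parse_preference_block(body: str) -> tuple[str, str, str]:
    """Split one preference section into (prompt, chosen, rejected).

    Assumes each of the three '### ' headings appears exactly once.
    """
    parts = re.split(r"^### (Prompt|Chosen|Rejected)\s*$", body, flags=re.MULTILINE)
    fields = {parts[i]: parts[i + 1].strip() for i in range(1, len(parts) - 1, 2)}
    return fields["Prompt"], fields["Chosen"], fields["Rejected"]


prompt, chosen, rejected = parse_preference_block(
    "### Prompt\nWhat time is it?\n### Chosen\nIt is 3 PM.\n### Rejected\nTime is an illusion.\n"
)
assert prompt == "What time is it?"
assert rejected == "Time is an illusion."
```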
tests/unit/train/preference/test_dpo_phase.py (modified) @@ -23,20 +23,14 @@ from dlm.train.state_sidecar import STATE_FILENAME, STATE_SHA_FILENAME
| 23 | 23 | |
| 24 | 24 | |
| 25 | 25 | def _parsed_with_preferences() -> ParsedDlm: |
| 26 | - pref_body = ( | |
| 27 | - "### Prompt\nq?\n### Chosen\nc.\n### Rejected\nr.\n" | |
| 28 | - ) | |
| 26 | + pref_body = "### Prompt\nq?\n### Chosen\nc.\n### Rejected\nr.\n" | |
| 29 | 27 | return ParsedDlm( |
| 30 | 28 | frontmatter=DlmFrontmatter( |
| 31 | 29 | dlm_id="01KABCD" + "0" * 19, |
| 32 | 30 | base_model="smollm2-135m", |
| 33 | - training=TrainingConfig( | |
| 34 | - seed=42, preference=PreferenceConfig(enabled=True) | |
| 35 | - ), | |
| 36 | - ), | |
| 37 | - sections=( | |
| 38 | - Section(type=SectionType.PREFERENCE, content=pref_body), | |
| 31 | + training=TrainingConfig(seed=42, preference=PreferenceConfig(enabled=True)), | |
| 39 | 32 | ), |
| 33 | + sections=(Section(type=SectionType.PREFERENCE, content=pref_body),), | |
| 40 | 34 | ) |
| 41 | 35 | |
| 42 | 36 | |
tests/unit/train/preference/test_dpo_trainer.py (modified) @@ -42,13 +42,9 @@ class TestCoreFields:
| 42 | 42 | cfg = PreferenceConfig( |
| 43 | 43 | enabled=True, |
| 44 | 44 | loss_type="ipo", |
| 45 | - hyperparams=PreferenceHyperparams( | |
| 46 | - beta=0.2, learning_rate=3e-6, num_epochs=2 | |
| 47 | - ), | |
| 48 | - ) | |
| 49 | - kwargs = build_dpo_config_kwargs( | |
| 50 | - cfg, _plan(), output_dir=tmp_path, max_length=1024, seed=7 | |
| 45 | + hyperparams=PreferenceHyperparams(beta=0.2, learning_rate=3e-6, num_epochs=2), | |
| 51 | 46 | ) |
| 47 | + kwargs = build_dpo_config_kwargs(cfg, _plan(), output_dir=tmp_path, max_length=1024, seed=7) | |
| 52 | 48 | assert kwargs["output_dir"] == str(tmp_path) |
| 53 | 49 | assert kwargs["learning_rate"] == 3e-6 |
| 54 | 50 | assert kwargs["num_train_epochs"] == 2 |
tests/unit/train/preference/test_method_registry.py (modified) @@ -46,6 +46,7 @@ class TestRegisterCanReplace:
| 46 | 46 | def test_register_overrides_existing(self) -> None: |
| 47 | 47 | saved = resolve("dpo") |
| 48 | 48 | try: |
| 49 | + | |
| 49 | 50 | def _stub(*args: object, **kwargs: object) -> str: # type: ignore[return-value] |
| 50 | 51 | return "stub" |
| 51 | 52 | |
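The only change in this file is whitespace: with the formatter settings used here, `ruff format` separates a nested `def` from the compound-statement header above it with one blank line, which is why the hunk adds an empty line between `try:` and `_stub`. A toy before/after, assuming the same formatter behaviour as shown in the hunk:

```python
# Before formatting: the stub definition sits directly under `try:`.
try:
    def _stub() -> str:
        return "stub"
finally:
    pass

# After formatting (mirroring the hunk above): one blank line precedes
# the nested definition.
try:

    def _stub() -> str:
        return "stub"
finally:
    pass
```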
tests/unit/train/preference/test_orpo_phase.py (modified) @@ -34,9 +34,7 @@ def _parsed_with_preferences() -> ParsedDlm:
| 34 | 34 | preference=PreferenceConfig(enabled=True, method="orpo"), |
| 35 | 35 | ), |
| 36 | 36 | ), |
| 37 | - sections=( | |
| 38 | - Section(type=SectionType.PREFERENCE, content=pref_body), | |
| 39 | - ), | |
| 37 | + sections=(Section(type=SectionType.PREFERENCE, content=pref_body),), | |
| 40 | 38 | ) |
| 41 | 39 | |
| 42 | 40 | |
@@ -85,9 +83,7 @@ def _seed_prior_sft(store, dlm_id: str = "01ORPOTEST") -> None: # type: ignore[
| 85 | 83 | store.ensure_layout() |
| 86 | 84 | save_manifest( |
| 87 | 85 | store.manifest, |
| 88 | - Manifest( | |
| 89 | - dlm_id=dlm_id, base_model="smollm2-135m", adapter_version=1 | |
| 90 | - ), | |
| 86 | + Manifest(dlm_id=dlm_id, base_model="smollm2-135m", adapter_version=1), | |
| 91 | 87 | ) |
| 92 | 88 | v0001 = store.adapter_version(1) |
| 93 | 89 | v0001.mkdir(parents=True, exist_ok=True) |
@@ -172,9 +168,7 @@ class TestRunHappyPath:
| 172 | 168 | |
| 173 | 169 | |
| 174 | 170 | class TestRunSteps: |
| 175 | - def test_factory_receives_reference_adapter_version( | |
| 176 | - self, tmp_path: Path | |
| 177 | - ) -> None: | |
| 171 | + def test_factory_receives_reference_adapter_version(self, tmp_path: Path) -> None: | |
| 178 | 172 | captured: dict[str, Any] = {} |
| 179 | 173 | |
| 180 | 174 | def _capturing_factory(**kwargs: Any) -> MagicMock: |
tests/unit/train/preference/test_orpo_trainer.py (modified) @@ -36,9 +36,7 @@ class TestCoreMapping:
| 36 | 36 | cfg = PreferenceConfig( |
| 37 | 37 | enabled=True, |
| 38 | 38 | method="orpo", |
| 39 | - hyperparams=PreferenceHyperparams( | |
| 40 | - alpha=0.15, learning_rate=3e-6, num_epochs=2 | |
| 41 | - ), | |
| 39 | + hyperparams=PreferenceHyperparams(alpha=0.15, learning_rate=3e-6, num_epochs=2), | |
| 42 | 40 | ) |
| 43 | 41 | kwargs = build_orpo_config_kwargs( |
| 44 | 42 | cfg, _plan(), output_dir=tmp_path, max_length=1024, seed=7 |
tests/unit/train/preference/test_phase_orchestrator.py (modified) @@ -45,9 +45,7 @@ def _instruction() -> Section:
| 45 | 45 | def _pref() -> Section: |
| 46 | 46 | return Section( |
| 47 | 47 | type=SectionType.PREFERENCE, |
| 48 | - content=( | |
| 49 | - "### Prompt\nq\n### Chosen\nc\n### Rejected\nr\n" | |
| 50 | - ), | |
| 48 | + content=("### Prompt\nq\n### Chosen\nc\n### Rejected\nr\n"), | |
| 51 | 49 | start_line=1, |
| 52 | 50 | ) |
| 53 | 51 | |
@@ -88,10 +86,7 @@ def _parsed(
| 88 | 86 | who wrote `training.preference.enabled: true/false` in their |
| 89 | 87 | frontmatter. |
| 90 | 88 | """ |
| 91 | - pref = ( | |
| 92 | - PreferenceConfig() if dpo_enabled is None | |
| 93 | - else PreferenceConfig(enabled=dpo_enabled) | |
| 94 | - ) | |
| 89 | + pref = PreferenceConfig() if dpo_enabled is None else PreferenceConfig(enabled=dpo_enabled) | |
| 95 | 90 | return _FakeParsed( |
| 96 | 91 | sections=tuple(sections), |
| 97 | 92 | frontmatter=_FakeFrontmatter(training=_FakeTraining(preference=pref)), |
tests/unit/train/test_resolve_adapter_hparams.py (modified) @@ -23,9 +23,7 @@ def _parsed(training: TrainingConfig) -> ParsedDlm:
| 23 | 23 | |
| 24 | 24 | class TestFlatConfig: |
| 25 | 25 | def test_returns_flat_fields_when_adapter_name_is_none(self) -> None: |
| 26 | - training = TrainingConfig( | |
| 27 | - lora_r=16, lora_alpha=32, lora_dropout=0.1, learning_rate=1e-3 | |
| 28 | - ) | |
| 26 | + training = TrainingConfig(lora_r=16, lora_alpha=32, lora_dropout=0.1, learning_rate=1e-3) | |
| 29 | 27 | r, alpha, dropout, lr = _resolve_adapter_hparams(_parsed(training), None) |
| 30 | 28 | assert (r, alpha, dropout) == (16, 32, pytest.approx(0.1)) |
| 31 | 29 | assert lr == pytest.approx(1e-3) |
@@ -52,32 +50,22 @@ class TestMultiAdapterConfig:
| 52 | 50 | } |
| 53 | 51 | } |
| 54 | 52 | ) |
| 55 | - k_r, k_alpha, _k_drop, _k_lr = _resolve_adapter_hparams( | |
| 56 | - _parsed(training), "knowledge" | |
| 57 | - ) | |
| 58 | - t_r, t_alpha, t_drop, t_lr = _resolve_adapter_hparams( | |
| 59 | - _parsed(training), "tone" | |
| 60 | - ) | |
| 53 | + k_r, k_alpha, _k_drop, _k_lr = _resolve_adapter_hparams(_parsed(training), "knowledge") | |
| 54 | + t_r, t_alpha, t_drop, t_lr = _resolve_adapter_hparams(_parsed(training), "tone") | |
| 61 | 55 | assert (k_r, k_alpha) == (8, 16) |
| 62 | 56 | assert (t_r, t_alpha) == (4, 8) |
| 63 | 57 | assert t_drop == pytest.approx(0.2) |
| 64 | 58 | assert t_lr == pytest.approx(1e-4) |
| 65 | 59 | |
| 66 | 60 | def test_unknown_adapter_name_falls_back_to_flat(self) -> None: |
| 67 | - training = TrainingConfig.model_validate( | |
| 68 | - {"adapters": {"knowledge": {"lora_r": 8}}} | |
| 69 | - ) | |
| 61 | + training = TrainingConfig.model_validate({"adapters": {"knowledge": {"lora_r": 8}}}) | |
| 70 | 62 | # ghost isn't declared; we fall back to defaults rather than crash. |
| 71 | 63 | r, _, _, _ = _resolve_adapter_hparams(_parsed(training), "ghost") |
| 72 | 64 | assert r == 8 # flat default |
| 73 | 65 | |
| 74 | 66 | def test_per_adapter_defaults_when_not_overridden(self) -> None: |
| 75 | - training = TrainingConfig.model_validate( | |
| 76 | - {"adapters": {"default_one": {}}} | |
| 77 | - ) | |
| 78 | - r, alpha, dropout, lr = _resolve_adapter_hparams( | |
| 79 | - _parsed(training), "default_one" | |
| 80 | - ) | |
| 67 | + training = TrainingConfig.model_validate({"adapters": {"default_one": {}}}) | |
| 68 | + r, alpha, dropout, lr = _resolve_adapter_hparams(_parsed(training), "default_one") | |
| 81 | 69 | # AdapterConfig() defaults: r=8, alpha=16, dropout=0.05, lr=2e-4 |
| 82 | 70 | assert (r, alpha) == (8, 16) |
| 83 | 71 | assert dropout == pytest.approx(0.05) |
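The resolution order these tests pin down: a per-adapter entry wins when the name is declared, otherwise the flat defaults apply, and an unknown name falls back rather than raising. A self-contained sketch of that lookup — field names and defaults mirror the comments in the hunk above; the real `_resolve_adapter_hparams` operates on the project's config models, not plain dicts:

```python
from typing import NamedTuple


class Hparams(NamedTuple):
    lora_r: int = 8
    lora_alpha: int = 16
    lora_dropout: float = 0.05
    learning_rate: float = 2e-4


def resolve_hparams(adapters: dict[str, dict[str, float]] | None, name: str | None) -> Hparams:
    """Per-adapter overrides win; unknown or missing names fall back to defaults."""
    if adapters and name in adapters:
        return Hparams(**adapters[name])  # keys not overridden keep the NamedTuple defaults
    return Hparams()


assert resolve_hparams({"tone": {"lora_r": 4, "lora_alpha": 8}}, "tone").lora_r == 4
assert resolve_hparams({"knowledge": {"lora_r": 8}}, "ghost") == Hparams()  # unknown name
```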
tests/unit/watch/test_status.py (modified) @@ -16,23 +16,17 @@ class TestRenderStatus:
| 16 | 16 | |
| 17 | 17 | def test_after_cycle_shows_loss_and_steps(self) -> None: |
| 18 | 18 | status = WatchStatus(doc_path="mydoc.dlm", sections=12) |
| 19 | - status.mark_cycle_done( | |
| 20 | - train_loss=1.2, val_loss=1.35, steps=50, coalesced=1 | |
| 21 | - ) | |
| 19 | + status.mark_cycle_done(train_loss=1.2, val_loss=1.35, steps=50, coalesced=1) | |
| 22 | 20 | line = render_status(status) |
| 23 | 21 | assert "val loss: 1.35" in line |
| 24 | 22 | assert "steps: 50" in line |
| 25 | 23 | |
| 26 | 24 | def test_coalesced_only_shown_when_plural(self) -> None: |
| 27 | 25 | status = WatchStatus(doc_path="d") |
| 28 | - status.mark_cycle_done( | |
| 29 | - train_loss=None, val_loss=None, steps=10, coalesced=1 | |
| 30 | - ) | |
| 26 | + status.mark_cycle_done(train_loss=None, val_loss=None, steps=10, coalesced=1) | |
| 31 | 27 | assert "coalesced" not in render_status(status) |
| 32 | 28 | |
| 33 | - status.mark_cycle_done( | |
| 34 | - train_loss=None, val_loss=None, steps=10, coalesced=5 | |
| 35 | - ) | |
| 29 | + status.mark_cycle_done(train_loss=None, val_loss=None, steps=10, coalesced=5) | |
| 36 | 30 | assert "coalesced: 5" in render_status(status) |
| 37 | 31 | |
| 38 | 32 | def test_age_buckets(self) -> None: |