`e34ec1c`

feat(export): honor DLM_LLAMA_CPP_BUILD env var for ROCm binaries (audit-08 M6)

Authored by

espadonne 3 weeks ago

SHA: e34ec1cb9c06a4b778b0c467bae8afaecc234ee9
Parents: 5aeb871
Tree: 599ab1b

3 changed files

Status	File	+	-
M	`docs/hardware/rocm.md`	4	3
M	`src/dlm/export/vendoring.py`	18	0
M	`tests/unit/export/test_vendoring.py`	41	0

docs/hardware/rocm.md — modified

  export DLM_LLAMA_CPP_BUILD=vendor/llama.cpp/build-rocm
  ```
 -(Environment-variable plumbing in `dlm.export.vendoring` lands as
 -part of the next ROCm polish pass — for now, manually invoke the
 -ROCm binaries if you need them.)
 +`DLM_LLAMA_CPP_BUILD` is honored by `dlm.export.vendoring` — when
 +set, it's checked before the default vendor dir for each binary, so
 +the ROCm-accelerated `llama-quantize` / `llama-imatrix` win over any
 +CPU-only build left behind from `scripts/bump-llama-cpp.sh build`.
  ## CI / testing

src/dlm/export/vendoring.py — modified

  _REPO_ROOT: Final[Path] = Path(__file__).resolve().parents[3]
  VENDOR_LLAMA_CPP: Final[Path] = _REPO_ROOT / "vendor" / "llama.cpp"
  _ENV_VAR: Final[str] = "DLM_LLAMA_CPP_ROOT"
 +_BUILD_ENV_VAR: Final[str] = "DLM_LLAMA_CPP_BUILD"
 +"""Sprint 22 / audit-08 M6: when set, `_resolve_binary` checks
 +`<DLM_LLAMA_CPP_BUILD>/bin/<name>` before the default vendor layout.
 +Lets users point `dlm export` at a HIP-built llama.cpp without
 +rebuilding the vendor dir itself (see docs/hardware/rocm.md)."""
  CONVERT_HF_TO_GGUF: Final[str] = "convert_hf_to_gguf.py"
  CONVERT_LORA_TO_GGUF: Final[str] = "convert_lora_to_gguf.py"
      binary, fall back to `shutil.which(name)` — covers the common
      `brew install llama.cpp` case where the binary lives under
      `/opt/homebrew/bin/`.
++
 +    Audit-08 M6: `$DLM_LLAMA_CPP_BUILD`, when set, is checked BEFORE
 +    the default vendor tree. Lets ROCm users point at the HIP build
 +    dir produced by `scripts/build-llama-cpp-rocm.sh` without
 +    clobbering the CPU build.
      """
 +    if override is None:
 +        build_env = os.environ.get(_BUILD_ENV_VAR)
 +        if build_env:
 +            build_root = Path(build_env)
 +            for candidate in candidates:
 +                path = build_root / candidate
 +                if path.is_file():
 +                    return path
      root = llama_cpp_root(override)
      for candidate in candidates:
          path = root / candidate

tests/unit/export/test_vendoring.py — modified

          with pytest.raises(VendoringError, match="llama-quantize"):
              llama_quantize_bin(override=root)
 +    def test_dlm_llama_cpp_build_env_preferred(
 +        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
 +    ) -> None:
 +        """Audit-08 M6: `DLM_LLAMA_CPP_BUILD` overrides the default vendor dir.
++
 +        The env var points at a build-only dir (e.g. the ROCm
 +        `vendor/llama.cpp/build-rocm`) that contains only binaries.
 +        `_resolve_binary` must find `bin/llama-quantize` there before
 +        falling through to the vendor tree.
++
 +        The production path has `override=None`; we mirror that here
 +        by driving vendor resolution through `DLM_LLAMA_CPP_ROOT` so
 +        both env vars coexist (ROCm users set both).
 +        """
 +        rocm_build = tmp_path / "build-rocm"
 +        (rocm_build / "bin").mkdir(parents=True)
 +        rocm_bin = rocm_build / "bin" / "llama-quantize"
 +        rocm_bin.write_text("#!/bin/sh\necho rocm\n")
 +        rocm_bin.chmod(0o755)
++
 +        vendor_root = _populate_vendor(tmp_path / "llama.cpp")
++
 +        monkeypatch.setenv("DLM_LLAMA_CPP_BUILD", str(rocm_build))
 +        monkeypatch.setenv("DLM_LLAMA_CPP_ROOT", str(vendor_root))
 +        path = llama_quantize_bin()
 +        # The ROCm build binary wins over the vendored CPU build.
 +        assert path == rocm_bin
++
 +    def test_dlm_llama_cpp_build_env_missing_binary_falls_through(
 +        self, tmp_path: Path, monkeypatch: pytest.MonkeyPatch
 +    ) -> None:
 +        """Env var pointing at an incomplete dir falls through to vendor."""
 +        empty_build = tmp_path / "build-rocm"
 +        empty_build.mkdir()
 +        vendor_root = _populate_vendor(tmp_path / "llama.cpp")
 +        monkeypatch.setenv("DLM_LLAMA_CPP_BUILD", str(empty_build))
 +        monkeypatch.setenv("DLM_LLAMA_CPP_ROOT", str(vendor_root))
 +        path = llama_quantize_bin()
 +        assert path.is_file()
 +        assert str(vendor_root) in str(path)
++
      def test_legacy_quantize_name_found(self, tmp_path: Path) -> None:
          """Pre-rename builds shipped `quantize` rather than `llama-quantize`."""
          root = _populate_vendor(tmp_path / "llama.cpp", with_binary=False)