tenseleyflow/sway / 3890e1e

Browse files

sway(bridge): align resolver with real dlm API (type/parsers/for_dlm/base_models.resolve)

Authored by espadonne
SHA
3890e1e09452818cdf352d5fe678fc445fc15298
Parents
3a27d73
Tree
a5c717a

3 changed files

Status | File | + | -
M src/dlm_sway/backends/hf.py 7 3
M src/dlm_sway/integrations/dlm/resolver.py 84 47
M tests/unit/test_dlm_bridge.py 63 26
src/dlm_sway/backends/hf.py — modified
@@ -256,7 +256,9 @@ class HuggingFaceDifferentialBackend:
256256
     def as_base(self) -> Iterator[_HFView]:
257257
         self._enter("base")
258258
         try:
259
-            with self._peft_model.disable_adapter():
259
+            # peft.PeftModel.disable_adapter is a context manager; mypy
260
+            # mis-reads it as a Tensor on this transformers version.
261
+            with self._peft_model.disable_adapter():  # type: ignore[operator]
260262
                 yield self._make_view("base")
261263
         finally:
262264
             self._exit()
@@ -279,7 +281,9 @@ class HuggingFaceDifferentialBackend:
279281
         exception propagates, to keep the model in a sane state.
280282
         """
281283
         self._enter(f"scaled({lam})")
282
-        saved: list[tuple[object, str, float]] = []
284
+        # ``module`` is dynamic (peft LoraLayer subclass) — Any avoids
285
+        # mypy treating its ``.scaling`` as a Tensor when peft is loaded.
286
+        saved: list[tuple[Any, str, float]] = []
283287
         try:
284288
             import peft  # noqa: PLC0415 — already a hard dep of this backend
285289
 
@@ -298,7 +302,7 @@ class HuggingFaceDifferentialBackend:
298302
             yield self._make_view(f"scaled_{lam:.2f}")
299303
         finally:
300304
             for module, key, original in saved:
301
-                module.scaling[key] = original  # type: ignore[attr-defined]
305
+                module.scaling[key] = original
302306
             self._exit()
303307
 
304308
     @contextmanager
src/dlm_sway/integrations/dlm/resolver.py — modified
@@ -69,50 +69,75 @@ def resolve_dlm(dlm_path: Path) -> DlmHandle:
6969
     doc_text = "\n\n".join(s.content for s in sections)
7070
 
7171
     adapter_path = _resolve_adapter_path(fm.dlm_id)
72
+    base_hf_id = _resolve_base_model_to_hf_id(fm.base_model)
7273
 
7374
     return DlmHandle(
7475
         dlm_id=fm.dlm_id,
75
-        base_model=fm.base_model,
76
+        base_model=base_hf_id,
7677
         adapter_path=adapter_path,
7778
         sections=sections,
7879
         doc_text=doc_text,
7980
     )
8081
 
8182
 
83
+def _resolve_base_model_to_hf_id(base_model: str) -> str:
84
+    """Translate dlm's base-model *key* to a HuggingFace repo id.
85
+
86
+    dlm's frontmatter stores registry keys like ``smollm2-135m`` which
87
+    resolve to ``HuggingFaceTB/SmolLM2-135M-Instruct``. sway's backends
88
+    call ``AutoModelForCausalLM.from_pretrained`` directly and need the
89
+    HF id. The ``hf:org/name`` escape hatch passes through unchanged.
90
+    """
91
+    if base_model.startswith("hf:"):
92
+        return base_model[len("hf:") :]
93
+    try:
94
+        from dlm.base_models import resolve as resolve_base
95
+    except ImportError:
96
+        return base_model
97
+    try:
98
+        spec = resolve_base(base_model)
99
+    except Exception:  # noqa: BLE001 — unknown dlm errors
100
+        return base_model
101
+    hf_id = getattr(spec, "hf_id", None)
102
+    return str(hf_id) if hf_id else base_model
103
+
104
+
82105
 def _resolve_adapter_path(dlm_id: str) -> Path | None:
83106
     """Locate the current adapter directory for ``dlm_id``.
84107
 
85
-    Uses dlm's ``StorePath`` helper if available, else falls back to
86
-    the canonical ``~/.dlm/store/<dlm_id>/adapter/current.txt`` pointer.
87
-    Returns ``None`` if no adapter has been trained yet.
108
+    Uses dlm's module-level ``for_dlm`` helper if available, else falls
109
+    back to the canonical ``~/.dlm/store/<dlm_id>/adapter/current.txt``
110
+    pointer. Returns ``None`` if no adapter has been trained yet.
88111
     """
112
+    # Primary path: use dlm's own store-path helpers.
89113
     try:
90
-        from dlm.store.paths import StorePath
91
-
92
-        _store_path_cls: object | None = StorePath
114
+        from dlm.store.paths import for_dlm as _for_dlm
93115
     except ImportError:
94
-        _store_path_cls = None
116
+        _for_dlm = None
95117
 
96
-    if _store_path_cls is not None:
118
+    if _for_dlm is not None:
97119
         try:
98
-            store = _store_path_cls.for_dlm(dlm_id)  # type: ignore[attr-defined]
120
+            store = _for_dlm(dlm_id)
99121
         except Exception:  # noqa: BLE001 — unknown dlm exception shapes
100
-            return None
101
-        try:
102
-            resolved = store.resolve_current_adapter()
103
-        except (AttributeError, FileNotFoundError):
104
-            resolved = None
105
-        if resolved is not None and resolved.exists():
106
-            return Path(resolved)
107
-
108
-    # Manual fallback in case the dlm API evolves.
122
+            store = None
123
+        if store is not None:
124
+            try:
125
+                resolved = store.resolve_current_adapter()
126
+            except (AttributeError, FileNotFoundError):
127
+                resolved = None
128
+            if resolved is not None and Path(resolved).exists():
129
+                return Path(resolved)
130
+
131
+    # Manual fallback. The ``current.txt`` pointer is relative to the
132
+    # **store root**, not to current.txt's parent dir — so go up one level.
109133
     import os
110134
 
111135
     home = Path(os.environ.get("DLM_HOME", "~/.dlm")).expanduser()
112
-    current_file = home / "store" / dlm_id / "adapter" / "current.txt"
136
+    store_root = home / "store" / dlm_id
137
+    current_file = store_root / "adapter" / "current.txt"
113138
     if current_file.exists():
114139
         pointer = current_file.read_text(encoding="utf-8").strip()
115
-        candidate = (current_file.parent / pointer).resolve()
140
+        candidate = (store_root / pointer).resolve()
116141
         if candidate.exists():
117142
             return candidate
118143
     return None
@@ -121,12 +146,14 @@ def _resolve_adapter_path(dlm_id: str) -> Path | None:
121146
 def _translate_section(dlm_section: object) -> Section:
122147
     """Adapt a ``dlm.doc.sections.Section`` to sway's section type.
123148
 
124
-    The shape dlm uses has been stable through the v0.x series but we
125
-    treat field access defensively so a minor dlm refactor can't silently
126
-    misread section content.
149
+    dlm's Section dataclass uses the attribute name ``type`` (not
150
+    ``kind``) and stores instruction/preference content as raw markdown
151
+    — dlm ships dedicated parsers (``parse_instruction_body``,
152
+    ``parse_preference_body``) that we reuse here so any future dlm
153
+    syntax additions land in sway for free.
127154
     """
128
-    kind_raw = getattr(dlm_section, "kind", None)
129
-    # dlm uses the attribute name "kind" on its Section dataclass.
155
+    # dlm's current attribute is ``type``; older revisions used ``kind``.
156
+    kind_raw = getattr(dlm_section, "type", getattr(dlm_section, "kind", None))
130157
     kind = _normalize_kind(kind_raw)
131158
     content = str(getattr(dlm_section, "content", ""))
132159
     section_id = str(
@@ -139,9 +166,9 @@ def _translate_section(dlm_section: object) -> Section:
139166
     probes: tuple[SectionProbe, ...] = ()
140167
     preferences: tuple[SectionPreference, ...] = ()
141168
     if kind == "instruction":
142
-        probes = tuple(_extract_instruction_probes(dlm_section))
169
+        probes = tuple(_parse_instruction(content, section_id=section_id))
143170
     elif kind == "preference":
144
-        preferences = tuple(_extract_preference_triples(dlm_section))
171
+        preferences = tuple(_parse_preference(content, section_id=section_id))
145172
 
146173
     return Section(
147174
         id=section_id,
@@ -168,35 +195,45 @@ def _normalize_kind(raw: object) -> SectionKind:
168195
     return "prose"
169196
 
170197
 
171
-def _extract_instruction_probes(dlm_section: object) -> list[SectionProbe]:
172
-    """Pull (Q, A) pairs out of a dlm INSTRUCTION section.
198
+def _parse_instruction(content: str, *, section_id: str) -> list[SectionProbe]:
199
+    """Pull (Q, A) pairs out of a dlm INSTRUCTION section body.
173200
 
174
-    dlm's Section carries its parsed Q/A as ``probes`` or ``qa`` depending
175
-    on version. We read the first non-empty one and build
176
-    :class:`SectionProbe` records defensively.
201
+    Delegates to dlm's own ``parse_instruction_body`` so syntax additions
202
+    land in sway without code changes here. Falls back to an empty list
203
+    on parse errors — the probe will fail gracefully.
177204
     """
178
-    raw_probes = getattr(dlm_section, "probes", None) or getattr(dlm_section, "qa", None)
179
-    if not raw_probes:
205
+    try:
206
+        from dlm.data.instruction_parser import parse_instruction_body
207
+    except ImportError:
208
+        return []
209
+    try:
210
+        pairs = parse_instruction_body(content, section_id=section_id)
211
+    except Exception:  # noqa: BLE001 — dlm raises InstructionParseError
180212
         return []
181213
     out: list[SectionProbe] = []
182
-    for rp in raw_probes:
183
-        q = str(getattr(rp, "prompt", getattr(rp, "question", "")))
184
-        a = str(getattr(rp, "gold", getattr(rp, "answer", "")))
214
+    for p in pairs:
215
+        q = getattr(p, "question", getattr(p, "prompt", ""))
216
+        a = getattr(p, "answer", getattr(p, "gold", ""))
185217
         if q and a:
186
-            out.append(SectionProbe(prompt=q, gold=a))
218
+            out.append(SectionProbe(prompt=str(q), gold=str(a)))
187219
     return out
188220
 
189221
 
190
-def _extract_preference_triples(dlm_section: object) -> list[SectionPreference]:
191
-    """Pull (prompt, chosen, rejected) triples out of a dlm PREFERENCE section."""
192
-    raw = getattr(dlm_section, "preferences", None) or getattr(dlm_section, "triples", None)
193
-    if not raw:
222
+def _parse_preference(content: str, *, section_id: str) -> list[SectionPreference]:
223
+    """Pull (prompt, chosen, rejected) triples out of a PREFERENCE body."""
224
+    try:
225
+        from dlm.data.preference_parser import parse_preference_body
226
+    except ImportError:
227
+        return []
228
+    try:
229
+        triples = parse_preference_body(content, section_id=section_id)
230
+    except Exception:  # noqa: BLE001 — dlm raises PreferenceParseError
194231
         return []
195232
     out: list[SectionPreference] = []
196
-    for r in raw:
197
-        p = str(getattr(r, "prompt", ""))
198
-        c = str(getattr(r, "chosen", ""))
199
-        rej = str(getattr(r, "rejected", ""))
233
+    for t in triples:
234
+        p = str(getattr(t, "prompt", ""))
235
+        c = str(getattr(t, "chosen", ""))
236
+        rej = str(getattr(t, "rejected", ""))
200237
         if p and c and rej:
201238
             out.append(SectionPreference(prompt=p, chosen=c, rejected=rej))
202239
     return out
tests/unit/test_dlm_bridge.py — modified
@@ -25,26 +25,13 @@ def fake_dlm(monkeypatch: pytest.MonkeyPatch, tmp_path: Path) -> Path:
2525
     @dataclass
2626
     class _Frontmatter:
2727
         dlm_id: str = "01TESTULID"
28
-        base_model: str = "HuggingFaceTB/SmolLM2-135M-Instruct"
29
-
30
-    @dataclass
31
-    class _InstrProbe:
32
-        prompt: str
33
-        gold: str
34
-
35
-    @dataclass
36
-    class _PrefTriple:
37
-        prompt: str
38
-        chosen: str
39
-        rejected: str
28
+        base_model: str = "smollm2-135m"
4029
 
4130
     @dataclass
4231
     class _Section:
4332
         section_id: str
44
-        kind: str
33
+        type: str
4534
         content: str
46
-        probes: tuple[object, ...] = ()
47
-        preferences: tuple[object, ...] = ()
4835
         tag: str | None = None
4936
 
5037
     @dataclass
@@ -58,20 +45,18 @@ def fake_dlm(monkeypatch: pytest.MonkeyPatch, tmp_path: Path) -> Path:
5845
             sections=(
5946
                 _Section(
6047
                     section_id="prose-1",
61
-                    kind="PROSE",
48
+                    type="PROSE",
6249
                     content="This is a prose section with some information. Further detail follows.",
6350
                 ),
6451
                 _Section(
6552
                     section_id="instr-1",
66
-                    kind="INSTRUCTION",
67
-                    content="Q-A pairs",
68
-                    probes=(_InstrProbe("What is X?", "X is a concept"),),
53
+                    type="INSTRUCTION",
54
+                    content="### Q\nWhat is X?\n\n### A\nX is a concept\n",
6955
                 ),
7056
                 _Section(
7157
                     section_id="pref-1",
72
-                    kind="PREFERENCE",
73
-                    content="Prefs",
74
-                    preferences=(_PrefTriple("Which?", "good answer", "bad answer"),),
58
+                    type="PREFERENCE",
59
+                    content="chosen/rejected triple",
7560
                 ),
7661
             ),
7762
         )
@@ -94,20 +79,72 @@ def fake_dlm(monkeypatch: pytest.MonkeyPatch, tmp_path: Path) -> Path:
9479
         def __init__(self, path: Path) -> None:
9580
             self._p = path
9681
 
97
-        @classmethod
98
-        def for_dlm(cls, _dlm_id: str) -> _StorePath:
99
-            return cls(adapter_dir)
100
-
10182
         def resolve_current_adapter(self) -> Path:
10283
             return self._p
10384
 
85
+    def _for_dlm(_dlm_id: str) -> _StorePath:
86
+        return _StorePath(adapter_dir)
87
+
10488
     dlm_store_paths.StorePath = _StorePath  # type: ignore[attr-defined]
89
+    dlm_store_paths.for_dlm = _for_dlm  # type: ignore[attr-defined]
90
+
91
+    # Fake base-model resolver — returns a stub with an ``hf_id`` attribute.
92
+    dlm_base = types.ModuleType("dlm.base_models")
93
+
94
+    @dataclass
95
+    class _BaseSpec:
96
+        hf_id: str
97
+        key: str
98
+
99
+    def _resolve(key: str) -> _BaseSpec:
100
+        return _BaseSpec(hf_id="HuggingFaceTB/SmolLM2-135M-Instruct", key=key)
101
+
102
+    dlm_base.resolve = _resolve  # type: ignore[attr-defined]
103
+
104
+    # Fake instruction / preference parsers.
105
+    dlm_data = types.ModuleType("dlm.data")
106
+    dlm_data_instr = types.ModuleType("dlm.data.instruction_parser")
107
+    dlm_data_pref = types.ModuleType("dlm.data.preference_parser")
108
+
109
+    @dataclass
110
+    class _QAPair:
111
+        question: str
112
+        answer: str
113
+
114
+    @dataclass
115
+    class _Triple:
116
+        prompt: str
117
+        chosen: str
118
+        rejected: str
119
+
120
+    def _parse_instr(body: str, *, section_id: str) -> list[_QAPair]:
121
+        del section_id
122
+        out: list[_QAPair] = []
123
+        parts = body.split("### Q")
124
+        for part in parts[1:]:
125
+            q_block, _, a_block = part.partition("### A")
126
+            q = q_block.strip()
127
+            a = a_block.strip()
128
+            if q and a:
129
+                out.append(_QAPair(question=q, answer=a))
130
+        return out
131
+
132
+    def _parse_pref(body: str, *, section_id: str) -> list[_Triple]:
133
+        del body, section_id
134
+        return [_Triple(prompt="Which?", chosen="good answer", rejected="bad answer")]
135
+
136
+    dlm_data_instr.parse_instruction_body = _parse_instr  # type: ignore[attr-defined]
137
+    dlm_data_pref.parse_preference_body = _parse_pref  # type: ignore[attr-defined]
105138
 
106139
     monkeypatch.setitem(sys.modules, "dlm", dlm_pkg)
107140
     monkeypatch.setitem(sys.modules, "dlm.doc", dlm_doc)
108141
     monkeypatch.setitem(sys.modules, "dlm.doc.parser", dlm_doc_parser)
109142
     monkeypatch.setitem(sys.modules, "dlm.store", dlm_store)
110143
     monkeypatch.setitem(sys.modules, "dlm.store.paths", dlm_store_paths)
144
+    monkeypatch.setitem(sys.modules, "dlm.base_models", dlm_base)
145
+    monkeypatch.setitem(sys.modules, "dlm.data", dlm_data)
146
+    monkeypatch.setitem(sys.modules, "dlm.data.instruction_parser", dlm_data_instr)
147
+    monkeypatch.setitem(sys.modules, "dlm.data.preference_parser", dlm_data_pref)
111148
 
112149
     # Return a path to a fake .dlm file (the parser won't actually read it).
113150
     dlm_file = tmp_path / "doc.dlm"