`4630a24`

test(doc): CptConfig + v2→v3 migrator coverage

Authored by

espadonne 3 weeks ago

SHA: 4630a2483cc7d73acf4ab27003366bca320e7d6e
Parents: 3f2d0f5
Tree: 863cadf

2 changed files

Status	File	+	-
A	`tests/unit/doc/test_migration_v2_to_v3.py`	63	0
M	`tests/unit/doc/test_schema.py`	51	1

`tests/unit/doc/test_migration_v2_to_v3.py` — added

 +"""v2 → v3 migrator: additive `training.cpt` block.
++
 +v3 is additive with defaults, so the migrator changes no content: it
 +returns an equal copy of its input. These tests lock that shape in: a
 +v2 doc round-trips unchanged, and the migrated output validates under
 +the v3 `DlmFrontmatter` with the default `CptConfig`.
 +"""
++
 +from __future__ import annotations
++
 +from typing import Any
++
 +from dlm.doc.migrations.v2 import migrate
 +from dlm.doc.schema import CptConfig, DlmFrontmatter
++
 +VALID_ULID = "01HZ4X7TGZM3J1A2B3C4D5E6F7"
++
++
 +class TestIdentityShape:
 +    def test_empty_dict_passthrough(self) -> None:
 +        raw: dict[str, Any] = {}
 +        out = migrate(raw)
 +        assert out == raw
 +        assert out is not raw  # copy, not alias
++
 +    def test_v2_preference_block_preserved(self) -> None:
 +        raw: dict[str, Any] = {
 +            "dlm_id": VALID_ULID,
 +            "base_model": "smollm2-135m",
 +            "training": {
 +                "preference": {
 +                    "method": "orpo",
 +                    "hyperparams": {"alpha": 0.15},
 +                },
 +            },
 +        }
 +        out = migrate(raw)
 +        assert out == raw
++
 +    def test_full_training_block_preserved(self) -> None:
 +        raw: dict[str, Any] = {
 +            "training": {
 +                "adapter": "lora",
 +                "lora_r": 16,
 +                "learning_rate": 1e-4,
 +            },
 +        }
 +        out = migrate(raw)
 +        assert out == raw
++
++
 +class TestValidatesAsV3:
 +    def test_migrated_doc_validates_with_default_cpt(self) -> None:
 +        raw: dict[str, Any] = {
 +            "dlm_id": VALID_ULID,
 +            "base_model": "smollm2-135m",
 +            "dlm_version": 2,
 +        }
 +        out = migrate(raw)
 +        # Dispatcher stamps dlm_version post-migrate; simulate that.
 +        out["dlm_version"] = 3
 +        fm = DlmFrontmatter.model_validate(out)
 +        assert fm.training.cpt == CptConfig()

`tests/unit/doc/test_schema.py` — modified

  from pydantic import ValidationError
  from dlm.doc.schema import (
 +    CptConfig,
      DlmFrontmatter,
      ExportConfig,
      PreferenceConfig,
  )
 +class TestCptConfig:
 +    def test_default_instance(self) -> None:
 +        c = CptConfig()
 +        assert c.schedule == "auto"
 +        assert c.embed_warmup_steps == 0
++
 +    def test_frozen_model_rejects_mutation(self) -> None:
 +        c = CptConfig()
 +        with pytest.raises(ValidationError):
 +            c.embed_warmup_steps = 10  # type: ignore[misc]
++
 +    @pytest.mark.parametrize("value", ["auto", "dapt", "sft"])
 +    def test_schedule_accepts_known_values(self, value: str) -> None:
 +        CptConfig(schedule=value)  # type: ignore[arg-type]
++
 +    def test_schedule_rejects_unknown(self) -> None:
 +        with pytest.raises(ValidationError):
 +            CptConfig(schedule="warmup")  # type: ignore[arg-type]
++
 +    def test_embed_warmup_steps_must_be_non_negative(self) -> None:
 +        with pytest.raises(ValidationError):
 +            CptConfig(embed_warmup_steps=-1)
++
 +    def test_extra_fields_forbidden(self) -> None:
 +        with pytest.raises(ValidationError):
 +            CptConfig.model_validate({"schedule": "auto", "rubbish": 1})
++
++
 +class TestTrainingConfigCptSubfield:
 +    def test_default_training_has_auto_cpt(self) -> None:
 +        t = TrainingConfig()
 +        assert isinstance(t.cpt, CptConfig)
 +        assert t.cpt.schedule == "auto"
 +        assert t.cpt.embed_warmup_steps == 0
++
 +    def test_accepts_nested_dict_for_cpt(self) -> None:
 +        t = TrainingConfig.model_validate(
 +            {"cpt": {"schedule": "dapt", "embed_warmup_steps": 200}}
 +        )
 +        assert t.cpt.schedule == "dapt"
 +        assert t.cpt.embed_warmup_steps == 200
++
 +    def test_rejects_unknown_field_inside_cpt(self) -> None:
 +        with pytest.raises(ValidationError):
 +            TrainingConfig.model_validate(
 +                {"cpt": {"schedule": "dapt", "rubbish": 1}}
 +            )
++
++
  class TestExportConfig:
      def test_default_quant(self) -> None:
          assert ExportConfig().default_quant == "Q4_K_M"
  class TestDlmFrontmatter:
      def test_minimal_valid(self) -> None:
          fm = DlmFrontmatter(dlm_id=VALID_ULID, base_model="smollm2-135m")
 -        assert fm.dlm_version == 2
 +        assert fm.dlm_version == 3
          assert fm.training == TrainingConfig()
          assert fm.export == ExportConfig()
          assert fm.system_prompt is None