rename CLI + source references to sway; keep dlm-sway as the PyPI wheel name

Status	File	+	-
A	`.gitignore`	28	0
M	`README.md`	28	16
M	`pyproject.toml`	4	3
M	`src/dlm_sway/__init__.py`	5	1
M	`src/dlm_sway/backends/hf.py`	4	3
M	`src/dlm_sway/cli/__init__.py`	1	1
M	`src/dlm_sway/cli/app.py`	4	4
M	`src/dlm_sway/cli/commands.py`	5	5
M	`src/dlm_sway/core/errors.py`	2	2
M	`src/dlm_sway/suite/report.py`	4	4
M	`src/dlm_sway/suite/spec.py`	2	2
M	`tests/unit/test_cli.py`	4	4
M	`tests/unit/test_suite_score_report.py`	2	2

.gitignore added

 +# Python
 +__pycache__/
 +*.py[cod]
 +*$py.class
 +*.so
++
 +# Virtual envs
 +.venv/
 +venv/
 +.env
++
 +# Tooling caches
 +.mypy_cache/
 +.pytest_cache/
 +.ruff_cache/
 +.coverage
 +htmlcov/
++
 +# Build artifacts
 +build/
 +dist/
 +*.egg-info/
++
 +# Editor
 +.idea/
 +.vscode/
 +*.swp
 +.DS_Store

README.md modified

 -# dlm-sway
 +# sway
  Differential testing for fine-tuned causal language models.
  in a meaningful way, or is the model just defaulting to the pretrained
  base?*
 -`dlm-sway` gives you a trustworthy, reproducible answer with eleven
 +`sway` gives you a trustworthy, reproducible answer with eleven
  purpose-built primitives, each z-scored against a null-adapter baseline.
  No LLM judges. No external APIs. Deterministic on CPU where possible.
 +> **Naming note.** The source repo and CLI entry point are both `sway`.
 +> The PyPI wheel is named `dlm-sway` because `sway` is already taken on
 +> PyPI by an unrelated project. `pip install dlm-sway` installs the
 +> `sway` command — a distribution name that differs from the name you
 +> type or import is common in the Python ecosystem (compare
 +> `pip install pyyaml` → `import yaml`).
++
  ## Install
  ```bash
  ## 90-second smoke test
  ```bash
 -dlm-sway check path/to/adapter --base HuggingFaceTB/SmolLM2-135M-Instruct
 +sway check path/to/adapter --base HuggingFaceTB/SmolLM2-135M-Instruct
  ```
  Outputs a verdict in under a minute on CPU for small models: *your
    ft:   {kind: hf, base: "HuggingFaceTB/SmolLM2-135M-Instruct",
           adapter: "./runs/adapter/v0003"}
  suite:
 -  - {name: knows_concept, kind: dir,
 -     prompt: "The Dunning-Kruger effect describes",
 -     target: " a cognitive bias where",
 -     distractor: " a programming language"}
 -  - {name: no_reversion, kind: adapter_revert, paraphrases: 4}
 +  - {name: null_baseline,       kind: null_adapter, runs: 3}
 +  - {name: doc_divergence,      kind: delta_kl,
 +     prompts: ["The key insight is", "An important rule"]}
    - {name: section_attribution, kind: section_internalization}
 +  - {name: no_leakage,          kind: leakage}
 +  - {name: ablation_shape,      kind: adapter_ablation,
 +     prompts: ["Tell me more about"]}
  ```
  ```bash
 -dlm-sway run sway.yaml              # full report to terminal + JSON
 -dlm-sway gate sway.yaml --junit     # CI-friendly; non-zero on fail
 +sway run sway.yaml              # full report to terminal + JSON
 +sway gate sway.yaml --junit     # CI-friendly; non-zero on fail
  ```
  ## Why it exists
  move the model toward what I wrote?"* — and existing tools answer this
  poorly.
 -`dlm-sway` answers it directly via eleven primitives across four
 -categories:
 +`sway` answers it directly via eleven primitives across four categories:
  | Category      | Primitives                                            |
  |---------------|-------------------------------------------------------|
  crash. Nobody else does this because nobody else gets this close to the
  adapter math.
 +**The calibration.** Every numeric probe z-scores its raw metric against
 +a null-adapter baseline — a same-structure LoRA with random-init weights.
 +"Your adapter's KL is 4.2σ above noise" is a far stronger claim than a
 +fixed threshold. The null-adapter calibration requires a backend that
 +implements `NullCalibratedBackend` (the HF backend does).
++
  ## The `.dlm` integration
  If you trained your adapter via the [DocumentLanguageModel
 -project](https://github.com/tenseleyFlow/DocumentLanguageModel), sway
 -can auto-generate a test suite from your document's sections:
 +project](https://github.com/tenseleyFlow/DocumentLanguageModel), `sway`
 +auto-generates a test suite from your document's sections:
  ```bash
  pip install "dlm-sway[hf,dlm]"
 -dlm-sway autogen path/to/doc.dlm -o sway.yaml
 -dlm-sway run sway.yaml
 +sway autogen path/to/doc.dlm -o sway.yaml
 +sway run sway.yaml
  ```
  Per-section attribution tells you *which* parts of your document

pyproject.toml modified

+ ]
  [project.scripts]
 -dlm-sway = "dlm_sway.cli.app:main"
 +sway = "dlm_sway.cli.app:main"
  [project.urls]
 -Homepage = "https://github.com/tenseleyFlow/DocumentLanguageModel"
 -Issues = "https://github.com/tenseleyFlow/DocumentLanguageModel/issues"
 +Homepage = "https://github.com/tenseleyFlow/sway"
 +Issues = "https://github.com/tenseleyFlow/sway/issues"
 +"Related project" = "https://github.com/tenseleyFlow/DocumentLanguageModel"
  [dependency-groups]
  dev = [

src/dlm_sway/__init__.py modified

 -"""dlm-sway — differential testing for fine-tuned causal language models."""
 +"""sway — differential testing for fine-tuned causal language models.
++
 +Published on PyPI as ``dlm-sway`` (the short name is taken); the CLI
 +entry point and source repo are ``sway``.
 +"""
  from __future__ import annotations

src/dlm_sway/backends/hf.py modified

      def as_base(self) -> Iterator[_HFView]:
          self._enter("base")
          try:
 -            # peft.PeftModel.disable_adapter is a context manager; mypy
 -            # mis-reads it as a Tensor on this transformers version.
 -            with self._peft_model.disable_adapter():  # type: ignore[operator]
 +            # peft.PeftModel.disable_adapter is a context manager; newer
 +            # transformers builds ship stubs that mis-type it as a Tensor,
 +            # so we warn-only there (see hf backend mypy overrides).
 +            with self._peft_model.disable_adapter():
                  yield self._make_view("base")
          finally:
              self._exit()

src/dlm_sway/cli/__init__.py modified

`@@ -1,1 +1,1 @@`
1		-"""Command-line interface (entry point: ``dlm-sway``)."""
	1	+"""Command-line interface (entry point: ``sway``)."""

src/dlm_sway/cli/app.py modified

 -"""dlm-sway CLI entry point.
 +"""sway CLI entry point.
  ``pip install dlm-sway`` installs this module's :func:`main` as the
 -``dlm-sway`` console script. Every subcommand is a thin wrapper around a
 +``sway`` console script. Every subcommand is a thin wrapper around a
  library-level function so the CLI surface mirrors what programmatic
  callers get.
  """
  from dlm_sway.cli import commands
  app = typer.Typer(
 -    name="dlm-sway",
 +    name="sway",
      no_args_is_help=True,
      add_completion=False,
      help="Differential testing for fine-tuned causal language models.",
  def _version_callback(value: bool) -> None:
      if value:
 -        typer.echo(f"dlm-sway {__version__}")
 +        typer.echo(f"sway {__version__}")
          raise typer.Exit()

src/dlm_sway/cli/commands.py modified

 -"""Command implementations for the ``dlm-sway`` CLI.
 +"""Command implementations for the ``sway`` CLI.
  Each function here is wired to a subcommand in :mod:`dlm_sway.cli.app`.
  Commands deliberately do as little as possible themselves — the real
          typer.Option("--out", "-o", help="Where to write the generated sway.yaml."),
      ] = Path("sway.yaml"),
  ) -> None:
 -    """Generate a sway.yaml from a .dlm file (requires dlm-sway[dlm])."""
 +    """Generate a sway.yaml from a .dlm file (requires the ``dlm-sway[dlm]`` extra)."""
      import importlib
      try:
  def doctor_cmd() -> None:
      """Print backend availability and version info."""
      console = Console()
 -    console.print(f"[bold]dlm-sway[/bold] {__version__}")
 +    console.print(f"[bold]sway[/bold] {__version__}")
      console.print(f"  python:    {sys.version.split()[0]}")
      console.print(f"  platform:  {sys.platform}")
      console.print()
  def _render_markdown_from_json(raw: dict[str, Any]) -> str:
      score: dict[str, Any] = raw.get("score", {})
      lines: list[str] = [
 -        "# dlm-sway report",
 +        "# sway report",
          "",
          f"**Overall:** {score.get('overall', 0.0):.2f} (`{score.get('band', '?')}`)  ",
          f"**Base:** `{raw.get('base_model_id', '?')}`  ",
      import xml.etree.ElementTree as ET
      probes: list[dict[str, Any]] = raw.get("probes", [])
 -    testsuite = ET.Element("testsuite", {"name": "dlm-sway", "tests": str(len(probes))})
 +    testsuite = ET.Element("testsuite", {"name": "sway", "tests": str(len(probes))})
      for p in probes:
          tc = ET.SubElement(testsuite, "testcase", {"classname": p["kind"], "name": p["name"]})
          if p["verdict"] == "fail":

src/dlm_sway/core/errors.py modified

 -"""Exception hierarchy for dlm-sway.
 +"""Exception hierarchy for sway.
  Every error sway raises inherits from :class:`SwayError` so callers can
  catch the whole family with a single ``except``. Subclasses carry enough
  class SwayError(Exception):
 -    """Root of the dlm-sway exception hierarchy."""
 +    """Root of the sway exception hierarchy."""
  class SpecValidationError(SwayError):

src/dlm_sway/suite/report.py modified

  :class:`SuiteResult` dataclass but flattened for easy downstream parsing
  (dashboards, diff tools, history tracking).
 -JUnit XML exists to drop into CI pipelines so ``dlm-sway gate``
 +JUnit XML exists to drop into CI pipelines so ``sway gate``
  integrates with existing test dashboards with no extra glue.
  """
      c = console or Console()
      header = Text.assemble(
 -        ("dlm-sway report — ", "bold"),
 +        ("sway report — ", "bold"),
          (suite.base_model_id, "cyan"),
          ("  vs  ", "dim"),
          (_adapter_label(suite.adapter_id), "cyan"),
      testsuite = ET.Element(
          "testsuite",
+         {
 -            "name": "dlm-sway",
 +            "name": "sway",
              "tests": str(len(suite.probes)),
              "failures": str(sum(1 for p in suite.probes if p.verdict == Verdict.FAIL)),
              "errors": str(sum(1 for p in suite.probes if p.verdict == Verdict.ERROR)),
  def to_markdown(suite: SuiteResult, score: SwayScore) -> str:
      """A portable, CI-friendly markdown report."""
      buf = StringIO()
 -    buf.write("# dlm-sway report\n\n")
 +    buf.write("# sway report\n\n")
      buf.write(f"**Overall:** {score.overall:.2f} (`{score.band}`)  \n")
      buf.write(f"**Base:** `{suite.base_model_id}`  \n")
      buf.write(f"**Adapter:** `{_adapter_label(suite.adapter_id)}`  \n")

src/dlm_sway/suite/spec.py modified

      instead of toggling on one. More memory-heavy; only useful when a
      backend can't do in-place toggling."""
      coverage_threshold: Annotated[float, Field(ge=0.0, le=1.0)] = 0.6
 -    """Minimum composite score for ``dlm-sway gate`` to pass."""
 +    """Minimum composite score for ``sway gate`` to pass."""
  class SwaySpec(BaseModel):
      """Optional path to a ``.dlm`` file. When present, the runner asks
      :mod:`dlm_sway.integrations.dlm.resolver` for typed sections and
      hands them to probes via :attr:`RunContext.sections`. Auto-populated
 -    by ``dlm-sway autogen``."""
 +    by ``sway autogen``."""
      def check_version(self) -> None:
          """Raise ``ValueError`` if the spec version is unsupported.

tests/unit/test_cli.py modified

 -"""Smoke tests for the dlm-sway CLI.
 +"""Smoke tests for the sway CLI.
  We avoid exercising backends (they need real models) and instead test
  arg parsing, error paths, and the read-only commands (``doctor``,
  def test_version_exits_zero() -> None:
      result = CliRunner().invoke(app, ["--version"])
      assert result.exit_code == 0
 -    assert "dlm-sway" in result.stdout
 +    assert "sway" in result.stdout
  def test_help_lists_all_commands() -> None:
      result = CliRunner().invoke(app, ["doctor"])
      assert result.exit_code == 0
      # Rich applies color codes by default; assert the bare product name appears.
 -    assert "dlm-sway" in result.stdout
 +    assert "sway" in result.stdout
      assert "backends" in result.stdout
      md = CliRunner().invoke(app, ["report", str(path), "--format", "md"])
      assert md.exit_code == 0
 -    assert "dlm-sway report" in md.stdout
 +    assert "sway report" in md.stdout
      junit = CliRunner().invoke(app, ["report", str(path), "--format", "junit"])
      assert junit.exit_code == 0

tests/unit/test_suite_score_report.py modified

+         )
          s = score.compute(suite)
          md = report.to_markdown(suite, s)
 -        assert "dlm-sway report" in md
 +        assert "sway report" in md
          assert "| p1 | `__score_adherence`" in md
          console = Console(file=buf, force_terminal=False, width=120)
          report.to_terminal(suite, s, console=console)
          out = buf.getvalue()
 -        assert "dlm-sway report" in out
 +        assert "sway report" in out
          assert "overall:" in out
          assert "p1" in out
          assert "p2" in out

tenseleyflow/sway / `98ad941`

13 changed files