`a608f28`

Disambiguate duplicate output basenames

Authored by

espadonne 2 weeks ago

SHA: a608f2876e1ab3ab6e54193d1e4e4b5f8a7aed28
Parents: 994af83
Tree: 8c9d1b3

2 changed files

Status	File	+	-
M	`src/loader/runtime/workflow.py`	53	14
M	`tests/test_repair.py`	57	0

src/loader/runtime/workflow.py modified

      """Infer the concrete file path a pending todo is asking the model to mutate."""
      root = project_root or Path.cwd()
 +    target_label = _normalize_pending_output_label(item)
      candidates = todo_file_candidates(item)
      planned_targets = collect_planned_artifact_targets(
          dod,
      )
      if candidates:
 -        planned_files = {
 -            target.name.lower(): target
 +        planned_files = [
 +            target
              for target, expect_directory in planned_targets
              if not expect_directory
 -        }
 +        ]
          planned_directories = [
              target
              for target, expect_directory in planned_targets
              if candidate.is_absolute() or candidate_str.startswith("~"):
                  return Path(candidate_str).expanduser()
 -            planned_match = planned_files.get(candidate.name.lower())
 -            if planned_match is not None:
 -                return planned_match
 -
 -            for touched in reversed(touched_paths):
 -                if touched.name.lower() == candidate.name.lower():
 -                    continue
 -                if candidate.suffix and touched.suffix.lower() != candidate.suffix.lower():
 -                    continue
 -                return touched.parent / candidate.name
 +            planned_matches = [
 +                target
 +                for target in planned_files
 +                if target.name.lower() == candidate.name.lower()
 +            ]
 +            if planned_matches:
 +                return _select_best_pending_output_path(
 +                    planned_matches,
 +                    todo_label=target_label,
 +                )
 +
 +            touched_matches = [
 +                touched.parent / candidate.name
 +                for touched in reversed(touched_paths)
 +                if touched.name.lower() != candidate.name.lower()
 +                and (
 +                    not candidate.suffix
 +                    or touched.suffix.lower() == candidate.suffix.lower()
 +                )
 +            ]
 +            if touched_matches:
 +                return _select_best_pending_output_path(
 +                    touched_matches,
 +                    todo_label=target_label,
 +                )
              for directory in planned_directories:
                  return directory / candidate.name
 -    target_label = _normalize_pending_output_label(item)
      if not target_label:
          return None
      return matches[0][2]
 +def _select_best_pending_output_path(
 +    paths: list[Path],
 +    *,
 +    todo_label: str,
 +) -> Path:
 +    ranked = sorted(
 +        paths,
 +        key=lambda path: (
 +            _pending_output_path_match_score(todo_label, path),
 +            not path.expanduser().exists(),
 +            str(path),
 +        ),
 +        reverse=True,
 +    )
 +    return ranked[0]
 +
 +
  def preserve_task_grounded_acceptance_criteria(
      task_statement: str,
      *,
      return 0
 +def _pending_output_path_match_score(todo_label: str, path: Path) -> int:
 +    if not todo_label:
 +        return 0
 +    path_label = _normalize_pending_output_label(str(path))
 +    return _pending_output_link_match_score(todo_label, path_label)
 +
 +
  def _iter_local_html_links(content: str) -> list[tuple[str, str]]:
      pattern = re.compile(
          r"<a\b[^>]*href\s*=\s*[\"']([^\"']+)[\"'][^>]*>(.*?)</a>",

tests/test_repair.py modified

      assert "Make the next response one concrete evidence-gathering tool call" not in decision.retry_message
 +def test_empty_response_retry_prefers_output_index_over_reference_index_with_same_name(
 +    temp_dir: Path,
 +) -> None:
 +    context = build_context(
 +        temp_dir=temp_dir,
 +        use_react=False,
 +    )
 +    repairer = ResponseRepairer(context)
 +
 +    nginx_root = temp_dir / "Loader" / "guides" / "nginx"
 +    fortran_root = temp_dir / "Loader" / "guides" / "fortran"
 +    nginx_root.mkdir(parents=True)
 +    fortran_root.mkdir(parents=True)
 +    reference_index = fortran_root / "index.html"
 +    reference_index.write_text("<html>fortran</html>\n")
 +    output_index = nginx_root / "index.html"
 +
 +    implementation_plan = temp_dir / "implementation.md"
 +    implementation_plan.write_text(
 +        "\n".join(
 +            [
 +                "# Implementation Plan",
 +                "",
 +                "## File Changes",
 +                f"- `{output_index}`",
 +                f"- `{nginx_root / 'chapters'}/`",
 +                f"- `{reference_index}`",
 +                "",
 +            ]
 +        )
 +    )
 +
 +    dod = create_definition_of_done("Create a multi-file nginx guide.")
 +    dod.implementation_plan = str(implementation_plan)
 +    dod.touched_files.append(str(reference_index))
 +    dod.completed_items.append(
 +        "First, examine the existing Fortran guide structure and content"
 +    )
 +    dod.pending_items.append("Develop the nginx index.html file")
 +
 +    decision = repairer.handle_empty_response(
 +        task="Create a multi-file nginx guide.",
 +        original_task=None,
 +        empty_retry_count=2,
 +        max_empty_retries=2,
 +        dod=dod,
 +    )
 +
 +    assert decision.should_continue is True
 +    assert decision.retry_message is not None
 +    assert (
 +        f"Prefer one `write(content=...)` call for `{output_index}` before more research."
 +        in decision.retry_message
 +    )
 +    assert str(reference_index) not in decision.retry_message
 +
 +
  def test_empty_response_retry_points_at_declared_child_file_within_incomplete_output_directory(
      temp_dir: Path,
  ) -> None: