Move conversational fast path into runtime launcher
SHA: 5b9c14f85ebea90049931c329e1b983ab91d2c38 (short: 5b9c14f)
Parent: c61058b
Tree: b7a78b3

| Status | File | + | - |
|---|---|---|---|
| M |
src/loader/agent/loop.py
|
2 | 48 |
| A |
src/loader/runtime/chat_lane.py
|
55 | 0 |
| M |
src/loader/runtime/launcher.py
|
11 | 0 |
### src/loader/agent/loop.py — modified

@@ -375,53 +375,6 @@ class Agent:
| 375 | 375 | ) |
| 376 | 376 | return parse_decomposition(response.content, task) |
| 377 | 377 | |
| 378 | - async def _handle_conversational( | |
| 379 | - self, | |
| 380 | - user_message: str, | |
| 381 | - emit: Callable[[AgentEvent], Awaitable[None]], | |
| 382 | - ) -> str: | |
| 383 | - """Fast path for conversational messages - no tools, quick response.""" | |
| 384 | - await emit(AgentEvent(type="thinking")) | |
| 385 | - | |
| 386 | - # Add to history | |
| 387 | - self.session.append(Message(role=Role.USER, content=user_message)) | |
| 388 | - | |
| 389 | - # Simple system prompt for chat (no tools) | |
| 390 | - chat_system = Message( | |
| 391 | - role=Role.SYSTEM, | |
| 392 | - content=( | |
| 393 | - "You are Loader, a friendly local coding assistant. " | |
| 394 | - "Respond naturally and briefly to conversational messages. " | |
| 395 | - "If the user wants to do a coding task, tell them to describe it. " | |
| 396 | - "Keep responses short (1-3 sentences)." | |
| 397 | - ), | |
| 398 | - ) | |
| 399 | - | |
| 400 | - # Use only recent context for speed | |
| 401 | - recent_messages = self.messages[-4:] if len(self.messages) > 4 else self.messages | |
| 402 | - | |
| 403 | - # Stream the response | |
| 404 | - full_content = "" | |
| 405 | - async for chunk in self.backend.stream( | |
| 406 | - messages=[chat_system] + recent_messages, | |
| 407 | - tools=None, # No tools for chat | |
| 408 | - temperature=0.7, # More natural | |
| 409 | - max_tokens=256, # Short response | |
| 410 | - ): | |
| 411 | - if chunk.content: | |
| 412 | - await emit(AgentEvent( | |
| 413 | - type="stream", | |
| 414 | - content=chunk.content, | |
| 415 | - is_stream_end=chunk.is_done, | |
| 416 | - )) | |
| 417 | - full_content += chunk.content | |
| 418 | - | |
| 419 | - # Add to history | |
| 420 | - self.session.append(Message(role=Role.ASSISTANT, content=full_content)) | |
| 421 | - | |
| 422 | - await emit(AgentEvent(type="response", content=full_content)) | |
| 423 | - return full_content | |
| 424 | - | |
| 425 | 378 | async def run( |
| 426 | 379 | self, |
| 427 | 380 | user_message: str, |
@@ -474,10 +427,11 @@ class Agent:
| 474 | 427 | ) -> str: |
| 475 | 428 | """Internal run method that supports steering.""" |
| 476 | 429 | cfg = self.config.reasoning |
| 430 | + launcher = build_runtime_launcher(self) | |
| 477 | 431 | |
| 478 | 432 | # Fast path: conversational messages don't need tools |
| 479 | 433 | if is_conversational(user_message): |
| 480 | - return await self._handle_conversational(user_message, emit) | |
| 434 | + return await launcher.run_conversational(user_message, emit) | |
| 481 | 435 | |
| 482 | 436 | # Track original task for multi-turn conversations |
| 483 | 437 | # Only set on first non-conversational message |
### src/loader/runtime/chat_lane.py — added

@@ -0,0 +1,55 @@
| 1 | +"""Runtime-owned conversational fast path for non-tool chat turns.""" | |
| 2 | + | |
| 3 | +from __future__ import annotations | |
| 4 | + | |
| 5 | +from ..llm.base import Message, Role | |
| 6 | +from .bootstrap import RuntimeBootstrapSource | |
| 7 | +from .events import AgentEvent | |
| 8 | + | |
| 9 | +CHAT_SYSTEM_PROMPT = ( | |
| 10 | + "You are Loader, a friendly local coding assistant. " | |
| 11 | + "Respond naturally and briefly to conversational messages. " | |
| 12 | + "If the user wants to do a coding task, tell them to describe it. " | |
| 13 | + "Keep responses short (1-3 sentences)." | |
| 14 | +) | |
| 15 | + | |
| 16 | + | |
| 17 | +class ConversationalTurnRunner: | |
| 18 | + """Own the non-tool conversational fast path outside the agent shell.""" | |
| 19 | + | |
| 20 | + def __init__(self, source: RuntimeBootstrapSource) -> None: | |
| 21 | + self.source = source | |
| 22 | + | |
| 23 | + async def run(self, user_message: str, emit) -> str: | |
| 24 | + """Stream one short conversational reply and persist the transcript.""" | |
| 25 | + | |
| 26 | + await emit(AgentEvent(type="thinking")) | |
| 27 | + self.source.session.append(Message(role=Role.USER, content=user_message)) | |
| 28 | + | |
| 29 | + recent_messages = ( | |
| 30 | + self.source.session.messages[-4:] | |
| 31 | + if len(self.source.session.messages) > 4 | |
| 32 | + else self.source.session.messages | |
| 33 | + ) | |
| 34 | + chat_system = Message(role=Role.SYSTEM, content=CHAT_SYSTEM_PROMPT) | |
| 35 | + | |
| 36 | + full_content = "" | |
| 37 | + async for chunk in self.source.backend.stream( | |
| 38 | + messages=[chat_system] + recent_messages, | |
| 39 | + tools=None, | |
| 40 | + temperature=0.7, | |
| 41 | + max_tokens=256, | |
| 42 | + ): | |
| 43 | + if chunk.content: | |
| 44 | + await emit( | |
| 45 | + AgentEvent( | |
| 46 | + type="stream", | |
| 47 | + content=chunk.content, | |
| 48 | + is_stream_end=chunk.is_done, | |
| 49 | + ) | |
| 50 | + ) | |
| 51 | + full_content += chunk.content | |
| 52 | + | |
| 53 | + self.source.session.append(Message(role=Role.ASSISTANT, content=full_content)) | |
| 54 | + await emit(AgentEvent(type="response", content=full_content)) | |
| 55 | + return full_content | |
### src/loader/runtime/launcher.py — modified

@@ -3,6 +3,7 @@
| 3 | 3 | from __future__ import annotations |
| 4 | 4 | |
| 5 | 5 | from .bootstrap import RuntimeBootstrapSource |
| 6 | +from .chat_lane import ConversationalTurnRunner | |
| 6 | 7 | from .conversation import ConfirmationHandler, ConversationRuntime, EventSink, UserQuestionHandler |
| 7 | 8 | from .events import TurnSummary |
| 8 | 9 | from .explore import ExploreRuntime |
@@ -14,6 +15,16 @@ class RuntimeLauncher:
| 14 | 15 | def __init__(self, source: RuntimeBootstrapSource) -> None: |
| 15 | 16 | self.source = source |
| 16 | 17 | |
| 18 | + async def run_conversational( | |
| 19 | + self, | |
| 20 | + user_message: str, | |
| 21 | + emit: EventSink, | |
| 22 | + ) -> str: | |
| 23 | + """Run the runtime-owned conversational fast path.""" | |
| 24 | + | |
| 25 | + runner = ConversationalTurnRunner(self.source) | |
| 26 | + return await runner.run(user_message, emit) | |
| 27 | + | |
| 17 | 28 | async def run_turn( |
| 18 | 29 | self, |
| 19 | 30 | task: str, |