cartesia-ai · drago-balto · Apr 11, 2026 · cursor · Apr 13, 2026
diff --git a/line/events.py b/line/events.py
@@ -41,11 +41,13 @@ class AgentToolReturned(BaseModel):
 
 class AgentEndCall(BaseModel):
     type: Literal["end_call"] = "end_call"
+    after_speech: bool = False  # True: send only after pending agent speech has finished
 
 
 class AgentTransferCall(BaseModel):
     type: Literal["agent_transfer_call"] = "agent_transfer_call"
     target_phone_number: str
+    after_speech: bool = False  # True: send only after pending agent speech has finished
 
 
 class AgentSendDtmf(BaseModel):

diff --git a/line/llm_agent/tools/system.py b/line/llm_agent/tools/system.py
@@ -207,7 +207,7 @@ async def _end_call_impl(
             ctx: ToolEnv,
             reason: Annotated[str, "The reason for ending the call"],
         ):
-            yield AgentEndCall()
+            yield AgentEndCall(after_speech=True)
 
         return construct_function_tool(
             _end_call_impl,
@@ -463,7 +463,7 @@ async def transfer_call(
 
     if message is not None:
         yield AgentSendText(text=message)
-    yield AgentTransferCall(target_phone_number=normalized_number)
+    yield AgentTransferCall(target_phone_number=normalized_number, after_speech=True)
 
 
 def agent_as_handoff(

diff --git a/line/voice_agent_app.py b/line/voice_agent_app.py
@@ -290,6 +290,7 @@ def __init__(self, websocket: WebSocket, agent_spec: AgentSpec, env: AgentEnv):
         self.env = env
         # Lazy-init: asyncio.Event() requires a running event loop on Python 3.9.
         self._shutdown_event: Optional[asyncio.Event] = None
+        self._speech_done: Optional[asyncio.Event] = None
         self.history: List[InputEvent] = []
         self.emitted_agent_text: List[Tuple[str, bool]] = []  # (content, interruptible)
 
@@ -302,6 +303,14 @@ def shutdown_event(self) -> asyncio.Event:
             self._shutdown_event = asyncio.Event()
         return self._shutdown_event
 
+    @property
+    def speech_done(self) -> asyncio.Event:
+        """Lazily created event that is set while the agent is not speaking (TTS idle)."""
+        if self._speech_done is None:
+            self._speech_done = asyncio.Event()  # Created on first access, like shutdown_event
+            self._speech_done.set()  # Start in "done" state (no speech pending)
+        return self._speech_done
+
     ######### Initialization Methods #########
 
     def _prepare_agent(
@@ -423,16 +432,28 @@ async def _start_agent_task(self, turn_env: TurnEnv, event: InputEvent) -> None:
         await self._cancel_agent_task()
 
         async def runner():
+            has_sent_text = False
             try:
                 async for output in self.agent_callable(turn_env, event):
                     if isinstance(output, AgentSendText):
                         self.emitted_agent_text.append((output.text, output.interruptible))
+                        has_sent_text = True
                     mapped = self._map_output_event(output)
 
                     if self.shutdown_event.is_set():
                         break
                     if mapped is None:
                         continue
+                    # Wait for TTS to finish speaking before sending after_speech events
+                    if getattr(output, "after_speech", False) and has_sent_text:
+                        try:
+                            await asyncio.wait_for(self.speech_done.wait(), timeout=30.0)
+                        except asyncio.TimeoutError:
+                            logger.warning(
+                                f"Timed out waiting for speech to complete before {type(output).__name__}"
+                            )
+                    if isinstance(output, AgentSendText) and output.text:
+                        self.speech_done.clear()  # Speech pending until TTS reports idle
                     await self.websocket.send_json(mapped.model_dump())
             except asyncio.CancelledError:
                 pass
@@ -481,8 +502,10 @@ def _convert_input_message(self, message: InputMessage) -> Optional[InputEvent]:
 
         elif isinstance(message, AgentStateInput):
             if message.value == UserState.SPEAKING:
+                self.speech_done.clear()
                 return AgentTurnStarted()
             elif message.value == UserState.IDLE:
+                self.speech_done.set()
                 content = self._turn_content(
                     self.history,
                     AgentTurnStarted,