Merge pull request #12 from livekit-examples/bcherry/improvements

bcherry · web-flow · commit d0f967cebd5f · 2025-08-07T19:38:13.000-04:00
Add latest agent improvements
diff --git a/pyproject.toml b/pyproject.toml
@@ -10,7 +10,7 @@ requires-python = ">=3.9"
 
 dependencies = [
     "livekit-agents[openai,turn-detector,silero,cartesia,deepgram]~=1.2",
-    "livekit-plugins-noise-cancellation~=0.2.1",
+    "livekit-plugins-noise-cancellation~=0.2",
     "python-dotenv",
 ]
 
diff --git a/src/agent.py b/src/agent.py
@@ -2,19 +2,20 @@
 
 from dotenv import load_dotenv
 from livekit.agents import (
+    NOT_GIVEN,
     Agent,
+    AgentFalseInterruptionEvent,
     AgentSession,
     JobContext,
     JobProcess,
+    MetricsCollectedEvent,
     RoomInputOptions,
-    RoomOutputOptions,
     RunContext,
     WorkerOptions,
     cli,
     metrics,
 )
 from livekit.agents.llm import function_tool
-from livekit.agents.voice import MetricsCollectedEvent
 from livekit.plugins import cartesia, deepgram, noise_cancellation, openai, silero
 from livekit.plugins.turn_detector.multilingual import MultilingualModel
 
@@ -28,7 +29,7 @@ def __init__(self) -> None:
         super().__init__(
             instructions="""You are a helpful voice AI assistant.
             You eagerly assist users with their questions by providing information from your extensive knowledge.
-            Your responses are concise, to the point, and without any complex formatting or punctuation.
+            Your responses are concise, to the point, and without any complex formatting or punctuation including emojis, asterisks, or other symbols.
             You are curious, friendly, and have a sense of humor.""",
         )
 
@@ -75,6 +76,9 @@ async def entrypoint(ctx: JobContext):
         # See more at https://docs.livekit.io/agents/build/turns
         turn_detection=MultilingualModel(),
         vad=ctx.proc.userdata["vad"],
+        # allow the LLM to generate a response while waiting for the end of turn
+        # See more at https://docs.livekit.io/agents/build/audio/#preemptive-generation
+        preemptive_generation=True,
     )
 
     # To use a realtime model instead of a voice pipeline, use the following session setup instead:
@@ -83,6 +87,13 @@ async def entrypoint(ctx: JobContext):
     #     llm=openai.realtime.RealtimeModel()
     # )
 
+    # Background noise can sometimes interrupt the agent's speech; these are considered false-positive interruptions.
+    # When one is detected, you may resume the agent's speech.
+    @session.on("agent_false_interruption")
+    def _on_agent_false_interruption(ev: AgentFalseInterruptionEvent):
+        logger.info("false positive interruption, resuming")
+        session.generate_reply(instructions=ev.extra_instructions or NOT_GIVEN)
+
     # Metrics collection, to measure pipeline performance
     # For more information, see https://docs.livekit.io/agents/build/metrics/
     usage_collector = metrics.UsageCollector()

Original file line number	Diff line number	Diff line change
`@@ -10,7 +10,7 @@ requires-python = ">=3.9"`
`10`	`10`
`11`	`11`	`dependencies = [`
`12`	`12`	`"livekit-agents[openai,turn-detector,silero,cartesia,deepgram]~=1.2",`
`13`		`- "livekit-plugins-noise-cancellation~=0.2.1",`
	`13`	`+ "livekit-plugins-noise-cancellation~=0.2",`
`14`	`14`	`"python-dotenv",`
`15`	`15`	`]`
`16`	`16`