 
 from dotenv import load_dotenv
 from livekit.agents import (
+    Agent,
+    AgentSession,
     AutoSubscribe,
     JobContext,
     JobProcess,
     WorkerOptions,
     cli,
-    llm,
     metrics,
+    RoomInputOptions,
 )
-from livekit.agents.pipeline import VoicePipelineAgent
 from livekit.plugins import (
     cartesia,
     openai,
     deepgram,
     noise_cancellation,
     silero,
-    turn_detector,
 )
+from livekit.plugins.turn_detector.multilingual import MultilingualModel
 
 
 load_dotenv(dotenv_path=".env.local")
 logger = logging.getLogger("voice-agent")
 
 
+class Assistant(Agent):
+    def __init__(self) -> None:
+        # This project is configured to use Deepgram STT, OpenAI LLM and Cartesia TTS plugins
+        # Other great providers exist like Cerebras, ElevenLabs, Groq, Play.ht, Rime, and more
+        # Learn more and pick the best one for your app:
+        # https://docs.livekit.io/agents/plugins
+        super().__init__(
+            instructions="You are a voice assistant created by LiveKit. Your interface with users will be voice. "
+            "You should use short and concise responses, and avoid usage of unpronounceable punctuation. "
+            "You were created as a demo to showcase the capabilities of LiveKit's agents framework.",
+            stt=deepgram.STT(),
+            llm=openai.LLM(model="gpt-4o-mini"),
+            tts=cartesia.TTS(),
+            # use LiveKit's transformer-based turn detector
+            turn_detection=MultilingualModel(),
+        )
+
+    async def on_enter(self):
+        # The agent should be polite and greet the user when it joins :)
+        self.session.generate_reply(
+            instructions="Hey, how can I help you today?", allow_interruptions=True
+        )
+
+
 def prewarm(proc: JobProcess):
     proc.userdata["vad"] = silero.VAD.load()
 
 
 async def entrypoint(ctx: JobContext):
-    initial_ctx = llm.ChatContext().append(
-        role="system",
-        text=(
-            "You are a voice assistant created by LiveKit. Your interface with users will be voice. "
-            "You should use short and concise responses, and avoid usage of unpronounceable punctuation. "
-            "You were created as a demo to showcase the capabilities of LiveKit's agents framework."
-        ),
-    )
-
     logger.info(f"connecting to room {ctx.room.name}")
     await ctx.connect(auto_subscribe=AutoSubscribe.AUDIO_ONLY)
 
     # Wait for the first participant to connect
     participant = await ctx.wait_for_participant()
     logger.info(f"starting voice assistant for participant {participant.identity}")
 
-    # This project is configured to use Deepgram STT, OpenAI LLM and Cartesia TTS plugins
-    # Other great providers exist like Cerebras, ElevenLabs, Groq, Play.ht, Rime, and more
-    # Learn more and pick the best one for your app:
-    # https://docs.livekit.io/agents/plugins
-    agent = VoicePipelineAgent(
+    usage_collector = metrics.UsageCollector()
+
+    # Log metrics and collect usage data
+    def on_metrics_collected(agent_metrics: metrics.AgentMetrics):
+        metrics.log_metrics(agent_metrics)
+        usage_collector.collect(agent_metrics)
+
+    session = AgentSession(
         vad=ctx.proc.userdata["vad"],
-        stt=deepgram.STT(),
-        llm=openai.LLM(model="gpt-4o-mini"),
-        tts=cartesia.TTS(),
-        # use LiveKit's transformer-based turn detector
-        turn_detector=turn_detector.EOUModel(),
         # minimum delay for endpointing, used when the turn detector believes the user is done with their turn
         min_endpointing_delay=0.5,
         # maximum delay for endpointing, used when the turn detector does not believe the user is done with their turn
         max_endpointing_delay=5.0,
-        # enable background voice & noise cancellation, powered by Krisp
-        # included at no additional cost with LiveKit Cloud
-        noise_cancellation=noise_cancellation.BVC(),
-        chat_ctx=initial_ctx,
     )
 
-    usage_collector = metrics.UsageCollector()
+    # Trigger the on_metrics_collected function when metrics are collected
+    session.on("metrics_collected", on_metrics_collected)
 
-    @agent.on("metrics_collected")
-    def on_metrics_collected(agent_metrics: metrics.AgentMetrics):
-        metrics.log_metrics(agent_metrics)
-        usage_collector.collect(agent_metrics)
-
-    agent.start(ctx.room, participant)
-
-    # The agent should be polite and greet the user when it joins :)
-    await agent.say("Hey, how can I help you today?", allow_interruptions=True)
+    await session.start(
+        room=ctx.room,
+        agent=Assistant(),
+        room_input_options=RoomInputOptions(
+            # enable background voice & noise cancellation, powered by Krisp
+            # included at no additional cost with LiveKit Cloud
+            noise_cancellation=noise_cancellation.BVC(),
+        ),
+    )
 
 
 if __name__ == "__main__":
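
Note: the diff view is truncated here, so the body of the __main__ guard is not shown. In LiveKit's agent examples this block conventionally hands the entrypoint and prewarm functions to the worker CLI; a minimal sketch of what the remainder most likely looks like, offered as an assumption since the actual lines are cut off above:

    if __name__ == "__main__":
        # Hand the entrypoint and prewarm hooks to the worker CLI
        # (assumed continuation; not visible in this diff)
        cli.run_app(
            WorkerOptions(
                entrypoint_fnc=entrypoint,
                prewarm_fnc=prewarm,
            )
        )

With that in place, the worker runs locally through the CLI that cli.run_app provides, e.g. the dev subcommand, after fetching the turn-detector model weights with the download-files subcommand (the filename agent.py is an assumption here): python agent.py download-files, then python agent.py dev.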
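One more note on the metrics wiring: the new code creates a UsageCollector and registers on_metrics_collected, but nothing in this diff reads the collected totals back. The upstream examples typically log an aggregate at shutdown; a minimal sketch of that pattern, placed inside entrypoint after the handler is registered (not part of this commit):

    async def log_usage():
        # Summarize the LLM/STT/TTS usage gathered by the UsageCollector
        summary = usage_collector.get_summary()
        logger.info(f"Usage: {summary}")

    # Run the summary logger when the job shuts down
    ctx.add_shutdown_callback(log_usage)

Also worth knowing: depending on the livekit-agents 1.x release, the metrics_collected event may deliver a MetricsCollectedEvent wrapper rather than an AgentMetrics object directly, in which case the handler should accept the event and read its .metrics attribute.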