atropos/environments/community/router_env/engine/agents/gmail_agent.py

84 lines
2.6 KiB
Python

import logging
import os
from typing import List, Optional
from dotenv import load_dotenv
from livekit.agents import (
Agent,
AgentSession,
ChatContext,
JobContext,
WorkerOptions,
cli,
function_tool,
mcp,
)
from livekit.plugins import deepgram, openai, silero
from livekit.plugins.turn_detector.multilingual import MultilingualModel
load_dotenv(os.path.join(os.path.dirname(__file__), "..", "..", ".env"))
logger = logging.getLogger("gmail-agent")
class GmailAgent(Agent):
def __init__(
self, chat_ctx: ChatContext, tools: Optional[List[function_tool]] = None
) -> None:
final_instructions = (
"You are a Gmail specialist. You can manage emails by reading, searching, sending, and "
"updating them (e.g., marking as read/unread, moving to folders). "
+ "Use tools like 'read_emails', 'send_email', and 'update_email' to interact with Gmail. "
+ "If sending an email, you might need a recipient; you know Gabin (gabin.fay@gmail.com). "
+ "If your task is complete or the user asks for something outside your email management "
"capabilities (e.g., math, calendar), "
+ "you MUST use the 'delegate_to_router_agent' tool to return to the main assistant."
)
all_tools = tools if tools is not None else []
mcp_servers_list = []
gumloop_mcp_url = os.getenv("GUMLOOP_GMAIL_MCP_URL")
if gumloop_mcp_url:
mcp_servers_list.append(
mcp.MCPServerHTTP(
url=gumloop_mcp_url,
timeout=5,
client_session_timeout_seconds=5,
)
)
else:
logger.warning(
"GUMLOOP_GMAIL_MCP_URL not set. Gmail agent may not have all its tools."
)
super().__init__(
instructions=final_instructions,
chat_ctx=chat_ctx,
allow_interruptions=True,
mcp_servers=mcp_servers_list,
tools=all_tools,
)
async def on_enter(self):
self.session.generate_reply()
async def entrypoint(ctx: JobContext):
await ctx.connect()
session = AgentSession(
vad=silero.VAD.load(),
stt=deepgram.STT(model="nova-3", language="multi"),
llm=openai.LLM(model="gpt-4o-mini"),
tts=openai.TTS(voice="alloy"),
turn_detection=MultilingualModel(),
)
await session.start(agent=GmailAgent(chat_ctx=session._chat_ctx), room=ctx.room)
if __name__ == "__main__":
cli.run_app(WorkerOptions(entrypoint_fnc=entrypoint))