Add Text-to-Speech (TTS) support with Edge TTS and ElevenLabs integration

- Updated `pyproject.toml` to add Edge TTS as a core dependency and ElevenLabs as the optional `tts-premium` extra.
- Enhanced documentation to detail voice message capabilities across platforms and TTS provider options.
- Modified the GatewayRunner to handle MEDIA tags from TTS tool responses, ensuring proper delivery of audio messages.
2026-04-25 00:51:20 +00:00 · 2026-02-14 16:08:14 -08:00 · 2026-02-14 16:08:14 -08:00 · 586b0a7047
commit 586b0a7047
parent 84718d183a
4 changed files with 62 additions and 7 deletions
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -27,6 +27,8 @@ dependencies = [
  # Tools
  "firecrawl-py",
  "fal-client",
+  # Text-to-speech (Edge TTS is free, no API key needed)
+  "edge-tts",
  # mini-swe-agent deps (terminal tool)
  "litellm>=1.75.5",
  "typer",
@@ -39,12 +41,14 @@ dev = ["pytest", "pytest-asyncio"]
 messaging = ["python-telegram-bot>=20.0", "discord.py>=2.0", "aiohttp>=3.9.0"]
 cron = ["croniter"]
 cli = ["simple-term-menu"]
+tts-premium = ["elevenlabs"]
 all = [
  "hermes-agent[modal]",
  "hermes-agent[messaging]",
  "hermes-agent[cron]",
  "hermes-agent[cli]",
  "hermes-agent[dev]",
+  "hermes-agent[tts-premium]",
 ]

 [project.scripts]