feat: devex help, add Makefile, ruff, pre-commit, and modernize CI

2026-04-29 01:31:41 +00:00 · 2026-03-09 20:36:51 -05:00 · 2026-03-09 20:36:51 -05:00 · f4d7e6a29e
commit f4d7e6a29e
parent 172a38c344
111 changed files with 11655 additions and 10200 deletions
--- a/gateway/platforms/base.py
+++ b/gateway/platforms/base.py
@ -13,20 +13,20 @@ import uuid
 from abc import ABC, abstractmethod

 logger = logging.getLogger(__name__)
+import sys
+from collections.abc import Awaitable, Callable
 from dataclasses import dataclass, field
 from datetime import datetime
-from pathlib import Path
-from typing import Dict, List, Optional, Any, Callable, Awaitable, Tuple
 from enum import Enum
-
-import sys
+from pathlib import Path
 from pathlib import Path as _Path
+from typing import Any
+
 sys.path.insert(0, str(_Path(__file__).resolve().parents[2]))

 from gateway.config import Platform, PlatformConfig
 from gateway.session import SessionSource

-
 # ---------------------------------------------------------------------------
 # Image cache utilities
 #
@ -251,6 +251,7 @@ def cleanup_document_cache(max_age_hours: int = 24) -> int:

 class MessageType(Enum):
    """Types of incoming messages."""
+
    TEXT = "text"
    LOCATION = "location"
    PHOTO = "photo"
@ -266,42 +267,43 @@ class MessageType(Enum):
 class MessageEvent:
    """
    Incoming message from a platform.
-    
+
    Normalized representation that all adapters produce.
    """
+
    # Message content
    text: str
    message_type: MessageType = MessageType.TEXT
-    
+
    # Source information
    source: SessionSource = None
-    
+
    # Original platform data
    raw_message: Any = None
-    message_id: Optional[str] = None
-    
+    message_id: str | None = None
+
    # Media attachments
-    media_urls: List[str] = field(default_factory=list)
-    media_types: List[str] = field(default_factory=list)
-    
+    media_urls: list[str] = field(default_factory=list)
+    media_types: list[str] = field(default_factory=list)
+
    # Reply context
-    reply_to_message_id: Optional[str] = None
-    
+    reply_to_message_id: str | None = None
+
    # Timestamps
    timestamp: datetime = field(default_factory=datetime.now)
-    
+
    def is_command(self) -> bool:
        """Check if this is a command message (e.g., /new, /reset)."""
        return self.text.startswith("/")
-    
-    def get_command(self) -> Optional[str]:
+
+    def get_command(self) -> str | None:
        """Extract command name if this is a command message."""
        if not self.is_command():
            return None
        # Split on space and get first word, strip the /
        parts = self.text.split(maxsplit=1)
        return parts[0][1:].lower() if parts else None
-    
+
    def get_command_args(self) -> str:
        """Get the arguments after a command."""
        if not self.is_command():
@ -310,91 +312,88 @@ class MessageEvent:
        return parts[1] if len(parts) > 1 else ""


-@dataclass 
+@dataclass
 class SendResult:
    """Result of sending a message."""
+
    success: bool
-    message_id: Optional[str] = None
-    error: Optional[str] = None
+    message_id: str | None = None
+    error: str | None = None
    raw_response: Any = None


 # Type for message handlers
-MessageHandler = Callable[[MessageEvent], Awaitable[Optional[str]]]
+MessageHandler = Callable[[MessageEvent], Awaitable[str | None]]


 class BasePlatformAdapter(ABC):
    """
    Base class for platform adapters.
-    
+
    Subclasses implement platform-specific logic for:
    - Connecting and authenticating
    - Receiving messages
    - Sending messages/responses
    - Handling media
    """
-    
+
    def __init__(self, config: PlatformConfig, platform: Platform):
        self.config = config
        self.platform = platform
-        self._message_handler: Optional[MessageHandler] = None
+        self._message_handler: MessageHandler | None = None
        self._running = False
-        
+
        # Track active message handlers per session for interrupt support
        # Key: session_key (e.g., chat_id), Value: (event, asyncio.Event for interrupt)
-        self._active_sessions: Dict[str, asyncio.Event] = {}
-        self._pending_messages: Dict[str, MessageEvent] = {}
-    
+        self._active_sessions: dict[str, asyncio.Event] = {}
+        self._pending_messages: dict[str, MessageEvent] = {}
+
    @property
    def name(self) -> str:
        """Human-readable name for this adapter."""
        return self.platform.value.title()
-    
+
    @property
    def is_connected(self) -> bool:
        """Check if adapter is currently connected."""
        return self._running
-    
+
    def set_message_handler(self, handler: MessageHandler) -> None:
        """
        Set the handler for incoming messages.
-        
+
        The handler receives a MessageEvent and should return
        an optional response string.
        """
        self._message_handler = handler
-    
+
    @abstractmethod
    async def connect(self) -> bool:
        """
        Connect to the platform and start receiving messages.
-        
+
        Returns True if connection was successful.
        """
        pass
-    
+
    @abstractmethod
    async def disconnect(self) -> None:
        """Disconnect from the platform."""
        pass
-    
+
    @abstractmethod
    async def send(
-        self,
-        chat_id: str,
-        content: str,
-        reply_to: Optional[str] = None,
-        metadata: Optional[Dict[str, Any]] = None
+        self, chat_id: str, content: str, reply_to: str | None = None, metadata: dict[str, Any] | None = None
    ) -> SendResult:
        """
        Send a message to a chat.
-        
+
        Args:
            chat_id: The chat/channel ID to send to
            content: Message content (may be markdown)
            reply_to: Optional message ID to reply to
            metadata: Additional platform-specific options
-        
+
        Returns:
            SendResult with success status and message ID
        """
@ -416,21 +415,21 @@ class BasePlatformAdapter(ABC):
    async def send_typing(self, chat_id: str) -> None:
        """
        Send a typing indicator.
-        
+
        Override in subclasses if the platform supports it.
        """
        pass
-    
+
    async def send_image(
        self,
        chat_id: str,
        image_url: str,
-        caption: Optional[str] = None,
-        reply_to: Optional[str] = None,
+        caption: str | None = None,
+        reply_to: str | None = None,
    ) -> SendResult:
        """
        Send an image natively via the platform API.
-        
+
        Override in subclasses to send images as proper attachments
        instead of plain-text URLs. Default falls back to sending the
        URL as a text message.
@ -438,87 +437,91 @@ class BasePlatformAdapter(ABC):
        # Fallback: send URL as text (subclasses override for native images)
        text = f"{caption}\n{image_url}" if caption else image_url
        return await self.send(chat_id=chat_id, content=text, reply_to=reply_to)
-    
+
    async def send_animation(
        self,
        chat_id: str,
        animation_url: str,
-        caption: Optional[str] = None,
-        reply_to: Optional[str] = None,
+        caption: str | None = None,
+        reply_to: str | None = None,
    ) -> SendResult:
        """
        Send an animated GIF natively via the platform API.
-        
+
        Override in subclasses to send GIFs as proper animations
        (e.g., Telegram send_animation) so they auto-play inline.
        Default falls back to send_image.
        """
        return await self.send_image(chat_id=chat_id, image_url=animation_url, caption=caption, reply_to=reply_to)
-    
+
    @staticmethod
    def _is_animation_url(url: str) -> bool:
        """Check if a URL points to an animated GIF (vs a static image)."""
-        lower = url.lower().split('?')[0]  # Strip query params
-        return lower.endswith('.gif')
+        lower = url.lower().split("?")[0]  # Strip query params
+        return lower.endswith(".gif")

    @staticmethod
-    def extract_images(content: str) -> Tuple[List[Tuple[str, str]], str]:
+    def extract_images(content: str) -> tuple[list[tuple[str, str]], str]:
        """
        Extract image URLs from markdown and HTML image tags in a response.
-        
+
        Finds patterns like:
        - ![alt text](https://example.com/image.png)
        - <img src="https://example.com/image.png">
        - <img src="https://example.com/image.png"></img>
-        
+
        Args:
            content: The response text to scan.
-        
+
        Returns:
            Tuple of (list of (url, alt_text) pairs, cleaned content with image tags removed).
        """
        images = []
        cleaned = content
-        
+
        # Match markdown images: ![alt](url)
-        md_pattern = r'!\[([^\]]*)\]\((https?://[^\s\)]+)\)'
+        md_pattern = r"!\[([^\]]*)\]\((https?://[^\s\)]+)\)"
        for match in re.finditer(md_pattern, content):
            alt_text = match.group(1)
            url = match.group(2)
            # Only extract URLs that look like actual images
-            if any(url.lower().endswith(ext) or ext in url.lower() for ext in
-                   ['.png', '.jpg', '.jpeg', '.gif', '.webp', 'fal.media', 'fal-cdn', 'replicate.delivery']):
+            if any(
+                url.lower().endswith(ext) or ext in url.lower()
+                for ext in [".png", ".jpg", ".jpeg", ".gif", ".webp", "fal.media", "fal-cdn", "replicate.delivery"]
+            ):
                images.append((url, alt_text))
-        
+
        # Match HTML img tags: <img src="url"> or <img src="url"></img> or <img src="url"/>
        html_pattern = r'<img\s+src=["\']?(https?://[^\s"\'<>]+)["\']?\s*/?>\s*(?:</img>)?'
        for match in re.finditer(html_pattern, content):
            url = match.group(1)
            images.append((url, ""))
-        
+
        # Remove only the matched image tags from content (not all markdown images)
        if images:
            extracted_urls = {url for url, _ in images}
+
            def _remove_if_extracted(match):
                url = match.group(2) if match.lastindex >= 2 else match.group(1)
-                return '' if url in extracted_urls else match.group(0)
+                return "" if url in extracted_urls else match.group(0)
+
            cleaned = re.sub(md_pattern, _remove_if_extracted, cleaned)
            cleaned = re.sub(html_pattern, _remove_if_extracted, cleaned)
            # Clean up leftover blank lines
-            cleaned = re.sub(r'\n{3,}', '\n\n', cleaned).strip()
-        
+            cleaned = re.sub(r"\n{3,}", "\n\n", cleaned).strip()
+
        return images, cleaned
-    
+
    async def send_voice(
        self,
        chat_id: str,
        audio_path: str,
-        caption: Optional[str] = None,
-        reply_to: Optional[str] = None,
+        caption: str | None = None,
+        reply_to: str | None = None,
    ) -> SendResult:
        """
        Send an audio file as a native voice message via the platform API.
-        
+
        Override in subclasses to send audio as voice bubbles (Telegram)
        or file attachments (Discord). Default falls back to sending the
        file path as text.
@ -532,8 +535,8 @@ class BasePlatformAdapter(ABC):
        self,
        chat_id: str,
        video_path: str,
-        caption: Optional[str] = None,
-        reply_to: Optional[str] = None,
+        caption: str | None = None,
+        reply_to: str | None = None,
    ) -> SendResult:
        """
        Send a video natively via the platform API.
@ -550,9 +553,9 @@ class BasePlatformAdapter(ABC):
        self,
        chat_id: str,
        file_path: str,
-        caption: Optional[str] = None,
-        file_name: Optional[str] = None,
-        reply_to: Optional[str] = None,
+        caption: str | None = None,
+        file_name: str | None = None,
+        reply_to: str | None = None,
    ) -> SendResult:
        """
        Send a document/file natively via the platform API.
@ -569,8 +572,8 @@ class BasePlatformAdapter(ABC):
        self,
        chat_id: str,
        image_path: str,
-        caption: Optional[str] = None,
-        reply_to: Optional[str] = None,
+        caption: str | None = None,
+        reply_to: str | None = None,
    ) -> SendResult:
        """
        Send a local image file natively via the platform API.
@ -585,45 +588,45 @@ class BasePlatformAdapter(ABC):
        return await self.send(chat_id=chat_id, content=text, reply_to=reply_to)

    @staticmethod
-    def extract_media(content: str) -> Tuple[List[Tuple[str, bool]], str]:
+    def extract_media(content: str) -> tuple[list[tuple[str, bool]], str]:
        """
        Extract MEDIA:<path> tags and [[audio_as_voice]] directives from response text.
-        
+
        The TTS tool returns responses like:
            [[audio_as_voice]]
            MEDIA:/path/to/audio.ogg
-        
+
        Args:
            content: The response text to scan.
-        
+
        Returns:
            Tuple of (list of (path, is_voice) pairs, cleaned content with tags removed).
        """
        media = []
        cleaned = content
-        
+
        # Check for [[audio_as_voice]] directive
        has_voice_tag = "[[audio_as_voice]]" in content
        cleaned = cleaned.replace("[[audio_as_voice]]", "")
-        
+
        # Extract MEDIA:<path> tags (path may contain spaces)
-        media_pattern = r'MEDIA:(\S+)'
+        media_pattern = r"MEDIA:(\S+)"
        for match in re.finditer(media_pattern, content):
            path = match.group(1).strip()
            if path:
                media.append((path, has_voice_tag))
-        
+
        # Remove MEDIA tags from content
        if media:
-            cleaned = re.sub(media_pattern, '', cleaned)
-            cleaned = re.sub(r'\n{3,}', '\n\n', cleaned).strip()
-        
+            cleaned = re.sub(media_pattern, "", cleaned)
+            cleaned = re.sub(r"\n{3,}", "\n\n", cleaned).strip()
+
        return media, cleaned
-    
+
    async def _keep_typing(self, chat_id: str, interval: float = 2.0) -> None:
        """
        Continuously send typing indicator until cancelled.
-        
+
        Telegram/Discord typing status expires after ~5 seconds, so we refresh every 2
        to recover quickly after progress messages interrupt it.
        """
@ -633,20 +636,20 @@ class BasePlatformAdapter(ABC):
                await asyncio.sleep(interval)
        except asyncio.CancelledError:
            pass  # Normal cancellation when handler completes
-    
+
    async def handle_message(self, event: MessageEvent) -> None:
        """
        Process an incoming message.
-        
+
        This method returns quickly by spawning background tasks.
        This allows new messages to be processed even while an agent is running,
        enabling interruption support.
        """
        if not self._message_handler:
            return
-        
+
        session_key = event.source.chat_id
-        
+
        # Check if there's already an active handler for this session
        if session_key in self._active_sessions:
            # Store this as a pending message - it will interrupt the running agent
@ -655,10 +658,10 @@ class BasePlatformAdapter(ABC):
            # Signal the interrupt (the processing task checks this)
            self._active_sessions[session_key].set()
            return  # Don't process now - will be handled after current task finishes
-        
+
        # Spawn background task to process this message
        asyncio.create_task(self._process_message_background(event, session_key))
-    
+
    @staticmethod
    def _get_human_delay() -> float:
        """
@ -685,35 +688,40 @@ class BasePlatformAdapter(ABC):
        # Create interrupt event for this session
        interrupt_event = asyncio.Event()
        self._active_sessions[session_key] = interrupt_event
-        
+
        # Start continuous typing indicator (refreshes every 2 seconds)
        typing_task = asyncio.create_task(self._keep_typing(event.source.chat_id))
-        
+
        try:
            # Call the handler (this can take a while with tool calls)
            response = await self._message_handler(event)
-            
+
            # Send response if any
            if not response:
                logger.warning("[%s] Handler returned empty/None response for %s", self.name, event.source.chat_id)
            if response:
                # Extract MEDIA:<path> tags (from TTS tool) before other processing
                media_files, response = self.extract_media(response)
-                
+
                # Extract image URLs and send them as native platform attachments
                images, text_content = self.extract_images(response)
                if images:
-                    logger.info("[%s] extract_images found %d image(s) in response (%d chars)", self.name, len(images), len(response))
-                
+                    logger.info(
+                        "[%s] extract_images found %d image(s) in response (%d chars)",
+                        self.name,
+                        len(images),
+                        len(response),
+                    )
+
                # Send the text portion first (if any remains after extractions)
                if text_content:
-                    logger.info("[%s] Sending response (%d chars) to %s", self.name, len(text_content), event.source.chat_id)
-                    result = await self.send(
-                        chat_id=event.source.chat_id,
-                        content=text_content,
-                        reply_to=event.message_id
+                    logger.info(
+                        "[%s] Sending response (%d chars) to %s", self.name, len(text_content), event.source.chat_id
                    )
-                    
+                    result = await self.send(
+                        chat_id=event.source.chat_id, content=text_content, reply_to=event.message_id
+                    )
+
                    # Log send failures (don't raise - user already saw tool progress)
                    if not result.success:
                        print(f"[{self.name}] Failed to send response: {result.error}")
@ -721,14 +729,14 @@ class BasePlatformAdapter(ABC):
                        fallback_result = await self.send(
                            chat_id=event.source.chat_id,
                            content=f"(Response formatting failed, plain text:)\n\n{text_content[:3500]}",
-                            reply_to=event.message_id
+                            reply_to=event.message_id,
                        )
                        if not fallback_result.success:
                            print(f"[{self.name}] Fallback send also failed: {fallback_result.error}")
-                
+
                # Human-like pacing delay between text and media
                human_delay = self._get_human_delay()
-                
+
                # Send extracted images as native attachments
                if images:
                    logger.info("[%s] Extracted %d image(s) to send as attachments", self.name, len(images))
@ -736,7 +744,12 @@ class BasePlatformAdapter(ABC):
                    if human_delay > 0:
                        await asyncio.sleep(human_delay)
                    try:
-                        logger.info("[%s] Sending image: %s (alt=%s)", self.name, image_url[:80], alt_text[:30] if alt_text else "")
+                        logger.info(
+                            "[%s] Sending image: %s (alt=%s)",
+                            self.name,
+                            image_url[:80],
+                            alt_text[:30] if alt_text else "",
+                        )
                        # Route animated GIFs through send_animation for proper playback
                        if self._is_animation_url(image_url):
                            img_result = await self.send_animation(
@ -754,11 +767,11 @@ class BasePlatformAdapter(ABC):
                            logger.error("[%s] Failed to send image: %s", self.name, img_result.error)
                    except Exception as img_err:
                        logger.error("[%s] Error sending image: %s", self.name, img_err, exc_info=True)
-                
+
                # Send extracted media files — route by file type
-                _AUDIO_EXTS = {'.ogg', '.opus', '.mp3', '.wav', '.m4a'}
-                _VIDEO_EXTS = {'.mp4', '.mov', '.avi', '.mkv', '.3gp'}
-                _IMAGE_EXTS = {'.jpg', '.jpeg', '.png', '.webp', '.gif'}
+                _AUDIO_EXTS = {".ogg", ".opus", ".mp3", ".wav", ".m4a"}
+                _VIDEO_EXTS = {".mp4", ".mov", ".avi", ".mkv", ".3gp"}
+                _IMAGE_EXTS = {".jpg", ".jpeg", ".png", ".webp", ".gif"}

                for media_path, is_voice in media_files:
                    if human_delay > 0:
@ -790,7 +803,7 @@ class BasePlatformAdapter(ABC):
                            print(f"[{self.name}] Failed to send media ({ext}): {media_result.error}")
                    except Exception as media_err:
                        print(f"[{self.name}] Error sending media: {media_err}")
-            
+
            # Check if there's a pending message that was queued during our processing
            if session_key in self._pending_messages:
                pending_event = self._pending_messages.pop(session_key)
@ -806,10 +819,11 @@ class BasePlatformAdapter(ABC):
                # Process pending message in new background task
                await self._process_message_background(pending_event, session_key)
                return  # Already cleaned up
-                
+
        except Exception as e:
            print(f"[{self.name}] Error handling message: {e}")
            import traceback
+
            traceback.print_exc()
        finally:
            # Stop typing indicator
@ -821,26 +835,26 @@ class BasePlatformAdapter(ABC):
            # Clean up session tracking
            if session_key in self._active_sessions:
                del self._active_sessions[session_key]
-    
+
    def has_pending_interrupt(self, session_key: str) -> bool:
        """Check if there's a pending interrupt for a session."""
        return session_key in self._active_sessions and self._active_sessions[session_key].is_set()
-    
-    def get_pending_message(self, session_key: str) -> Optional[MessageEvent]:
+
+    def get_pending_message(self, session_key: str) -> MessageEvent | None:
        """Get and clear any pending message for a session."""
        return self._pending_messages.pop(session_key, None)
-    
+
    def build_source(
        self,
        chat_id: str,
-        chat_name: Optional[str] = None,
+        chat_name: str | None = None,
        chat_type: str = "dm",
-        user_id: Optional[str] = None,
-        user_name: Optional[str] = None,
-        thread_id: Optional[str] = None,
-        chat_topic: Optional[str] = None,
-        user_id_alt: Optional[str] = None,
-        chat_id_alt: Optional[str] = None,
+        user_id: str | None = None,
+        user_name: str | None = None,
+        thread_id: str | None = None,
+        chat_topic: str | None = None,
+        user_id_alt: str | None = None,
+        chat_id_alt: str | None = None,
    ) -> SessionSource:
        """Helper to build a SessionSource for this platform."""
        # Normalize empty topic to None
@ -858,30 +872,30 @@ class BasePlatformAdapter(ABC):
            user_id_alt=user_id_alt,
            chat_id_alt=chat_id_alt,
        )
-    
+
    @abstractmethod
-    async def get_chat_info(self, chat_id: str) -> Dict[str, Any]:
+    async def get_chat_info(self, chat_id: str) -> dict[str, Any]:
        """
        Get information about a chat/channel.
-        
+
        Returns dict with at least:
        - name: Chat name
        - type: "dm", "group", "channel"
        """
        pass
-    
+
    def format_message(self, content: str) -> str:
        """
        Format a message for this platform.
-        
+
        Override in subclasses to handle platform-specific formatting
        (e.g., Telegram MarkdownV2, Discord markdown).
-        
+
        Default implementation returns content as-is.
        """
        return content
-    
-    def truncate_message(self, content: str, max_length: int = 4096) -> List[str]:
+
+    def truncate_message(self, content: str, max_length: int = 4096) -> list[str]:
        """
        Split a long message into chunks, preserving code block boundaries.

@ -900,14 +914,14 @@ class BasePlatformAdapter(ABC):
        if len(content) <= max_length:
            return [content]

-        INDICATOR_RESERVE = 10   # room for " (XX/XX)"
+        INDICATOR_RESERVE = 10  # room for " (XX/XX)"
        FENCE_CLOSE = "\n```"

-        chunks: List[str] = []
+        chunks: list[str] = []
        remaining = content
        # When the previous chunk ended mid-code-block, this holds the
        # language tag (possibly "") so we can reopen the fence.
-        carry_lang: Optional[str] = None
+        carry_lang: str | None = None

        while remaining:
            # If we're continuing a code block from the previous chunk,
@ -965,8 +979,6 @@ class BasePlatformAdapter(ABC):
        # Append chunk indicators when the response spans multiple messages
        if len(chunks) > 1:
            total = len(chunks)
-            chunks = [
-                f"{chunk} ({i + 1}/{total})" for i, chunk in enumerate(chunks)
-            ]
+            chunks = [f"{chunk} ({i + 1}/{total})" for i, chunk in enumerate(chunks)]

        return chunks