feat: devex help, add Makefile, ruff, pre-commit, and modernize CI

2026-04-28 01:21:43 +00:00 · 2026-03-09 20:36:51 -05:00 · 2026-03-09 20:36:51 -05:00 · f4d7e6a29e
commit f4d7e6a29e
parent 172a38c344
111 changed files with 11655 additions and 10200 deletions
--- a/tools/image_generation_tool.py
+++ b/tools/image_generation_tool.py
@ -2,7 +2,7 @@
 """
 Image Generation Tools Module

-This module provides image generation tools using FAL.ai's FLUX 2 Pro model with 
+This module provides image generation tools using FAL.ai's FLUX 2 Pro model with
 automatic upscaling via FAL.ai's Clarity Upscaler for enhanced image quality.

 Available tools:
@ -19,7 +19,7 @@ Features:
 Usage:
    from image_generation_tool import image_generate_tool
    import asyncio
-    
+
    # Generate and automatically upscale an image
    result = await image_generate_tool(
        prompt="A serene mountain landscape with cherry blossoms",
@ -28,12 +28,14 @@ Usage:
    )
 """

+import datetime
 import json
 import logging
 import os
-import datetime
-from typing import Dict, Any, Optional, Union
+from typing import Any
+
 import fal_client
+
 from tools.debug_helpers import DebugSession

 logger = logging.getLogger(__name__)
@ -51,11 +53,7 @@ ENABLE_SAFETY_CHECKER = False
 SAFETY_TOLERANCE = "5"  # Maximum tolerance (1-5, where 5 is most permissive)

 # Aspect ratio mapping - simplified choices for model to select
-ASPECT_RATIO_MAP = {
-    "landscape": "landscape_16_9",
-    "square": "square_hd",
-    "portrait": "portrait_16_9"
-}
+ASPECT_RATIO_MAP = {"landscape": "landscape_16_9", "square": "square_hd", "portrait": "portrait_16_9"}
 VALID_ASPECT_RATIOS = list(ASPECT_RATIO_MAP.keys())

 # Configuration for automatic upscaling
@ -70,9 +68,7 @@ UPSCALER_GUIDANCE_SCALE = 4
 UPSCALER_NUM_INFERENCE_STEPS = 18

 # Valid parameter values for validation based on FLUX 2 Pro documentation
-VALID_IMAGE_SIZES = [
-    "square_hd", "square", "portrait_4_3", "portrait_16_9", "landscape_4_3", "landscape_16_9"
-]
+VALID_IMAGE_SIZES = ["square_hd", "square", "portrait_4_3", "portrait_16_9", "landscape_4_3", "landscape_16_9"]
 VALID_OUTPUT_FORMATS = ["jpeg", "png"]
 VALID_ACCELERATION_MODES = ["none", "regular", "high"]

@ -80,16 +76,16 @@ _debug = DebugSession("image_tools", env_var="IMAGE_TOOLS_DEBUG")


 def _validate_parameters(
-    image_size: Union[str, Dict[str, int]], 
+    image_size: str | dict[str, int],
    num_inference_steps: int,
    guidance_scale: float,
    num_images: int,
    output_format: str,
-    acceleration: str = "none"
-) -> Dict[str, Any]:
+    acceleration: str = "none",
+) -> dict[str, Any]:
    """
    Validate and normalize image generation parameters for FLUX 2 Pro model.
-    
+
    Args:
        image_size: Either a preset string or custom size dict
        num_inference_steps: Number of inference steps
@ -97,15 +93,15 @@ def _validate_parameters(
        num_images: Number of images to generate
        output_format: Output format for images
        acceleration: Acceleration mode for generation speed
-    
+
    Returns:
        Dict[str, Any]: Validated and normalized parameters
-    
+
    Raises:
        ValueError: If any parameter is invalid
    """
    validated = {}
-    
+
    # Validate image_size
    if isinstance(image_size, str):
        if image_size not in VALID_IMAGE_SIZES:
@ -123,52 +119,52 @@ def _validate_parameters(
        validated["image_size"] = image_size
    else:
        raise ValueError("image_size must be either a preset string or a dict with width/height")
-    
+
    # Validate num_inference_steps
    if not isinstance(num_inference_steps, int) or num_inference_steps < 1 or num_inference_steps > 100:
        raise ValueError("num_inference_steps must be an integer between 1 and 100")
    validated["num_inference_steps"] = num_inference_steps
-    
+
    # Validate guidance_scale (FLUX 2 Pro default is 4.5)
    if not isinstance(guidance_scale, (int, float)) or guidance_scale < 0.1 or guidance_scale > 20.0:
        raise ValueError("guidance_scale must be a number between 0.1 and 20.0")
    validated["guidance_scale"] = float(guidance_scale)
-    
+
    # Validate num_images
    if not isinstance(num_images, int) or num_images < 1 or num_images > 4:
        raise ValueError("num_images must be an integer between 1 and 4")
    validated["num_images"] = num_images
-    
+
    # Validate output_format
    if output_format not in VALID_OUTPUT_FORMATS:
        raise ValueError(f"Invalid output_format '{output_format}'. Must be one of: {VALID_OUTPUT_FORMATS}")
    validated["output_format"] = output_format
-    
+
    # Validate acceleration
    if acceleration not in VALID_ACCELERATION_MODES:
        raise ValueError(f"Invalid acceleration '{acceleration}'. Must be one of: {VALID_ACCELERATION_MODES}")
    validated["acceleration"] = acceleration
-    
+
    return validated


-def _upscale_image(image_url: str, original_prompt: str) -> Dict[str, Any]:
+def _upscale_image(image_url: str, original_prompt: str) -> dict[str, Any]:
    """
    Upscale an image using FAL.ai's Clarity Upscaler.
-    
+
    Uses the synchronous fal_client API to avoid event loop lifecycle issues
    when called from threaded contexts (e.g. gateway thread pool).
-    
+
    Args:
        image_url (str): URL of the image to upscale
        original_prompt (str): Original prompt used to generate the image
-    
+
    Returns:
        Dict[str, Any]: Upscaled image data or None if upscaling fails
    """
    try:
        logger.info("Upscaling image with Clarity Upscaler...")
-        
+
        # Prepare arguments for upscaler
        upscaler_arguments = {
            "image_url": image_url,
@ -179,35 +175,36 @@ def _upscale_image(image_url: str, original_prompt: str) -> Dict[str, Any]:
            "resemblance": UPSCALER_RESEMBLANCE,
            "guidance_scale": UPSCALER_GUIDANCE_SCALE,
            "num_inference_steps": UPSCALER_NUM_INFERENCE_STEPS,
-            "enable_safety_checker": UPSCALER_SAFETY_CHECKER
+            "enable_safety_checker": UPSCALER_SAFETY_CHECKER,
        }
-        
+
        # Use sync API — fal_client.submit() uses httpx.Client (no event loop).
        # The async API (submit_async) caches a global httpx.AsyncClient via
        # @cached_property, which breaks when asyncio.run() destroys the loop
        # between calls (gateway thread-pool pattern).
-        handler = fal_client.submit(
-            UPSCALER_MODEL,
-            arguments=upscaler_arguments
-        )
-        
+        handler = fal_client.submit(UPSCALER_MODEL, arguments=upscaler_arguments)
+
        # Get the upscaled result (sync — blocks until done)
        result = handler.get()
-        
+
        if result and "image" in result:
            upscaled_image = result["image"]
-            logger.info("Image upscaled successfully to %sx%s", upscaled_image.get('width', 'unknown'), upscaled_image.get('height', 'unknown'))
+            logger.info(
+                "Image upscaled successfully to %sx%s",
+                upscaled_image.get("width", "unknown"),
+                upscaled_image.get("height", "unknown"),
+            )
            return {
                "url": upscaled_image["url"],
                "width": upscaled_image.get("width", 0),
                "height": upscaled_image.get("height", 0),
                "upscaled": True,
-                "upscale_factor": UPSCALER_FACTOR
+                "upscale_factor": UPSCALER_FACTOR,
            }
        else:
            logger.error("Upscaler returned invalid response")
            return None
-            
+
    except Exception as e:
        logger.error("Error upscaling image: %s", e)
        return None
@ -220,16 +217,16 @@ def image_generate_tool(
    guidance_scale: float = DEFAULT_GUIDANCE_SCALE,
    num_images: int = DEFAULT_NUM_IMAGES,
    output_format: str = DEFAULT_OUTPUT_FORMAT,
-    seed: Optional[int] = None
+    seed: int | None = None,
 ) -> str:
    """
    Generate images from text prompts using FAL.ai's FLUX 2 Pro model with automatic upscaling.
-    
+
    Uses the synchronous fal_client API to avoid event loop lifecycle issues.
    The async API's global httpx.AsyncClient (cached via @cached_property) breaks
    when asyncio.run() destroys and recreates event loops between calls, which
    happens in the gateway's thread-pool pattern.
-    
+
    Args:
        prompt (str): The text prompt describing the desired image
        aspect_ratio (str): Image aspect ratio - "landscape", "square", or "portrait" (default: "landscape")
@ -238,7 +235,7 @@ def image_generate_tool(
        num_images (int): Number of images to generate (1-4, default: 1)
        output_format (str): Image format "jpeg" or "png" (default: "png")
        seed (Optional[int]): Random seed for reproducible results (optional)
-    
+
    Returns:
        str: JSON string containing minimal generation results:
             {
@ -252,7 +249,7 @@ def image_generate_tool(
        logger.warning("Invalid aspect_ratio '%s', defaulting to '%s'", aspect_ratio, DEFAULT_ASPECT_RATIO)
        aspect_ratio_lower = DEFAULT_ASPECT_RATIO
    image_size = ASPECT_RATIO_MAP[aspect_ratio_lower]
-    
+
    debug_call_data = {
        "parameters": {
            "prompt": prompt,
@ -262,32 +259,32 @@ def image_generate_tool(
            "guidance_scale": guidance_scale,
            "num_images": num_images,
            "output_format": output_format,
-            "seed": seed
+            "seed": seed,
        },
        "error": None,
        "success": False,
        "images_generated": 0,
-        "generation_time": 0
+        "generation_time": 0,
    }
-    
+
    start_time = datetime.datetime.now()
-    
+
    try:
        logger.info("Generating %s image(s) with FLUX 2 Pro: %s", num_images, prompt[:80])
-        
+
        # Validate prompt
        if not prompt or not isinstance(prompt, str) or len(prompt.strip()) == 0:
            raise ValueError("Prompt is required and must be a non-empty string")
-        
+
        # Check API key availability
        if not os.getenv("FAL_KEY"):
            raise ValueError("FAL_KEY environment variable not set")
-        
+
        # Validate other parameters
        validated_params = _validate_parameters(
            image_size, num_inference_steps, guidance_scale, num_images, output_format, "none"
        )
-        
+
        # Prepare arguments for FAL.ai FLUX 2 Pro API
        arguments = {
            "prompt": prompt.strip(),
@ -298,51 +295,44 @@ def image_generate_tool(
            "output_format": validated_params["output_format"],
            "enable_safety_checker": ENABLE_SAFETY_CHECKER,
            "safety_tolerance": SAFETY_TOLERANCE,
-            "sync_mode": True  # Use sync mode for immediate results
+            "sync_mode": True,  # Use sync mode for immediate results
        }
-        
+
        # Add seed if provided
        if seed is not None and isinstance(seed, int):
            arguments["seed"] = seed
-        
+
        logger.info("Submitting generation request to FAL.ai FLUX 2 Pro...")
        logger.info("  Model: %s", DEFAULT_MODEL)
        logger.info("  Aspect Ratio: %s -> %s", aspect_ratio_lower, image_size)
-        logger.info("  Steps: %s", validated_params['num_inference_steps'])
-        logger.info("  Guidance: %s", validated_params['guidance_scale'])
-        
+        logger.info("  Steps: %s", validated_params["num_inference_steps"])
+        logger.info("  Guidance: %s", validated_params["guidance_scale"])
+
        # Submit request to FAL.ai using sync API (avoids cached event loop issues)
-        handler = fal_client.submit(
-            DEFAULT_MODEL,
-            arguments=arguments
-        )
-        
+        handler = fal_client.submit(DEFAULT_MODEL, arguments=arguments)
+
        # Get the result (sync — blocks until done)
        result = handler.get()
-        
+
        generation_time = (datetime.datetime.now() - start_time).total_seconds()
-        
+
        # Process the response
        if not result or "images" not in result:
            raise ValueError("Invalid response from FAL.ai API - no images returned")
-        
+
        images = result.get("images", [])
        if not images:
            raise ValueError("No images were generated")
-        
+
        # Format image data and upscale images
        formatted_images = []
        for img in images:
            if isinstance(img, dict) and "url" in img:
-                original_image = {
-                    "url": img["url"],
-                    "width": img.get("width", 0),
-                    "height": img.get("height", 0)
-                }
-                
+                original_image = {"url": img["url"], "width": img.get("width", 0), "height": img.get("height", 0)}
+
                # Attempt to upscale the image
                upscaled_image = _upscale_image(img["url"], prompt.strip())
-                
+
                if upscaled_image:
                    # Use upscaled image if successful
                    formatted_images.append(upscaled_image)
@ -351,52 +341,48 @@ def image_generate_tool(
                    logger.warning("Using original image as fallback")
                    original_image["upscaled"] = False
                    formatted_images.append(original_image)
-        
+
        if not formatted_images:
            raise ValueError("No valid image URLs returned from API")
-        
+
        upscaled_count = sum(1 for img in formatted_images if img.get("upscaled", False))
-        logger.info("Generated %s image(s) in %.1fs (%s upscaled)", len(formatted_images), generation_time, upscaled_count)
-        
+        logger.info(
+            "Generated %s image(s) in %.1fs (%s upscaled)", len(formatted_images), generation_time, upscaled_count
+        )
+
        # Prepare successful response - minimal format
-        response_data = {
-            "success": True,
-            "image": formatted_images[0]["url"] if formatted_images else None
-        }
-        
+        response_data = {"success": True, "image": formatted_images[0]["url"] if formatted_images else None}
+
        debug_call_data["success"] = True
        debug_call_data["images_generated"] = len(formatted_images)
        debug_call_data["generation_time"] = generation_time
-        
+
        # Log debug information
        _debug.log_call("image_generate_tool", debug_call_data)
        _debug.save()
-        
+
        return json.dumps(response_data, indent=2, ensure_ascii=False)
-        
+
    except Exception as e:
        generation_time = (datetime.datetime.now() - start_time).total_seconds()
        error_msg = f"Error generating image: {str(e)}"
        logger.error("%s", error_msg)
-        
+
        # Prepare error response - minimal format
-        response_data = {
-            "success": False,
-            "image": None
-        }
-        
+        response_data = {"success": False, "image": None}
+
        debug_call_data["error"] = error_msg
        debug_call_data["generation_time"] = generation_time
        _debug.log_call("image_generate_tool", debug_call_data)
        _debug.save()
-        
+
        return json.dumps(response_data, indent=2, ensure_ascii=False)


 def check_fal_api_key() -> bool:
    """
    Check if the FAL.ai API key is available in environment variables.
-    
+
    Returns:
        bool: True if API key is set, False otherwise
    """
@ -406,7 +392,7 @@ def check_fal_api_key() -> bool:
 def check_image_generation_requirements() -> bool:
    """
    Check if all requirements for image generation tools are met.
-    
+
    Returns:
        bool: True if requirements are met, False otherwise
    """
@ -414,19 +400,20 @@ def check_image_generation_requirements() -> bool:
        # Check API key
        if not check_fal_api_key():
            return False
-        
+
        # Check if fal_client is available
        import fal_client
+
        return True
-        
+
    except ImportError:
        return False


-def get_debug_session_info() -> Dict[str, Any]:
+def get_debug_session_info() -> dict[str, Any]:
    """
    Get information about the current debug session.
-    
+
    Returns:
        Dict[str, Any]: Dictionary containing debug session information
    """
@ -439,10 +426,10 @@ if __name__ == "__main__":
    """
    print("🎨 Image Generation Tools Module - FLUX 2 Pro + Auto Upscaling")
    print("=" * 60)
-    
+
    # Check if API key is available
    api_available = check_fal_api_key()
-    
+
    if not api_available:
        print("❌ FAL_KEY environment variable not set")
        print("Please set your API key: export FAL_KEY='your-key-here'")
@ -450,27 +437,28 @@ if __name__ == "__main__":
        exit(1)
    else:
        print("✅ FAL.ai API key found")
-    
+
    # Check if fal_client is available
    try:
        import fal_client
+
        print("✅ fal_client library available")
    except ImportError:
        print("❌ fal_client library not found")
        print("Please install: pip install fal-client")
        exit(1)
-    
+
    print("🛠️ Image generation tools ready for use!")
    print(f"🤖 Using model: {DEFAULT_MODEL}")
    print(f"🔍 Auto-upscaling with: {UPSCALER_MODEL} ({UPSCALER_FACTOR}x)")
-    
+
    # Show debug mode status
    if _debug.active:
        print(f"🐛 Debug mode ENABLED - Session ID: {_debug.session_id}")
        print(f"   Debug logs will be saved to: ./logs/image_tools_debug_{_debug.session_id}.json")
    else:
        print("🐛 Debug mode disabled (set IMAGE_TOOLS_DEBUG=true to enable)")
-    
+
    print("\nBasic usage:")
    print("  from image_generation_tool import image_generate_tool")
    print("  import asyncio")
@ -484,23 +472,23 @@ if __name__ == "__main__":
    print("      )")
    print("      print(result)")
    print("  asyncio.run(main())")
-    
+
    print("\nSupported image sizes:")
    for size in VALID_IMAGE_SIZES:
        print(f"  - {size}")
    print("  - Custom: {'width': 512, 'height': 768} (if needed)")
-    
+
    print("\nAcceleration modes:")
    for mode in VALID_ACCELERATION_MODES:
        print(f"  - {mode}")
-    
+
    print("\nExample prompts:")
    print("  - 'A candid street photo of a woman with a pink bob and bold eyeliner'")
    print("  - 'Modern architecture building with glass facade, sunset lighting'")
    print("  - 'Abstract art with vibrant colors and geometric patterns'")
    print("  - 'Portrait of a wise old owl perched on ancient tree branch'")
    print("  - 'Futuristic cityscape with flying cars and neon lights'")
-    
+
    print("\nDebug mode:")
    print("  # Enable debug logging")
    print("  export IMAGE_TOOLS_DEBUG=true")
@ -521,17 +509,17 @@ IMAGE_GENERATE_SCHEMA = {
        "properties": {
            "prompt": {
                "type": "string",
-                "description": "The text prompt describing the desired image. Be detailed and descriptive."
+                "description": "The text prompt describing the desired image. Be detailed and descriptive.",
            },
            "aspect_ratio": {
                "type": "string",
                "enum": ["landscape", "square", "portrait"],
                "description": "The aspect ratio of the generated image. 'landscape' is 16:9 wide, 'portrait' is 16:9 tall, 'square' is 1:1.",
-                "default": "landscape"
-            }
+                "default": "landscape",
+            },
        },
-        "required": ["prompt"]
-    }
+        "required": ["prompt"],
+    },
 }