| | import os |
| | import io |
| | import uuid |
| | import base64 |
| | import numpy as np |
| | from PIL import Image |
| | from langchain_core.tools import tool |
| | from typing import List, Dict, Any, Optional |
| | from PIL import Image, ImageDraw, ImageFont, ImageEnhance, ImageFilter |
| |
|
| | |
| | def encode_image(image_path: str) -> str: |
| | """Convert an image file to base64 string.""" |
| | with open(image_path, "rb") as image_file: |
| | return base64.b64encode(image_file.read()).decode("utf-8") |
| |
|
| |
|
| | def decode_image(base64_string: str) -> Image.Image: |
| | """Convert a base64 string to a PIL Image.""" |
| | image_data = base64.b64decode(base64_string) |
| | return Image.open(io.BytesIO(image_data)) |
| |
|
| |
|
| | def save_image(image: Image.Image, directory: str = "image_outputs") -> str: |
| | """Save a PIL Image to disk and return the path.""" |
| | os.makedirs(directory, exist_ok=True) |
| | image_id = str(uuid.uuid4()) |
| | image_path = os.path.join(directory, f"{image_id}.png") |
| | image.save(image_path) |
| | return image_path |
| |
|
| |
|
| | @tool |
| | def analyze_image(image_base64: str) -> Dict[str, Any]: |
| | """ |
| | Analyze basic properties of an image (size, mode, color analysis, thumbnail preview). |
| | Args: |
| | image_base64 (str): Base64 encoded image string |
| | Returns: |
| | Dictionary with analysis result |
| | """ |
| | try: |
| | img = decode_image(image_base64) |
| | width, height = img.size |
| | mode = img.mode |
| |
|
| | if mode in ("RGB", "RGBA"): |
| | arr = np.array(img) |
| | avg_colors = arr.mean(axis=(0, 1)) |
| | dominant = ["Red", "Green", "Blue"][np.argmax(avg_colors[:3])] |
| | brightness = avg_colors.mean() |
| | color_analysis = { |
| | "average_rgb": avg_colors.tolist(), |
| | "brightness": brightness, |
| | "dominant_color": dominant, |
| | } |
| | else: |
| | color_analysis = {"note": f"No color analysis for mode {mode}"} |
| |
|
| | thumbnail = img.copy() |
| | thumbnail.thumbnail((100, 100)) |
| | thumb_path = save_image(thumbnail, "thumbnails") |
| | thumbnail_base64 = encode_image(thumb_path) |
| |
|
| | return { |
| | "dimensions": (width, height), |
| | "mode": mode, |
| | "color_analysis": color_analysis, |
| | "thumbnail": thumbnail_base64, |
| | } |
| | except Exception as e: |
| | return {"error": str(e)} |
| |
|
| |
|
| | @tool |
| | def transform_image( |
| | image_base64: str, operation: str, params: Optional[Dict[str, Any]] = None |
| | ) -> Dict[str, Any]: |
| | """ |
| | Apply transformations: resize, rotate, crop, flip, brightness, contrast, blur, sharpen, grayscale. |
| | Args: |
| | image_base64 (str): Base64 encoded input image |
| | operation (str): Transformation operation |
| | params (Dict[str, Any], optional): Parameters for the operation |
| | Returns: |
| | Dictionary with transformed image (base64) |
| | """ |
| | try: |
| | img = decode_image(image_base64) |
| | params = params or {} |
| |
|
| | if operation == "resize": |
| | img = img.resize( |
| | ( |
| | params.get("width", img.width // 2), |
| | params.get("height", img.height // 2), |
| | ) |
| | ) |
| | elif operation == "rotate": |
| | img = img.rotate(params.get("angle", 90), expand=True) |
| | elif operation == "crop": |
| | img = img.crop( |
| | ( |
| | params.get("left", 0), |
| | params.get("top", 0), |
| | params.get("right", img.width), |
| | params.get("bottom", img.height), |
| | ) |
| | ) |
| | elif operation == "flip": |
| | if params.get("direction", "horizontal") == "horizontal": |
| | img = img.transpose(Image.FLIP_LEFT_RIGHT) |
| | else: |
| | img = img.transpose(Image.FLIP_TOP_BOTTOM) |
| | elif operation == "adjust_brightness": |
| | img = ImageEnhance.Brightness(img).enhance(params.get("factor", 1.5)) |
| | elif operation == "adjust_contrast": |
| | img = ImageEnhance.Contrast(img).enhance(params.get("factor", 1.5)) |
| | elif operation == "blur": |
| | img = img.filter(ImageFilter.GaussianBlur(params.get("radius", 2))) |
| | elif operation == "sharpen": |
| | img = img.filter(ImageFilter.SHARPEN) |
| | elif operation == "grayscale": |
| | img = img.convert("L") |
| | else: |
| | return {"error": f"Unknown operation: {operation}"} |
| |
|
| | result_path = save_image(img) |
| | result_base64 = encode_image(result_path) |
| | return {"transformed_image": result_base64} |
| |
|
| | except Exception as e: |
| | return {"error": str(e)} |
| |
|
| |
|
| | @tool |
| | def draw_on_image( |
| | image_base64: str, drawing_type: str, params: Dict[str, Any] |
| | ) -> Dict[str, Any]: |
| | """ |
| | Draw shapes (rectangle, circle, line) or text onto an image. |
| | Args: |
| | image_base64 (str): Base64 encoded input image |
| | drawing_type (str): Drawing type |
| | params (Dict[str, Any]): Drawing parameters |
| | Returns: |
| | Dictionary with result image (base64) |
| | """ |
| | try: |
| | img = decode_image(image_base64) |
| | draw = ImageDraw.Draw(img) |
| | color = params.get("color", "red") |
| |
|
| | if drawing_type == "rectangle": |
| | draw.rectangle( |
| | [params["left"], params["top"], params["right"], params["bottom"]], |
| | outline=color, |
| | width=params.get("width", 2), |
| | ) |
| | elif drawing_type == "circle": |
| | x, y, r = params["x"], params["y"], params["radius"] |
| | draw.ellipse( |
| | (x - r, y - r, x + r, y + r), |
| | outline=color, |
| | width=params.get("width", 2), |
| | ) |
| | elif drawing_type == "line": |
| | draw.line( |
| | ( |
| | params["start_x"], |
| | params["start_y"], |
| | params["end_x"], |
| | params["end_y"], |
| | ), |
| | fill=color, |
| | width=params.get("width", 2), |
| | ) |
| | elif drawing_type == "text": |
| | font_size = params.get("font_size", 20) |
| | try: |
| | font = ImageFont.truetype("arial.ttf", font_size) |
| | except IOError: |
| | font = ImageFont.load_default() |
| | draw.text( |
| | (params["x"], params["y"]), |
| | params.get("text", "Text"), |
| | fill=color, |
| | font=font, |
| | ) |
| | else: |
| | return {"error": f"Unknown drawing type: {drawing_type}"} |
| |
|
| | result_path = save_image(img) |
| | result_base64 = encode_image(result_path) |
| | return {"result_image": result_base64} |
| |
|
| | except Exception as e: |
| | return {"error": str(e)} |
| |
|
| |
|
| | @tool |
| | def generate_simple_image( |
| | image_type: str, |
| | width: int = 500, |
| | height: int = 500, |
| | params: Optional[Dict[str, Any]] = None, |
| | ) -> Dict[str, Any]: |
| | """ |
| | Generate a simple image (gradient, noise, pattern, chart). |
| | Args: |
| | image_type (str): Type of image |
| | width (int), height (int) |
| | params (Dict[str, Any], optional): Specific parameters |
| | Returns: |
| | Dictionary with generated image (base64) |
| | """ |
| | try: |
| | params = params or {} |
| |
|
| | if image_type == "gradient": |
| | direction = params.get("direction", "horizontal") |
| | start_color = params.get("start_color", (255, 0, 0)) |
| | end_color = params.get("end_color", (0, 0, 255)) |
| |
|
| | img = Image.new("RGB", (width, height)) |
| | draw = ImageDraw.Draw(img) |
| |
|
| | if direction == "horizontal": |
| | for x in range(width): |
| | r = int( |
| | start_color[0] + (end_color[0] - start_color[0]) * x / width |
| | ) |
| | g = int( |
| | start_color[1] + (end_color[1] - start_color[1]) * x / width |
| | ) |
| | b = int( |
| | start_color[2] + (end_color[2] - start_color[2]) * x / width |
| | ) |
| | draw.line([(x, 0), (x, height)], fill=(r, g, b)) |
| | else: |
| | for y in range(height): |
| | r = int( |
| | start_color[0] + (end_color[0] - start_color[0]) * y / height |
| | ) |
| | g = int( |
| | start_color[1] + (end_color[1] - start_color[1]) * y / height |
| | ) |
| | b = int( |
| | start_color[2] + (end_color[2] - start_color[2]) * y / height |
| | ) |
| | draw.line([(0, y), (width, y)], fill=(r, g, b)) |
| |
|
| | elif image_type == "noise": |
| | noise_array = np.random.randint(0, 256, (height, width, 3), dtype=np.uint8) |
| | img = Image.fromarray(noise_array, "RGB") |
| |
|
| | else: |
| | return {"error": f"Unsupported image_type {image_type}"} |
| |
|
| | result_path = save_image(img) |
| | result_base64 = encode_image(result_path) |
| | return {"generated_image": result_base64} |
| |
|
| | except Exception as e: |
| | return {"error": str(e)} |
| |
|
| |
|
| | @tool |
| | def combine_images( |
| | images_base64: List[str], operation: str, params: Optional[Dict[str, Any]] = None |
| | ) -> Dict[str, Any]: |
| | """ |
| | Combine multiple images (collage, stack, blend). |
| | Args: |
| | images_base64 (List[str]): List of base64 images |
| | operation (str): Combination type |
| | params (Dict[str, Any], optional) |
| | Returns: |
| | Dictionary with combined image (base64) |
| | """ |
| | try: |
| | images = [decode_image(b64) for b64 in images_base64] |
| | params = params or {} |
| |
|
| | if operation == "stack": |
| | direction = params.get("direction", "horizontal") |
| | if direction == "horizontal": |
| | total_width = sum(img.width for img in images) |
| | max_height = max(img.height for img in images) |
| | new_img = Image.new("RGB", (total_width, max_height)) |
| | x = 0 |
| | for img in images: |
| | new_img.paste(img, (x, 0)) |
| | x += img.width |
| | else: |
| | max_width = max(img.width for img in images) |
| | total_height = sum(img.height for img in images) |
| | new_img = Image.new("RGB", (max_width, total_height)) |
| | y = 0 |
| | for img in images: |
| | new_img.paste(img, (0, y)) |
| | y += img.height |
| | else: |
| | return {"error": f"Unsupported combination operation {operation}"} |
| |
|
| | result_path = save_image(new_img) |
| | result_base64 = encode_image(result_path) |
| | return {"combined_image": result_base64} |
| |
|
| | except Exception as e: |
| | return {"error": str(e)} |
| |
|