# Hugging Face Space: MCP-1st-Birthday/learnbee_mcp (status: Running; file size: 3,991 bytes; commit 3b2a4e6)

"""Image generation module using Hugging Face Inference API."""

import os
import re
from io import BytesIO
from typing import Optional

from dotenv import load_dotenv
from huggingface_hub import InferenceClient

load_dotenv()


class ImageGenerator:
    """Generate child-friendly images using the Hugging Face Inference API.

    The class wraps an ``InferenceClient`` and offers two public operations:
    turning a text prompt into PNG bytes (``generate_image``) and a simple
    keyword heuristic that spots image requests in English or Spanish chat
    messages (``detect_image_request``).
    """

    # Style modifiers appended to every prompt, in this order.
    _STYLE_ENHANCEMENTS = (
        "child-friendly",
        "colorful",
        "educational illustration",
        "cartoon style",
        "bright and cheerful",
    )

    # Phrases (English and Spanish) that indicate an image request.
    # They are tried in this order; the first one found wins.
    _IMAGE_KEYWORDS = (
        "show me", "muéstrame", "muestra",
        "draw", "dibuja", "dibujar",
        "picture of", "imagen de", "foto de",
        "what does", "cómo es", "como es",
        "i want to see", "quiero ver",
        "can you show", "puedes mostrar",
    )

    # One pattern per keyword, anchored so the keyword only matches as a whole
    # word/phrase: "draw" must not fire inside "drawer", and "dibuja" must not
    # fire inside "dibujar". ``\w`` is Unicode-aware for str patterns, so
    # accented letters count as word characters.
    _KEYWORD_PATTERNS = tuple(
        re.compile(rf"(?<!\w){re.escape(keyword)}(?!\w)")
        for keyword in _IMAGE_KEYWORDS
    )

    # Articles dropped from the extracted subject (whole words only).
    _ARTICLES = frozenset({"a", "an", "the", "un", "una", "el", "la"})

    def __init__(self, model: str = "black-forest-labs/FLUX.1-schnell"):
        """
        Initialize the image generator.

        Args:
            model: Hugging Face model ID for image generation

        Raises:
            ValueError: If the HF_TOKEN environment variable is missing or empty
        """
        api_token = os.getenv("HF_TOKEN")
        if not api_token:
            raise ValueError("HF_TOKEN not found in environment variables")

        self.api_token = api_token
        self.model = model

        # Initialize Hugging Face Inference Client
        self.client = InferenceClient(token=self.api_token)

    def generate_image(self, prompt: str) -> Optional[bytes]:
        """
        Generate an image from a text prompt.

        The prompt is first extended with the child-friendly style modifiers,
        then sent to the configured model. Any failure is reported on stdout
        and turned into a ``None`` result instead of propagating.

        Args:
            prompt: Text description of the image to generate

        Returns:
            PNG-encoded image bytes if successful, None otherwise (including
            when the prompt is empty or whitespace-only)
        """
        # A blank prompt would reach the API as style modifiers only, producing
        # an arbitrary image; treat it as "nothing to generate".
        if not prompt or not prompt.strip():
            return None

        # Enhance prompt for child-friendly, educational content
        enhanced_prompt = self._enhance_prompt_for_children(prompt)

        try:
            # Use the text_to_image method from InferenceClient
            image = self.client.text_to_image(
                enhanced_prompt,
                model=self.model,
            )

            # Convert PIL Image to bytes
            buffer = BytesIO()
            image.save(buffer, format="PNG")
            return buffer.getvalue()

        except Exception as e:
            # Best-effort boundary: callers rely on None rather than an exception.
            print(f"Error generating image: {e}")
            return None

    def _enhance_prompt_for_children(self, prompt: str) -> str:
        """
        Enhance the prompt to ensure child-friendly, educational images.

        Args:
            prompt: Original prompt

        Returns:
            The original prompt followed by the comma-separated style modifiers
        """
        return f"{prompt}, {', '.join(self._STYLE_ENHANCEMENTS)}"

    def detect_image_request(self, message: str) -> Optional[str]:
        """
        Detect if a message contains an image request and extract the subject.

        Matching is case-insensitive and works on whole words: the first
        keyword (in list order) that appears in the message is removed, the
        articles a/an/the/un/una/el/la are dropped, and the remaining words
        are returned joined by single spaces. This is a heuristic; words that
        surround the keyword (e.g. "please") stay in the result.

        Args:
            message: User's message

        Returns:
            Lower-cased subject to generate an image for, or None if no
            request is detected or nothing remains after removing the keyword
            and articles
        """
        if not message:
            return None

        message_lower = message.lower()

        for pattern in self._KEYWORD_PATTERNS:
            if not pattern.search(message_lower):
                continue

            # Replace the keyword with a space so neighbouring words never fuse.
            remainder = pattern.sub(" ", message_lower)

            # Filter articles token by token; substring replacement would eat
            # the tail of words such as "banana " or "ballena ".
            words = [
                word for word in remainder.split()
                if word not in self._ARTICLES
            ]
            if words:
                return " ".join(words)

        return None