Spaces:
Runtime error
Runtime error
| import torch | |
| from transformers import Pix2StructForConditionalGeneration, Pix2StructProcessor | |
| import gradio as gr | |
| from PIL import Image | |
| # Load model and processor | |
| model_name = "google/pix2struct-docvqa-large" | |
| model = Pix2StructForConditionalGeneration.from_pretrained(model_name) | |
| processor = Pix2StructProcessor.from_pretrained(model_name) | |
| def process_image(image_path): | |
| try: | |
| # Load the image | |
| image = Image.open(image_path).convert("RGB") | |
| # Prepare the input | |
| inputs = processor(images=image, text="What does this image say?", return_tensors="pt") | |
| # Generate prediction | |
| output = model.generate(**inputs) | |
| # Decode the output | |
| solution = processor.decode(output[0], skip_special_tokens=True) | |
| return solution | |
| except Exception as e: | |
| return f"Error processing image: {str(e)}" | |
| def predict(image): | |
| """Handles image input for Gradio.""" | |
| return process_image(image) | |
| # Gradio app | |
| iface = gr.Interface( | |
| fn=predict, | |
| inputs=gr.Image(type="filepath"), | |
| outputs="text", | |
| title="Image Text Solution" | |
| ) | |
| if __name__ == "__main__": | |
| iface.launch() | |