# Spaces status when this file was captured: Runtime error
from typing import Optional

import gradio as gr
import numpy as np
from PIL import Image
from transformers import TrOCRProcessor, VisionEncoderDecoderModel, pipeline
# Checkpoint name shared by the OCR processor and the OCR model.
OCR_CHECKPOINT = "microsoft/trocr-base-stage1"

# OCR: the processor turns images into pixel tensors and decodes generated
# ids back to text; the model produces those ids.
processor = TrOCRProcessor.from_pretrained(OCR_CHECKPOINT)
model = VisionEncoderDecoderModel.from_pretrained(OCR_CHECKPOINT)

# LLM: text-generation pipeline used to continue the OCR output.
llm = pipeline(task="text-generation", model="distilgpt2")
def process_image(image: Optional[np.ndarray]) -> str:
    """Run OCR on an image and continue the recognised text with the LLM.

    Args:
        image: Image as a NumPy array (the UI input is declared as
            ``gr.Image(type="numpy")``), or ``None`` when no image was
            supplied.

    Returns:
        A report containing the OCR text followed by the LLM continuation,
        or a short notice when there is no image to process.
    """
    # Guard: without this, Image.fromarray() raises on a missing/empty image.
    if image is None or image.size == 0:
        return "No image provided. Please upload an image to run OCR."

    # Normalise to 3-channel RGB so grayscale / RGBA arrays passed by
    # non-UI callers are handled the same way as colour uploads.
    pil_image = Image.fromarray(image).convert("RGB")

    # Image -> pixel tensor -> generated token ids -> decoded text.
    pixel_values = processor(images=pil_image, return_tensors="pt").pixel_values
    generated_ids = model.generate(pixel_values)
    text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]

    # The pipeline returns a list of dicts; take the first candidate's text.
    llm_output = llm(text, max_length=100, do_sample=True)[0]["generated_text"]

    return f"OCR Text:\n{text}\n\nLLM Response:\n{llm_output}"
# Web UI: a single image input wired to process_image, with text output.
demo = gr.Interface(
    fn=process_image,
    inputs=gr.Image(type="numpy"),
    outputs="text",
    title="OCR + LLM Text Generator",
)

# Start the app server.
demo.launch()