File size: 2,618 Bytes
4ef4a96
 
 
 
89ed063
 
4ef4a96
 
 
 
89ed063
 
4ef4a96
 
 
89ed063
 
 
 
4ef4a96
89ed063
4ef4a96
 
 
89ed063
4ef4a96
 
 
 
 
89ed063
4ef4a96
 
 
 
 
 
 
89ed063
 
a509a74
 
 
 
 
 
4ef4a96
 
 
 
 
 
89ed063
4ef4a96
 
 
89ed063
 
4ef4a96
 
 
 
89ed063
a509a74
4ef4a96
 
f3600a5
4ef4a96
f3600a5
4ef4a96
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
import gradio as gr
import requests
import os
from openai import OpenAI
from io import BytesIO


# API key for all Upstage services (Document OCR and Solar LLM); read from the
# environment so the key is never committed to source control.
UPSTAGE_API_KEY = os.getenv("UPSTAGE_API_KEY")


def extract_text_from_image(image):
    """Extract text from a letter image via the Upstage Document OCR API.

    Args:
        image: A PIL.Image instance (Gradio supplies this with type="pil").

    Returns:
        The OCR'd text with surrounding whitespace stripped on success, or a
        Korean error-message string containing the HTTP status and response
        body on failure.
    """
    url = "https://api.upstage.ai/v1/document-digitization"

    headers = {'Authorization': f'Bearer {UPSTAGE_API_KEY}'}

    # Serialize the PIL image into an in-memory JPEG for the multipart upload.
    buffer = BytesIO()
    image.save(buffer, format="JPEG")
    buffer.seek(0)

    files = {"document": ("image.jpg", buffer, "image/jpeg")}
    data = {"model": "ocr"}

    # A timeout keeps a stalled API call from hanging the Gradio worker forever.
    response = requests.post(url, headers=headers, files=files, data=data, timeout=60)

    if response.status_code == 200:
        text = response.json().get("text", "")
        return text.strip()
    else:
        return f"OCR ์‹คํŒจ: {response.status_code} - {response.text}"

        
def translate_text_with_solar(english_text):
    """Translate English letter text into Korean using the Upstage Solar LLM.

    Args:
        english_text: The English text extracted by OCR (may be an error
            message string if OCR failed; the model will receive it as-is).

    Returns:
        The Korean translation produced by the model, as a string.
    """
    # The Upstage API is OpenAI-compatible, so the OpenAI client is pointed at
    # the Upstage base URL. Constructing the client per call keeps this
    # function self-contained and stateless.
    client = OpenAI(
        api_key=UPSTAGE_API_KEY,
        base_url="https://api.upstage.ai/v1"
    )

    prompt = f"""
    ๋‹ค์Œ์€ ์˜์–ด ์†๊ธ€์”จ ํŽธ์ง€ ๋‚ด์šฉ์ž…๋‹ˆ๋‹ค.\n
    {english_text} \n
    ์˜์–ด๋ฅผ ํ•œ๊ตญ์–ด๋กœ ๋ฒˆ์—ญํ•ด์ฃผ์„ธ์š”.\n\n  
    ํ•œ๊ตญ์–ด๋กœ ๋ณ€์—ญ๋œ ํŽธ์ง€ ๋‚ด์šฉ: "
    """
    # Moderate temperature: faithful translation with a little fluency leeway.
    response = client.chat.completions.create(
        model="solar-pro",
        messages=[{"role": "user", "content": prompt}],
        temperature=0.5,
        max_tokens=1024
    )
    return response.choices[0].message.content

# Gradio UI: image upload on the left, OCR text / translate button / Korean
# result on the right.
with gr.Blocks(title="๐Ÿ’Œ ์†๊ธ€์”จ ํŽธ์ง€ ๋ฒˆ์—ญ๊ธฐ") as demo:
    gr.Markdown("๐Ÿ’Œ ์†๊ธ€์”จ ํŽธ์ง€ ๋ฒˆ์—ญ๊ธฐ")
    gr.Markdown("ํŽธ์ง€ ์ด๋ฏธ์ง€๋ฅผ ์—…๋กœ๋“œํ•˜๋ฉด Upstage Document OCR์ด ์˜์–ด ํ…์ŠคํŠธ๋ฅผ ์ถ”์ถœํ•˜๊ณ ,\n๐ŸŒ ๋ฒˆ์—ญํ•˜๊ธฐ ๋ฒ„ํŠผ์„ ๋ˆ„๋ฅด๋ฉด Solar LLM์„ ํ˜ธ์ถœํ•˜์—ฌ ํ•œ๊ตญ์–ด๋กœ ๋ฒˆ์—ญํ•ฉ๋‹ˆ๋‹ค!")

    with gr.Row():
        # Left column: image upload (PIL so extract_text_from_image can .save()).
        with gr.Column(scale=1):
            image_input = gr.Image(type="pil", label=" ๐Ÿ’Œ ํŽธ์ง€ ์ด๋ฏธ์ง€ ์—…๋กœ๋“œ")

        # Right column: extracted English, translate trigger, Korean result.
        with gr.Column(scale=2):
            english_box = gr.Textbox(label="๐Ÿ“ ์ถ”์ถœ๋œ ์˜์–ด ํ…์ŠคํŠธ", lines=10)
            translate_button = gr.Button("๐ŸŒ ๋ฒˆ์—ญํ•˜๊ธฐ")
            korean_box = gr.Textbox(label="๐Ÿ‡ฐ๐Ÿ‡ท ๋ฒˆ์—ญ๋œ ํ•œ๊ตญ์–ด ํ…์ŠคํŠธ", lines=10)

    # Step 1: run OCR automatically whenever the uploaded image changes.
    image_input.change(fn=extract_text_from_image, inputs=image_input, outputs=english_box)

    # Step 2: translate only on explicit button click (LLM calls cost money).
    translate_button.click(fn=translate_text_with_solar, inputs=english_box, outputs=korean_box)

if __name__ == "__main__":
    demo.launch()