Spaces:

Nayera-2025
/

Police-Vision-Translator

Sleeping

App Files Files Community

Nayera-2025 committed 4 days ago

Commit

373f022

verified ·

1 Parent(s): 04b3f18

Update app.py

Browse files

Files changed (1) hide show

app.py +7 -7

app.py CHANGED Viewed

@@ -1,23 +1,23 @@
 import gradio as gr
 from paddleocr import PaddleOCR
 import numpy as np
-import openai
 import os
 from langdetect import detect
 # Initialize PaddleOCR
 ocr_reader = PaddleOCR(use_angle_cls=True, lang='en')
 # Initialize Whisper Model via Hugging Face Transformers
-from transformers import pipeline
 whisper_model = pipeline(
     task="automatic-speech-recognition",
     model="openai/whisper-small",
     device=0
 )
-# Set your OpenAI API Key (you should set this securely in your environment)
-openai.api_key = os.getenv("OPENAI_API_KEY")
 def detect_language(text):
     try:
@@ -31,7 +31,7 @@ def gpt_clean_and_translate(text, target_language):
         return "No text detected.", ""
     prompt = f"""
-You are an expert document reader and translator. You will receive a noisy extracted text from a government ID. Your tasks:
 1. Identify and extract these fields: Name, Address, Date of Birth, Expiry Date, Class, Sex.
 2. Output the information in full English sentences.
@@ -39,7 +39,7 @@ You are an expert document reader and translator. You will receive a noisy extra
 If the target language is English, just output clean English sentences.
 """
-    response = openai.ChatCompletion.create(
         model="gpt-4o",
         messages=[
             {"role": "system", "content": prompt},
@@ -48,7 +48,7 @@ If the target language is English, just output clean English sentences.
         temperature=0.2
     )
-    cleaned_translation = response["choices"][0]["message"]["content"].strip()
     return cleaned_translation
 def process_document(image, target_language, language_group):

 import gradio as gr
 from paddleocr import PaddleOCR
 import numpy as np
 import os
 from langdetect import detect
+from openai import OpenAI
+from transformers import pipeline
 # Initialize PaddleOCR
 ocr_reader = PaddleOCR(use_angle_cls=True, lang='en')
 # Initialize Whisper Model via Hugging Face Transformers
 whisper_model = pipeline(
     task="automatic-speech-recognition",
     model="openai/whisper-small",
     device=0
 )
+# Initialize OpenAI Client
+client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
 def detect_language(text):
     try:
         return "No text detected.", ""
     prompt = f"""
+You are an expert document reader and translator. You will receive noisy extracted text from a government ID. Your tasks:
 1. Identify and extract these fields: Name, Address, Date of Birth, Expiry Date, Class, Sex.
 2. Output the information in full English sentences.
 If the target language is English, just output clean English sentences.
 """
+    response = client.chat.completions.create(
         model="gpt-4o",
         messages=[
             {"role": "system", "content": prompt},
         temperature=0.2
     )
+    cleaned_translation = response.choices[0].message.content.strip()
     return cleaned_translation
 def process_document(image, target_language, language_group):