Nayera-2025 committed on
Commit
09cc49d
·
verified ·
1 Parent(s): 52e3b04

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +31 -19
app.py CHANGED
@@ -1,20 +1,20 @@
1
  import gradio as gr
2
  import easyocr
3
- import torch
4
  from transformers import pipeline
5
  import numpy as np
 
6
 
7
- # Load OCR model (English, Arabic, French, Chinese)
8
- reader = easyocr.Reader(['en', 'ar', 'fr', 'zh'])
9
 
10
- # Load YOLOv5 model (small model for faster performance)
11
- model = torch.hub.load('ultralytics/yolov5', 'yolov5s', pretrained=True)
12
 
13
- # Load translation model (multilingual to English)
14
- translator = pipeline("translation", model="Helsinki-NLP/opus-mt-mul-en")
15
 
16
  def process_image(image):
17
- # Convert PIL Image to numpy array if needed
18
  if not isinstance(image, np.ndarray):
19
  image = np.array(image)
20
 
@@ -23,29 +23,41 @@ def process_image(image):
23
  extracted_texts = [res[1] for res in text_results]
24
  extracted_text = " ".join(extracted_texts)
25
 
26
- # Step 2: Translate Text
27
  if extracted_text:
28
  translation = translator(extracted_text)[0]['translation_text']
29
  else:
30
  translation = "No text detected."
31
 
32
- # Step 3: Object Detection - Bounding Boxes
33
- results = model(image)
34
- detected_img = results.render()[0] # returns a list, take first image
 
35
 
36
- return detected_img, extracted_text, translation
 
 
 
 
 
 
 
 
 
37
 
38
- # Define Gradio Interface
 
 
39
  iface = gr.Interface(
40
  fn=process_image,
41
- inputs=gr.Image(type="pil", label="Upload Image (Signs, ID, License Plate)"),
42
  outputs=[
43
- gr.Image(label="Detected Objects in Image"),
44
  gr.Textbox(label="Extracted Text"),
45
- gr.Textbox(label="Translated Text to English")
46
  ],
47
- title="🚨 Police Smart Glasses AI Demo",
48
- description="Upload an image to simulate smart glasses detecting text, translating it, and recognizing objects."
49
  )
50
 
51
  if __name__ == "__main__":
 
import easyocr
import gradio as gr
import numpy as np
import torch
from PIL import Image, ImageDraw
from transformers import pipeline
6
 
7
# Detect hardware once: hard-coding gpu=True / device=0 raises on CPU-only
# hosts (transformers refuses device=0 without CUDA), so fall back gracefully.
_use_gpu = torch.cuda.is_available()
_device = 0 if _use_gpu else -1  # transformers convention: 0 = first GPU, -1 = CPU

# Load OCR reader (English, Arabic, French, Chinese).
reader = easyocr.Reader(['en', 'ar', 'fr', 'zh'], gpu=_use_gpu)

# Load translation model (many languages -> English).
translator = pipeline("translation", model="Helsinki-NLP/opus-mt-mul-en", device=_device)

# Load object-detection model (DETR).
detector = pipeline("object-detection", model="facebook/detr-resnet-50", device=_device)
 
16
def process_image(image):
    """Run OCR, translation, and object detection on an uploaded image.

    Args:
        image: PIL Image (from the Gradio input) or numpy array.

    Returns:
        Tuple of (annotated PIL image with detection boxes,
        extracted text string, English translation string).
    """
    # Normalize to a numpy array for easyocr.
    if not isinstance(image, np.ndarray):
        image = np.array(image)

    # Step 1: OCR — readtext yields (bbox, text, confidence) triples;
    # keep only the recognized text.
    text_results = reader.readtext(image)
    extracted_texts = [res[1] for res in text_results]
    extracted_text = " ".join(extracted_texts)

    # Step 2: Translation — skip the model call when nothing was recognized.
    if extracted_text:
        translation = translator(extracted_text)[0]['translation_text']
    else:
        translation = "No text detected."

    # Step 3: Object detection — convert once and reuse the same PIL image
    # for both inference and drawing (the original converted twice).
    image_draw = Image.fromarray(image).convert("RGB")
    detections = detector(image_draw)
    draw = ImageDraw.Draw(image_draw)

    for det in detections:
        box = det['box']
        label = det['label']
        score = det['score']
        if score > 0.5:  # only annotate confident detections
            draw.rectangle(
                [box['xmin'], box['ymin'], box['xmax'], box['ymax']],
                outline="red", width=3
            )
            # Clamp the caption's y so boxes touching the top edge still
            # get a visible (non-negative) label position.
            draw.text(
                (box['xmin'], max(0, box['ymin'] - 10)),
                f"{label} ({score:.2f})", fill="red"
            )

    return image_draw, extracted_text, translation
49
+
50
# Gradio Interface: wires process_image to one image input and three
# outputs (annotated image, raw OCR text, English translation).
iface = gr.Interface(
    fn=process_image,
    # type="pil" delivers a PIL Image; process_image converts it to numpy.
    inputs=gr.Image(type="pil", label="Upload an Image (e.g., Signs, IDs, License Plates)"),
    outputs=[
        gr.Image(label="Detected Objects"),
        gr.Textbox(label="Extracted Text"),
        gr.Textbox(label="Translated Text (English)")
    ],
    title="🚨 Police Smart Glasses - AI Demo (GPU Optimized)",
    description="Upload an image to simulate smart glasses detecting text, translating it, and recognizing objects in real-time."
)
62
 
63
  if __name__ == "__main__":