Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -1,36 +1,107 @@
|
|
1 |
-
import os
|
2 |
-
import gradio as gr
|
3 |
-
from ultralytics import YOLO
|
4 |
import cv2
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5 |
|
6 |
# Load YOLOv8 model
|
7 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8 |
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
13 |
ret, frame = cap.read()
|
14 |
if not ret:
|
15 |
-
|
16 |
-
results = model(frame)
|
17 |
-
annotated_frame = results[0].plot()
|
18 |
-
_, buffer = cv2.imencode('.jpg', annotated_frame)
|
19 |
-
frames.append(buffer.tobytes())
|
20 |
-
cap.release()
|
21 |
-
return frames
|
22 |
|
23 |
-
|
24 |
-
|
25 |
-
|
26 |
-
gr.Markdown("This app detects objects in real-time using your webcam.")
|
27 |
|
28 |
-
|
29 |
-
video_input = gr.Video(label="Webcam Stream", type="filepath")
|
30 |
-
output_gallery = gr.Video(label="Detection Output")
|
31 |
|
32 |
-
|
33 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
34 |
|
35 |
-
|
36 |
-
demo.launch()
|
|
|
|
|
|
|
|
|
1 |
import os
import random
import threading
import time
from datetime import datetime, timedelta

import cv2
import gradio as gr
import pygame
from gtts import gTTS
from ultralytics import YOLO
|
10 |
+
|
11 |
+
# Initialize pygame mixer
|
12 |
+
pygame.mixer.quit()
|
13 |
+
pygame.mixer.init()
|
14 |
|
15 |
# Load YOLOv8 model
|
16 |
+
yolo = YOLO("yolov8n.pt")
|
17 |
+
|
18 |
+
# Audio alert settings
|
19 |
+
audio_temp_dir = "audio_temp_files"
|
20 |
+
alert_categories = {"person", "cat", "dog", "knife", "fire", "gun"}
|
21 |
+
last_alert_time = {}
|
22 |
+
alert_cooldown = timedelta(seconds=10)
|
23 |
+
|
24 |
+
# Create audio alert
|
25 |
+
def play_audio_alert(label, position):
|
26 |
+
phrases = [
|
27 |
+
f"Be careful, there's a {label} on your {position}.",
|
28 |
+
f"Watch out! {label} detected on your {position}.",
|
29 |
+
f"Alert! A {label} is on your {position}.",
|
30 |
+
]
|
31 |
+
caution_note = random.choice(phrases)
|
32 |
+
|
33 |
+
temp_file_path = f"{audio_temp_dir}/temp_{datetime.now().strftime('%Y%m%d_%H%M%S_%f')}.mp3"
|
34 |
+
tts = gTTS(caution_note)
|
35 |
+
tts.save(temp_file_path)
|
36 |
+
|
37 |
+
try:
|
38 |
+
pygame.mixer.music.load(temp_file_path)
|
39 |
+
pygame.mixer.music.play()
|
40 |
+
|
41 |
+
def cleanup_audio_file():
|
42 |
+
while pygame.mixer.music.get_busy():
|
43 |
+
time.sleep(0.1)
|
44 |
+
pygame.mixer.music.stop()
|
45 |
+
|
46 |
+
threading.Thread(target=cleanup_audio_file, daemon=True).start()
|
47 |
+
except Exception as e:
|
48 |
+
print(f"Error playing audio alert: {e}")
|
49 |
+
|
50 |
+
# Process a single frame
|
51 |
+
def process_frame(image, enable_audio):
|
52 |
+
results = yolo(image)
|
53 |
+
result = results[0]
|
54 |
|
55 |
+
detected_objects = {}
|
56 |
+
for box in result.boxes:
|
57 |
+
x1, y1, x2, y2 = map(int, box.xyxy[0])
|
58 |
+
label = result.names[int(box.cls[0])]
|
59 |
+
|
60 |
+
if enable_audio and label in alert_categories:
|
61 |
+
frame_center_x = image.shape[1] // 2
|
62 |
+
obj_center_x = (x1 + x2) // 2
|
63 |
+
position = "left" if obj_center_x < frame_center_x else "right"
|
64 |
+
|
65 |
+
detected_objects[label] = position
|
66 |
+
|
67 |
+
current_time = datetime.now()
|
68 |
+
if (
|
69 |
+
label not in last_alert_time
|
70 |
+
or current_time - last_alert_time[label] > alert_cooldown
|
71 |
+
):
|
72 |
+
play_audio_alert(label, position)
|
73 |
+
last_alert_time[label] = current_time
|
74 |
+
|
75 |
+
# Draw bounding boxes
|
76 |
+
cv2.rectangle(image, (x1, y1), (x2, y2), (0, 255, 0), 2)
|
77 |
+
cv2.putText(image, label, (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)
|
78 |
+
|
79 |
+
return image
|
80 |
+
|
81 |
+
# Gradio interface function
|
82 |
+
def object_detection_webcam(enable_audio):
|
83 |
+
cap = cv2.VideoCapture(0)
|
84 |
+
if not cap.isOpened():
|
85 |
+
return "Error: Unable to access the camera."
|
86 |
+
|
87 |
+
while True:
|
88 |
ret, frame = cap.read()
|
89 |
if not ret:
|
90 |
+
return "Error: Unable to read from camera."
|
|
|
|
|
|
|
|
|
|
|
|
|
91 |
|
92 |
+
frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
|
93 |
+
processed_frame = process_frame(frame, enable_audio)
|
94 |
+
yield processed_frame
|
|
|
95 |
|
96 |
+
cap.release()
|
|
|
|
|
97 |
|
98 |
+
# Create Gradio interface
|
99 |
+
def gradio_app():
|
100 |
+
return gr.Interface(
|
101 |
+
fn=object_detection_webcam,
|
102 |
+
inputs=[gr.Checkbox(label="Enable Audio Alerts", value=False)],
|
103 |
+
outputs="image",
|
104 |
+
live=True,
|
105 |
+
)
|
106 |
|
107 |
+
gradio_app().launch()
|
|