Spaces:

IAMTFRMZA
/

documentaitestv2

Sleeping

App Files Community

IAMTFRMZA committed 17 days ago

Commit

d6d49d6

verified ·

1 Parent(s): 4a071d5

Update app.py

Browse files

Files changed (1) hide show

app.py +11 -9

app.py CHANGED Viewed

@@ -1,7 +1,6 @@
 import gradio as gr
 import os
 import uuid
-import threading
 from openai import OpenAI
 from realtime_transcriber import WebSocketClient, connections, WEBSOCKET_URI, WEBSOCKET_HEADERS
@@ -15,12 +14,14 @@ client = OpenAI(api_key=OPENAI_API_KEY)
 session_id = str(uuid.uuid4())
 if session_id not in connections:
     connections[session_id] = WebSocketClient(WEBSOCKET_URI, WEBSOCKET_HEADERS, session_id)
     threading.Thread(target=connections[session_id].run, daemon=True).start()
 # Functions for Document Assistant
 def process_user_input(message, history):
     if not message:
         return "Please enter a message.", history
     try:
         thread = client.beta.threads.create()
         client.beta.threads.messages.create(
@@ -44,7 +45,7 @@ def process_user_input(message, history):
         history.append((message, assistant_reply))
         return "", history
     except Exception as e:
-        return f"\u274c Error: {str(e)}", history
 # Functions for Realtime Voice Transcription
 def send_audio_chunk_realtime(mic_chunk):
@@ -61,23 +62,23 @@ def clear_transcript():
     return ""
 # Gradio UI Components
-doc_image = gr.Image(label="\ud83d\udcd8 Extracted Document Image", show_label=True, elem_id="docimg", height=480, width=340)
-chatbot = gr.Chatbot(label="\ud83e\udde0 Document Assistant", elem_id="chatbox", bubble_full_width=False, height=480)
 prompt = gr.Textbox(placeholder="Ask about the document...", label="Ask about the document")
 send_btn = gr.Button("Send")
 # Voice Section
-audio_in = gr.Audio(label="\ud83c\udfb5 Audio", type="numpy", streaming=True)
 live_transcript = gr.Textbox(label="Live Transcript", lines=6)
 clear_btn = gr.Button("Clear Transcript")
 with gr.Blocks(theme=gr.themes.Base(), css="""
     #docimg img { object-fit: contain !important; }
-    #chatbox { border-radius: 10px; }
     .gr-box { border-radius: 12px; }
 """) as demo:
-    gr.Markdown("# \ud83e\uddd0 Document AI + \ud83c\udfa7 Voice Assistant")
     with gr.Row():
         with gr.Column(scale=1):
             doc_image.render()
@@ -90,7 +91,7 @@ with gr.Blocks(theme=gr.themes.Base(), css="""
     send_btn.click(fn=process_user_input, inputs=[prompt, chatbot], outputs=[prompt, chatbot])
-    with gr.Accordion("\ud83c\udf99\ufe0f Or Use Voice Instead", open=False):
         live_transcript.render()
         with gr.Row():
             audio_in.render()
@@ -98,4 +99,5 @@ with gr.Blocks(theme=gr.themes.Base(), css="""
         audio_in.stream(fn=send_audio_chunk_realtime, inputs=audio_in, outputs=live_transcript)
         clear_btn.click(fn=clear_transcript, outputs=live_transcript)
-demo.launch()

 import gradio as gr
 import os
 import uuid
 from openai import OpenAI
 from realtime_transcriber import WebSocketClient, connections, WEBSOCKET_URI, WEBSOCKET_HEADERS
 session_id = str(uuid.uuid4())
 if session_id not in connections:
     connections[session_id] = WebSocketClient(WEBSOCKET_URI, WEBSOCKET_HEADERS, session_id)
+    import threading
     threading.Thread(target=connections[session_id].run, daemon=True).start()
 # Functions for Document Assistant
 def process_user_input(message, history):
     if not message:
         return "Please enter a message.", history
     try:
         thread = client.beta.threads.create()
         client.beta.threads.messages.create(
         history.append((message, assistant_reply))
         return "", history
     except Exception as e:
+        return f"❌ Error: {str(e)}", history
 # Functions for Realtime Voice Transcription
 def send_audio_chunk_realtime(mic_chunk):
     return ""
 # Gradio UI Components
+doc_image = gr.Image(label="📘 Extracted Document Image", show_label=True, elem_id="docimg", height=500, width=360)
+chatbot = gr.Chatbot(label="🧠 Document Assistant", elem_id="chatbox", bubble_full_width=False)
 prompt = gr.Textbox(placeholder="Ask about the document...", label="Ask about the document")
 send_btn = gr.Button("Send")
 # Voice Section
+audio_in = gr.Audio(label="🎵 Audio", type="numpy", streaming=True)
 live_transcript = gr.Textbox(label="Live Transcript", lines=6)
 clear_btn = gr.Button("Clear Transcript")
 with gr.Blocks(theme=gr.themes.Base(), css="""
     #docimg img { object-fit: contain !important; }
+    #chatbox { height: 500px; }
     .gr-box { border-radius: 12px; }
 """) as demo:
+    gr.Markdown("# 🧠 Document AI + 🎙️ Voice Assistant")
     with gr.Row():
         with gr.Column(scale=1):
             doc_image.render()
     send_btn.click(fn=process_user_input, inputs=[prompt, chatbot], outputs=[prompt, chatbot])
+    with gr.Accordion("🎙️ Or Use Voice Instead", open=False):
         live_transcript.render()
         with gr.Row():
             audio_in.render()
         audio_in.stream(fn=send_audio_chunk_realtime, inputs=audio_in, outputs=live_transcript)
         clear_btn.click(fn=clear_transcript, outputs=live_transcript)
+# LAUNCH WITH SHARE ENABLED FOR PUBLIC URL
+demo.launch(share=True)