Spaces:

IAMTFRMZA
/

documentaitestv2

Sleeping

App Files Community

IAMTFRMZA committed on Apr 16

Commit

6b189d0

verified ·

1 Parent(s): 442d49c

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -9

app.py CHANGED Viewed

@@ -21,7 +21,6 @@ if session_id not in connections:
 def process_user_input(message, history):
     if not message:
         return "Please enter a message.", history
     try:
         thread = client.beta.threads.create()
         client.beta.threads.messages.create(
@@ -45,7 +44,7 @@ def process_user_input(message, history):
         history.append((message, assistant_reply))
         return "", history
     except Exception as e:
-        return f"❌ Error: {str(e)}", history
 # Functions for Realtime Voice Transcription
 def send_audio_chunk_realtime(mic_chunk):
@@ -62,13 +61,13 @@ def clear_transcript():
     return ""
 # Gradio UI Components
-doc_image = gr.Image(label="📘 Extracted Document Image", show_label=True, elem_id="docimg", height=500, width=360)
-chatbot = gr.Chatbot(label="🧠 Document Assistant", elem_id="chatbox", bubble_full_width=False)
 prompt = gr.Textbox(placeholder="Ask about the document...", label="Ask about the document")
 send_btn = gr.Button("Send")
 # Voice Section
-audio_in = gr.Audio(label="🎵 Audio", type="numpy", streaming=True)
 live_transcript = gr.Textbox(label="Live Transcript", lines=6)
 clear_btn = gr.Button("Clear Transcript")
@@ -78,7 +77,7 @@ with gr.Blocks(theme=gr.themes.Base(), css="""
     .gr-box { border-radius: 12px; }
 """) as demo:
-    gr.Markdown("# 🧠 Document AI + 🎙️ Voice Assistant")
     with gr.Row():
         with gr.Column(scale=1):
             doc_image.render()
@@ -91,7 +90,7 @@ with gr.Blocks(theme=gr.themes.Base(), css="""
     send_btn.click(fn=process_user_input, inputs=[prompt, chatbot], outputs=[prompt, chatbot])
-    with gr.Accordion("🎙️ Or Use Voice Instead", open=False):
         live_transcript.render()
         with gr.Row():
             audio_in.render()
@@ -99,5 +98,7 @@ with gr.Blocks(theme=gr.themes.Base(), css="""
         audio_in.stream(fn=send_audio_chunk_realtime, inputs=audio_in, outputs=live_transcript)
         clear_btn.click(fn=clear_transcript, outputs=live_transcript)
-if __name__ == "__main__":
-    demo.launch()

 def process_user_input(message, history):
     if not message:
         return "Please enter a message.", history
     try:
         thread = client.beta.threads.create()
         client.beta.threads.messages.create(
         history.append((message, assistant_reply))
         return "", history
     except Exception as e:
+        return f"\u274c Error: {str(e)}", history
 # Functions for Realtime Voice Transcription
 def send_audio_chunk_realtime(mic_chunk):
     return ""
 # Gradio UI Components
+doc_image = gr.Image(label="\ud83d\udcd8 Extracted Document Image", show_label=True, elem_id="docimg", height=500, width=280, type="filepath")
+chatbot = gr.Chatbot(label="\ud83e\udde0 Document Assistant", elem_id="chatbox", bubble_full_width=False)
 prompt = gr.Textbox(placeholder="Ask about the document...", label="Ask about the document")
 send_btn = gr.Button("Send")
 # Voice Section
+audio_in = gr.Audio(label="\ud83c\udfb5 Audio", type="numpy", streaming=True)
 live_transcript = gr.Textbox(label="Live Transcript", lines=6)
 clear_btn = gr.Button("Clear Transcript")
     .gr-box { border-radius: 12px; }
 """) as demo:
+    gr.Markdown("# \ud83e\udde0 Document AI + \ud83c\udf99\ufe0f Voice Assistant")
     with gr.Row():
         with gr.Column(scale=1):
             doc_image.render()
     send_btn.click(fn=process_user_input, inputs=[prompt, chatbot], outputs=[prompt, chatbot])
+    with gr.Accordion("\ud83c\udf99\ufe0f Or Use Voice Instead", open=False):
         live_transcript.render()
         with gr.Row():
             audio_in.render()
         audio_in.stream(fn=send_audio_chunk_realtime, inputs=audio_in, outputs=live_transcript)
         clear_btn.click(fn=clear_transcript, outputs=live_transcript)
+    demo.load(lambda: None, js="document.getElementById('docimg').scrollIntoView({ behavior: 'smooth', block: 'start' })")
+demo.launch()