IAMTFRMZA committed on
Commit
9ee7546
·
verified ·
1 Parent(s): f06d67c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +32 -59
app.py CHANGED
@@ -34,7 +34,7 @@ class WebSocketClient:
34
  await self.websocket.send(f.read())
35
  await asyncio.gather(self.receive_messages(), self.send_audio_chunks())
36
  except Exception as e:
37
- print(f"🔴 WebSocket Connection Failed: {e}")
38
 
39
  def run(self):
40
  asyncio.set_event_loop(self.loop)
@@ -94,21 +94,17 @@ def clear_chat_only():
94
  def handle_chat(user_input, history, thread_id, image_url):
95
  if not OPENAI_API_KEY or not ASSISTANT_ID:
96
  return "❌ Missing secrets!", history, thread_id, image_url
97
-
98
  try:
99
  if thread_id is None:
100
  thread = client.beta.threads.create()
101
  thread_id = thread.id
102
-
103
  client.beta.threads.messages.create(thread_id=thread_id, role="user", content=user_input)
104
  run = client.beta.threads.runs.create(thread_id=thread_id, assistant_id=ASSISTANT_ID)
105
-
106
  while True:
107
  status = client.beta.threads.runs.retrieve(thread_id=thread_id, run_id=run.id)
108
  if status.status == "completed":
109
  break
110
  time.sleep(1)
111
-
112
  msgs = client.beta.threads.messages.list(thread_id=thread_id)
113
  for msg in reversed(msgs.data):
114
  if msg.role == "assistant":
@@ -116,14 +112,11 @@ def handle_chat(user_input, history, thread_id, image_url):
116
  history.append((user_input, content))
117
  match = re.search(
118
  r'https://raw\.githubusercontent\.com/AndrewLORTech/surgical-pathology-manual/main/[\w\-/]*\.png',
119
- content
120
- )
121
  if match:
122
  image_url = match.group(0)
123
  break
124
-
125
  return "", history, thread_id, image_url
126
-
127
  except Exception as e:
128
  return f"❌ {e}", history, thread_id, image_url
129
 
@@ -139,8 +132,6 @@ def update_image_display(image_url):
139
  return image_url
140
  return None
141
 
142
- # ============ Gradio UI ============
143
-
144
  with gr.Blocks(theme=gr.themes.Soft()) as app:
145
  gr.Markdown("# πŸ“„ Document AI Assistant")
146
 
@@ -154,11 +145,7 @@ with gr.Blocks(theme=gr.themes.Soft()) as app:
154
  margin-top: 10px;
155
  white-space: nowrap;
156
  }
157
- .voice-area {
158
- padding-top: 12px;
159
- border-top: 1px solid #444;
160
- margin-top: 12px;
161
- }
162
  </style>
163
  """)
164
 
@@ -167,64 +154,50 @@ with gr.Blocks(theme=gr.themes.Soft()) as app:
167
  image_state = gr.State()
168
  client_id = gr.State()
169
 
170
- with gr.Row(equal_height=True):
 
 
171
 
172
- with gr.Column(scale=1):
173
- with gr.Accordion("πŸ“„ Document Viewer", open=True):
174
- image_display = gr.Image(
175
- label="πŸ–ΌοΈ Document",
176
- type="filepath",
177
- show_download_button=False,
178
- height=480
179
- )
180
 
181
- with gr.Column(scale=2):
182
  chat = gr.Chatbot(label="πŸ’¬ Chat", height=480)
183
-
184
  with gr.Row():
185
  user_prompt = gr.Textbox(placeholder="Ask your question...", show_label=False, scale=8)
186
  send_btn = gr.Button("Send", variant="primary", scale=2)
187
-
188
  with gr.Row():
189
  clear_chat_btn = gr.Button("πŸ—‘οΈ Clear Chat", elem_classes="big-btn")
190
 
191
- with gr.Column(scale=1):
192
- with gr.Accordion("πŸŽ™οΈ Voice Input", open=True):
193
- gr.Markdown("### πŸŽ™οΈ Voice Input")
194
- voice_input = gr.Audio(label="Tap to Record", streaming=True, type="numpy", show_label=True)
195
- voice_transcript = gr.Textbox(label="Transcript", lines=2, interactive=False)
196
-
197
- with gr.Row(equal_height=True):
198
- with gr.Column(scale=1):
199
- voice_send_btn = gr.Button("🟒 Send Voice to Assistant", elem_classes="big-btn")
200
- with gr.Column(scale=1):
201
- clear_transcript_btn = gr.Button("🧹 Clear Transcript", elem_classes="big-btn")
202
-
203
- # Bindings
204
- send_btn.click(fn=handle_chat,
205
- inputs=[user_prompt, chat_state, thread_state, image_state],
206
- outputs=[user_prompt, chat, thread_state, image_state])
207
 
208
- voice_input.stream(fn=send_audio,
209
- inputs=[voice_input, client_id],
210
- outputs=voice_transcript,
211
- stream_every=0.5)
212
 
213
- voice_send_btn.click(fn=feed_transcript,
214
- inputs=[voice_transcript, chat_state, thread_state, image_state, client_id],
215
- outputs=[user_prompt, chat, thread_state, image_state])
216
 
217
- clear_transcript_btn.click(fn=clear_transcript_only,
218
- inputs=[client_id],
219
- outputs=voice_transcript)
220
 
221
- clear_chat_btn.click(fn=clear_chat_only,
222
- outputs=[chat, thread_state, image_state])
223
 
224
- image_state.change(fn=update_image_display,
225
- inputs=image_state,
226
- outputs=image_display)
227
 
 
 
 
228
  app.load(fn=create_ws, outputs=[client_id])
229
 
230
  app.launch()
 
34
  await self.websocket.send(f.read())
35
  await asyncio.gather(self.receive_messages(), self.send_audio_chunks())
36
  except Exception as e:
37
+ print(f"\U0001F534 WebSocket Connection Failed: {e}")
38
 
39
  def run(self):
40
  asyncio.set_event_loop(self.loop)
 
94
  def handle_chat(user_input, history, thread_id, image_url):
95
  if not OPENAI_API_KEY or not ASSISTANT_ID:
96
  return "❌ Missing secrets!", history, thread_id, image_url
 
97
  try:
98
  if thread_id is None:
99
  thread = client.beta.threads.create()
100
  thread_id = thread.id
 
101
  client.beta.threads.messages.create(thread_id=thread_id, role="user", content=user_input)
102
  run = client.beta.threads.runs.create(thread_id=thread_id, assistant_id=ASSISTANT_ID)
 
103
  while True:
104
  status = client.beta.threads.runs.retrieve(thread_id=thread_id, run_id=run.id)
105
  if status.status == "completed":
106
  break
107
  time.sleep(1)
 
108
  msgs = client.beta.threads.messages.list(thread_id=thread_id)
109
  for msg in reversed(msgs.data):
110
  if msg.role == "assistant":
 
112
  history.append((user_input, content))
113
  match = re.search(
114
  r'https://raw\.githubusercontent\.com/AndrewLORTech/surgical-pathology-manual/main/[\w\-/]*\.png',
115
+ content)
 
116
  if match:
117
  image_url = match.group(0)
118
  break
 
119
  return "", history, thread_id, image_url
 
120
  except Exception as e:
121
  return f"❌ {e}", history, thread_id, image_url
122
 
 
132
  return image_url
133
  return None
134
 
 
 
135
  with gr.Blocks(theme=gr.themes.Soft()) as app:
136
  gr.Markdown("# πŸ“„ Document AI Assistant")
137
 
 
145
  margin-top: 10px;
146
  white-space: nowrap;
147
  }
148
+ .toggle-btn { margin-bottom: 8px; }
 
 
 
 
149
  </style>
150
  """)
151
 
 
154
  image_state = gr.State()
155
  client_id = gr.State()
156
 
157
+ with gr.Row():
158
+ toggle_left = gr.Button("πŸ“„ Toggle Document Panel", elem_classes="toggle-btn")
159
+ toggle_right = gr.Button("πŸŽ™οΈ Toggle Voice Panel", elem_classes="toggle-btn")
160
 
161
+ with gr.Row(equal_height=True) as layout_row:
162
+ with gr.Column(scale=1, visible=True) as left_col:
163
+ image_display = gr.Image(label="πŸ–ΌοΈ Document", type="filepath", show_download_button=False, height=480)
 
 
 
 
 
164
 
165
+ with gr.Column(scale=2, visible=True) as center_col:
166
  chat = gr.Chatbot(label="πŸ’¬ Chat", height=480)
 
167
  with gr.Row():
168
  user_prompt = gr.Textbox(placeholder="Ask your question...", show_label=False, scale=8)
169
  send_btn = gr.Button("Send", variant="primary", scale=2)
 
170
  with gr.Row():
171
  clear_chat_btn = gr.Button("πŸ—‘οΈ Clear Chat", elem_classes="big-btn")
172
 
173
+ with gr.Column(scale=1, visible=True) as right_col:
174
+ gr.Markdown("### πŸŽ™οΈ Voice Input")
175
+ voice_input = gr.Audio(label="Tap to Record", streaming=True, type="numpy", show_label=True)
176
+ voice_transcript = gr.Textbox(label="Transcript", lines=2, interactive=False)
177
+ with gr.Row(equal_height=True):
178
+ with gr.Column(scale=1):
179
+ voice_send_btn = gr.Button("🟒 Send Voice to Assistant", elem_classes="big-btn")
180
+ with gr.Column(scale=1):
181
+ clear_transcript_btn = gr.Button("🧹 Clear Transcript", elem_classes="big-btn")
 
 
 
 
 
 
 
182
 
183
+ def toggle_column_visibility(current_vis):
184
+ return gr.update(visible=not current_vis)
 
 
185
 
186
+ toggle_left.click(lambda v: toggle_column_visibility(v), inputs=[left_col], outputs=[left_col])
187
+ toggle_right.click(lambda v: toggle_column_visibility(v), inputs=[right_col], outputs=[right_col])
 
188
 
189
+ send_btn.click(fn=handle_chat, inputs=[user_prompt, chat_state, thread_state, image_state],
190
+ outputs=[user_prompt, chat, thread_state, image_state])
 
191
 
192
+ voice_input.stream(fn=send_audio, inputs=[voice_input, client_id],
193
+ outputs=voice_transcript, stream_every=0.5)
194
 
195
+ voice_send_btn.click(fn=feed_transcript, inputs=[voice_transcript, chat_state, thread_state, image_state, client_id],
196
+ outputs=[user_prompt, chat, thread_state, image_state])
 
197
 
198
+ clear_transcript_btn.click(fn=clear_transcript_only, inputs=[client_id], outputs=voice_transcript)
199
+ clear_chat_btn.click(fn=clear_chat_only, outputs=[chat, thread_state, image_state])
200
+ image_state.change(fn=update_image_display, inputs=image_state, outputs=image_display)
201
  app.load(fn=create_ws, outputs=[client_id])
202
 
203
  app.launch()