Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -222,9 +222,10 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Base().set(
|
|
222 |
inputs=[msg, chatbot, system_prompt, temperature, max_new_tokens, top_p, top_k],
|
223 |
outputs=[chatbot, audio_output])
|
224 |
clear_btn.click(lambda: (None, None), None, [chatbot, audio_output], queue=False)
|
225 |
-
|
226 |
with gr.Tab("Vision Model with TTS (Phi-3.5-vision)"):
|
227 |
-
|
|
|
228 |
with gr.Column(scale=1):
|
229 |
vision_input_img = gr.Image(label="Upload an Image", type="pil")
|
230 |
vision_text_input = gr.Textbox(label="Ask a question about the image", placeholder="What do you see in this image?")
|
@@ -236,6 +237,9 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Base().set(
|
|
236 |
vision_submit_btn.click(process_vision_query,
|
237 |
inputs=[vision_input_img, vision_text_input],
|
238 |
outputs=[vision_output_text, vision_output_audio])
|
|
|
|
|
|
|
239 |
|
240 |
|
241 |
with gr.Tab("Text-to-Speech (Parler-TTS)"):
|
|
|
222 |
inputs=[msg, chatbot, system_prompt, temperature, max_new_tokens, top_p, top_k],
|
223 |
outputs=[chatbot, audio_output])
|
224 |
clear_btn.click(lambda: (None, None), None, [chatbot, audio_output], queue=False)
|
225 |
+
|
226 |
with gr.Tab("Vision Model with TTS (Phi-3.5-vision)"):
|
227 |
+
|
228 |
+
with gr.Row():
|
229 |
with gr.Column(scale=1):
|
230 |
vision_input_img = gr.Image(label="Upload an Image", type="pil")
|
231 |
vision_text_input = gr.Textbox(label="Ask a question about the image", placeholder="What do you see in this image?")
|
|
|
237 |
vision_submit_btn.click(process_vision_query,
|
238 |
inputs=[vision_input_img, vision_text_input],
|
239 |
outputs=[vision_output_text, vision_output_audio])
|
240 |
+
|
241 |
+
|
242 |
+
|
243 |
|
244 |
|
245 |
with gr.Tab("Text-to-Speech (Parler-TTS)"):
|