sagar007 committed on
Commit
dceec72
·
verified ·
1 Parent(s): 2b390ac

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -2
app.py CHANGED
@@ -222,9 +222,10 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Base().set(
222
  inputs=[msg, chatbot, system_prompt, temperature, max_new_tokens, top_p, top_k],
223
  outputs=[chatbot, audio_output])
224
  clear_btn.click(lambda: (None, None), None, [chatbot, audio_output], queue=False)
225
-
226
  with gr.Tab("Vision Model with TTS (Phi-3.5-vision)"):
227
- with gr.Row():
 
228
  with gr.Column(scale=1):
229
  vision_input_img = gr.Image(label="Upload an Image", type="pil")
230
  vision_text_input = gr.Textbox(label="Ask a question about the image", placeholder="What do you see in this image?")
@@ -236,6 +237,9 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Base().set(
236
  vision_submit_btn.click(process_vision_query,
237
  inputs=[vision_input_img, vision_text_input],
238
  outputs=[vision_output_text, vision_output_audio])
 
 
 
239
 
240
 
241
  with gr.Tab("Text-to-Speech (Parler-TTS)"):
 
222
  inputs=[msg, chatbot, system_prompt, temperature, max_new_tokens, top_p, top_k],
223
  outputs=[chatbot, audio_output])
224
  clear_btn.click(lambda: (None, None), None, [chatbot, audio_output], queue=False)
225
+
226
  with gr.Tab("Vision Model with TTS (Phi-3.5-vision)"):
227
+
228
+ with gr.Row():
229
  with gr.Column(scale=1):
230
  vision_input_img = gr.Image(label="Upload an Image", type="pil")
231
  vision_text_input = gr.Textbox(label="Ask a question about the image", placeholder="What do you see in this image?")
 
237
  vision_submit_btn.click(process_vision_query,
238
  inputs=[vision_input_img, vision_text_input],
239
  outputs=[vision_output_text, vision_output_audio])
240
+
241
+
242
+
243
 
244
 
245
  with gr.Tab("Text-to-Speech (Parler-TTS)"):