Spaces:

krishnapal2308
/

eye_for_blind

Running

App Files Files Community

krishnapal2308 committed on Feb 9, 2024

Commit

35e87cb

verified ·

1 Parent(s): 4e40bc0

Basic model's label and description changed.

Browse files

Files changed (1) hide show

app.py +5 -5

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ This project aims to develop a deep learning model to verbally describe image co
 # Define solution overview
 solution_overview = """
 ### Solution Overview
-The basic model, trained for a limited duration without extensive hyperparameter tuning, primarily focuses on exploring the integration of the attention mechanism with the Encoder-Decoder architecture for image processing. To improve inference quality, Vit-GPT2 architecture is integrated. [Visit the Kaggle notebook](https://www.kaggle.com/code/krishna2308/eye-for-blind) for implementation details.
 """
 # Define real-life scenario application
@@ -30,7 +30,7 @@ While this current implementation may not support real-time processing, the pote
 def process_image_and_generate_output(image, model_selection):
     if image is None:
         return "Please select an image", None
-    if model_selection == 'Basic Model':
         result = inference_script.evaluate(image)
         pred_caption = ' '.join(result).rsplit(' ', 1)[0]
         pred_caption = pred_caption.replace('<unk>', '')
@@ -57,16 +57,16 @@ def process_image_and_generate_output(image, model_selection):
 sample_images = [
     [os.path.join(os.path.dirname(__file__), "sample_images/1.jpg"), "ViT-GPT2"],
-    [os.path.join(os.path.dirname(__file__), "sample_images/1.jpg"), 'Basic Model'],
     [os.path.join(os.path.dirname(__file__), "sample_images/3.jpg"), "ViT-GPT2"],
-    [os.path.join(os.path.dirname(__file__), "sample_images/3.jpg"), 'Basic Model']
 ]
 # Create a dropdown to select sample image
 image_input = gr.Image(label="Upload Image")
 # Create a dropdown to choose the model
-model_selection_input = gr.Radio(["Basic Model",
                                   "ViT-GPT2"],
                                  label="Choose Model")

 # Markdown text for the "Solution Overview" section (heading, description, and notebook link)
 solution_overview = """
 ### Solution Overview
+The basic model, **trained for only 20 epochs without extensive hyperparameter tuning,** primarily focuses on exploring the integration of the attention mechanism with the Encoder-Decoder architecture for image processing utilizing subclassing. To improve inference quality, Vit-GPT2 architecture is integrated. [Visit the Kaggle notebook](https://www.kaggle.com/code/krishna2308/eye-for-blind) for implementation details.
 """
 # Define real-life scenario application
 def process_image_and_generate_output(image, model_selection):
+    """Produce the output for *image* using the model named by *model_selection*.
+
+    Returns ``("Please select an image", None)`` when *image* is ``None``.
+    """
     if image is None:
         return "Please select an image", None
+    # The label contains an apostrophe, so it must be double-quoted: inside a
+    # single-quoted literal the apostrophe ends the string early (SyntaxError).
+    if model_selection == "Basic Model (Results won't be good)":
         result = inference_script.evaluate(image)
+        # Join the tokens, drop the last space-separated one, then remove '<unk>' markers.
         pred_caption = ' '.join(result).rsplit(' ', 1)[0]
         pred_caption = pred_caption.replace('<unk>', '')
 sample_images = [
     [os.path.join(os.path.dirname(__file__), "sample_images/1.jpg"), "ViT-GPT2"],
+    [os.path.join(os.path.dirname(__file__), "sample_images/1.jpg"), 'Basic Model (Results won't be good)'],
     [os.path.join(os.path.dirname(__file__), "sample_images/3.jpg"), "ViT-GPT2"],
+    [os.path.join(os.path.dirname(__file__), "sample_images/3.jpg"), 'Basic Model (Results won't be good)']
 ]
 # Image component (labelled "Upload Image") for the input picture
 image_input = gr.Image(label="Upload Image")
 # Radio buttons (labelled "Choose Model") offering the two model labels
+model_selection_input = gr.Radio(["Basic Model (Results won't be good)",
                                   "ViT-GPT2"],
                                  label="Choose Model")