Narayana02 committed on
Commit
19e494c
·
verified ·
1 Parent(s): 7ec2b4b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +34 -29
app.py CHANGED
@@ -2,41 +2,48 @@ import streamlit as st
2
  from huggingface_hub import InferenceClient
3
  from config import HUGGINGFACE_API_KEY # Import your API key from a separate config file
4
  from PIL import Image
 
5
  from io import BytesIO
6
 
7
  # Streamlit App Configuration
8
  st.set_page_config(page_title="Llama-3.2 Demo App", page_icon="πŸ€–", layout="wide")
9
  st.title("πŸ–ΌοΈ Llama-3.2-90B-Vision-Instruct Demo App")
10
- st.markdown("<p style='text-align: center; font-size: 18px; color: #555;'>Upload an image and receive a text description of its content</p>", unsafe_allow_html=True)
11
 
12
- # User Inputs
13
- uploaded_image = st.file_uploader("Upload an Image", type=["png", "jpg", "jpeg"])
14
  user_prompt = st.text_input("Enter your prompt", value="Describe this image in a paragraph", placeholder="e.g., What is shown in the image?")
15
 
16
# Render a user-uploaded image in the app and hand the PIL object back.
def show_uploaded_image(uploaded_image):
    """Open *uploaded_image* with PIL, display it full-width, and return it.

    On any failure (unreadable file, rendering error) the error is shown
    in the UI via ``st.error`` and ``None`` is returned instead of raising.
    """
    try:
        img = Image.open(uploaded_image)
        st.image(img, caption="Uploaded Image", use_container_width=True)
    except Exception as e:
        st.error(f"❌ Unable to display image. Error: {e}")
        return None
    return img
25
 
26
  # Process user input
27
  if st.button("Get Description", key="get_description"):
28
- if uploaded_image and user_prompt:
29
  try:
30
- # Display the uploaded image
31
- img = show_uploaded_image(uploaded_image)
32
- if img is None:
33
- st.error("❌ Image processing failed.")
34
- st.stop()
35
-
36
- # Convert the image to bytes for model input
37
- img_buffer = BytesIO()
38
- img.save(img_buffer, format="PNG")
39
- img_bytes = img_buffer.getvalue()
40
 
41
  # Initialize the InferenceClient
42
  client = InferenceClient(api_key=HUGGINGFACE_API_KEY)
@@ -47,7 +54,7 @@ if st.button("Get Description", key="get_description"):
47
  "role": "user",
48
  "content": [
49
  {"type": "text", "text": user_prompt},
50
- {"type": "image", "image": {"bytes": img_bytes}}
51
  ]
52
  }
53
  ]
@@ -62,14 +69,16 @@ if st.button("Get Description", key="get_description"):
62
  # Extract JSON response
63
  model_response = completion.choices[0].message
64
 
65
- # Display the result
66
  st.subheader("πŸ“ Model Response")
 
 
67
  st.markdown(f"**Description**: {model_response.get('content', 'No description available')}")
68
 
69
  except Exception as e:
70
  st.error(f"❌ An error occurred: {e}")
71
  else:
72
- st.warning("⚠️ Please upload an image and enter a prompt.")
73
 
74
  # Clean UI Enhancements
75
  st.markdown("""
@@ -93,10 +102,6 @@ st.markdown("""
93
  border-radius: 10px;
94
  }
95
 
96
- .stFileUploader>div>div {
97
- border-radius: 10px;
98
- }
99
-
100
  /* Center the image */
101
  .stImage {
102
  display: block;
@@ -104,4 +109,4 @@ st.markdown("""
104
  margin-right: auto;
105
  }
106
  </style>
107
- """, unsafe_allow_html=True)
 
2
  from huggingface_hub import InferenceClient
3
  from config import HUGGINGFACE_API_KEY # Import your API key from a separate config file
4
  from PIL import Image
5
+ import requests
6
  from io import BytesIO
7
 
8
  # Streamlit App Configuration
9
  st.set_page_config(page_title="Llama-3.2 Demo App", page_icon="πŸ€–", layout="wide")
10
  st.title("πŸ–ΌοΈ Llama-3.2-90B-Vision-Instruct Demo App")
11
+ st.markdown("<p style='text-align: center; font-size: 18px; color: #555;'>Enter an image URL and get a description</p>", unsafe_allow_html=True)
12
 
13
+ # User Inputs with placeholder
14
+ image_url = st.text_input("Enter Image URL", value="", placeholder="Paste image URL here...", max_chars=400)
15
  user_prompt = st.text_input("Enter your prompt", value="Describe this image in a paragraph", placeholder="e.g., What is shown in the image?")
16
 
17
# Fetch an image from a URL, downscale it to a maximum display height
# (preserving aspect ratio), and render it in the Streamlit app.
def show_image_from_url(image_url, max_height=200):
    """Display the image at *image_url*, resized so its height is at most
    ``max_height`` pixels while keeping the original aspect ratio.

    Network, HTTP, and decoding failures are reported in the UI via
    ``st.error`` instead of raising.
    """
    try:
        # Bounded timeout so an unreachable host cannot hang the app
        # indefinitely; raise_for_status surfaces HTTP errors (404, 403,
        # ...) clearly instead of letting PIL fail on an HTML error page.
        response = requests.get(image_url, timeout=10)
        response.raise_for_status()
        img = Image.open(BytesIO(response.content))

        # Original image dimensions in pixels.
        img_width, img_height = img.size

        # Downscale only; images already within max_height are shown as-is.
        if img_height > max_height:
            aspect_ratio = img_width / img_height
            new_width = int(max_height * aspect_ratio)
            img_resized = img.resize((new_width, max_height))
        else:
            img_resized = img  # No resizing needed if the image is smaller than the max height

        # Center the image and display it
        st.image(img_resized, caption=f"Source: {image_url}", use_container_width=True)

    except Exception as e:
        st.error(f"❌ Unable to load image. Error: {e}")
 
40
 
41
  # Process user input
42
  if st.button("Get Description", key="get_description"):
43
+ if image_url and user_prompt:
44
  try:
45
+ # Show the image with dynamic resizing based on the image size
46
+ show_image_from_url(image_url, max_height=600)
 
 
 
 
 
 
 
 
47
 
48
  # Initialize the InferenceClient
49
  client = InferenceClient(api_key=HUGGINGFACE_API_KEY)
 
54
  "role": "user",
55
  "content": [
56
  {"type": "text", "text": user_prompt},
57
+ {"type": "image_url", "image_url": {"url": image_url}}
58
  ]
59
  }
60
  ]
 
69
  # Extract JSON response
70
  model_response = completion.choices[0].message
71
 
72
+ # Display the result in a clean and simple format
73
  st.subheader("πŸ“ Model Response")
74
+
75
+ # Display Content
76
  st.markdown(f"**Description**: {model_response.get('content', 'No description available')}")
77
 
78
  except Exception as e:
79
  st.error(f"❌ An error occurred: {e}")
80
  else:
81
+ st.warning("⚠️ Please enter an image URL and a prompt.")
82
 
83
  # Clean UI Enhancements
84
  st.markdown("""
 
102
  border-radius: 10px;
103
  }
104
 
 
 
 
 
105
  /* Center the image */
106
  .stImage {
107
  display: block;
 
109
  margin-right: auto;
110
  }
111
  </style>
112
+ """, unsafe_allow_html=True)