Spaces:

AiCodeCarft
/

Gemini-Interface

Running

App Files Files Community

Alibrown commited on Nov 17, 2024

Commit

254bad9

verified ·

1 Parent(s): dc9257c

Update app.py

Browse files

Files changed (1) hide show

app.py +26 -4

app.py CHANGED Viewed

@@ -4,12 +4,21 @@ import streamlit as st
 import google.generativeai as genai
 from PIL import Image
 import io
 st.set_page_config(page_title="Gemini AI Chat", layout="wide")
 st.title("🤖 Gemini AI Chat Interface by Volkan Sah")
 st.markdown("Chat with Google's Gemini AI models. Supports both text and image inputs. Follow me on Github@volkansah for more cool stuff!")
 # Sidebar for settings
 with st.sidebar:
     api_key = st.text_input("Enter Google AI API Key", type="password")
@@ -41,7 +50,7 @@ uploaded_file = st.file_uploader("Upload an image (optional)", type=["jpg", "jpe
 uploaded_image = None
 if uploaded_file is not None:
     uploaded_image = Image.open(uploaded_file).convert('RGB')
-    st.image(uploaded_image, caption="Uploaded Image", use_container_width=True)  # Fixed here
 # Chat input
 user_input = st.chat_input("Type your message here...")
@@ -59,9 +68,21 @@ if user_input and api_key:
         # Prepare the model and content
         model_instance = genai.GenerativeModel(model_name=model)
-        content = [{"text": user_input}]
         if uploaded_image:
-            content.append({"inline_data": {"mime_type": "image/jpeg", "data": uploaded_image}})
         # Generate response
         response = model_instance.generate_content(
@@ -81,6 +102,7 @@ if user_input and api_key:
     except Exception as e:
         st.error(f"Error: {str(e)}")
 elif not api_key and user_input:
     st.warning("Please enter your API key in the sidebar first.")
@@ -90,7 +112,7 @@ with st.sidebar:
     st.markdown("""
     ## 📝 Instructions:
     1. Enter your Google AI API key
-    2. Select a model
     3. Adjust temperature and max tokens if needed
     4. Optional: Set a system prompt
     5. Upload an image (optional)

 import google.generativeai as genai
 from PIL import Image
 import io
+import base64
 st.set_page_config(page_title="Gemini AI Chat", layout="wide")
 st.title("🤖 Gemini AI Chat Interface by Volkan Sah")
 st.markdown("Chat with Google's Gemini AI models. Supports both text and image inputs. Follow me on Github@volkansah for more cool stuff!")
+def encode_image(image):
+    """Convert PIL Image to base64 string"""
+    buffered = io.BytesIO()
+    image.save(buffered, format="JPEG")
+    image_bytes = buffered.getvalue()
+    encoded_image = base64.b64encode(image_bytes).decode('utf-8')
+    return encoded_image
 # Sidebar for settings
 with st.sidebar:
     api_key = st.text_input("Enter Google AI API Key", type="password")
 uploaded_image = None
 if uploaded_file is not None:
     uploaded_image = Image.open(uploaded_file).convert('RGB')
+    st.image(uploaded_image, caption="Uploaded Image", use_container_width=True)
 # Chat input
 user_input = st.chat_input("Type your message here...")
         # Prepare the model and content
         model_instance = genai.GenerativeModel(model_name=model)
+        content = []
         if uploaded_image:
+            # Convert image to base64
+            encoded_image = encode_image(uploaded_image)
+            content = [
+                {"text": user_input},
+                {
+                    "inline_data": {
+                        "mime_type": "image/jpeg",
+                        "data": encoded_image
+                    }
+                }
+            ]
+        else:
+            content = [{"text": user_input}]
         # Generate response
         response = model_instance.generate_content(
     except Exception as e:
         st.error(f"Error: {str(e)}")
+        st.error("If using an image, make sure to select a vision-enabled model (ones with 'vision' in the name)")
 elif not api_key and user_input:
     st.warning("Please enter your API key in the sidebar first.")
     st.markdown("""
     ## 📝 Instructions:
     1. Enter your Google AI API key
+    2. Select a model (use vision models for image analysis)
     3. Adjust temperature and max tokens if needed
     4. Optional: Set a system prompt
     5. Upload an image (optional)