Spaces:

eaglelandsonce
/

GrokAgenticWorkforce

Runtime error

App Files Community

eaglelandsonce committed on Apr 2, 2024

Commit

c5c69f5

verified ·

1 Parent(s): ac4d3aa

Update pages/5_Gemini-Chat.py

Browse files

Files changed (1) hide show

pages/5_Gemini-Chat.py +75 -23

pages/5_Gemini-Chat.py CHANGED Viewed

@@ -5,7 +5,7 @@ import base64
 import uuid
 from gtts import gTTS
 import google.generativeai as genai
-from io import BytesIO
 # Set your API key
 api_key = "AIzaSyC70u1sN87IkoxOoIj4XCAPw97ae2LZwNM"  # Replace with your actual API key
@@ -39,17 +39,12 @@ safety_settings = [
 # Initialize session state
 if 'chat_history' not in st.session_state:
-    st.session_state.chat_history = []
 if 'file_uploader_key' not in st.session_state:
-    st.session_state.file_uploader_key = str(uuid.uuid4())
 st.title("Gemini Chatbot")
-# Displaying the system message for users
-st.markdown("""
-**AI Planner System Prompt:** As the AI Planner, your primary task is to assist in the development of a coherent and engaging book. You will be responsible for organizing the overall structure, defining the plot or narrative, and outlining the chapters or sections. To accomplish this, you will need to use your understanding of storytelling principles and genre conventions, as well as any specific information provided by the user, to create a well-structured framework for the book.
-""")
 # Helper functions for image processing and chat history management
 def get_image_base64(image):
     image = image.convert("RGB")
@@ -59,11 +54,11 @@ def get_image_base64(image):
     return img_str
 def clear_conversation():
-    st.session_state.chat_history = []
-    st.session_state.file_uploader_key = str(uuid.uuid4())
 def display_chat_history():
-    for entry in st.session_state.chat_history:
         role = entry["role"]
         parts = entry["parts"][0]
         if 'text' in parts:
@@ -75,34 +70,50 @@ def get_chat_history_str():
     chat_history_str = "\n".join(
         f"{entry['role'].title()}: {part['text']}" if 'text' in part
         else f"{entry['role'].title()}: (Image)"
-        for entry in st.session_state.chat_history
         for part in entry['parts']
     )
     return chat_history_str
-# Function to send messages
 def send_message():
     user_input = st.session_state.user_input
     prompts = []
     prompt_parts = []
     if user_input:
         prompts.append(user_input)
-        st.session_state.chat_history.append({"role": "user", "parts": [{"text": user_input}]})
         prompt_parts.append({"text": user_input})
-    # Handling uploaded files directly
     if uploaded_files:
         for uploaded_file in uploaded_files:
             base64_image = get_image_base64(Image.open(uploaded_file))
             prompts.append("[Image]")
             prompt_parts.append({"data": base64_image, "mime_type": "image/jpeg"})
-            st.session_state.chat_history.append({
                 "role": "user",
                 "parts": [{"mime_type": uploaded_file.type, "data": base64_image}]
             })
     use_vision_model = any(part.get('mime_type') == 'image/jpeg' for part in prompt_parts)
     model_name = 'gemini-pro-vision' if use_vision_model else 'gemini-pro'
     model = genai.GenerativeModel(
         model_name=model_name,
@@ -111,35 +122,75 @@ def send_message():
     )
     chat_history_str = "\n".join(prompts)
     if use_vision_model:
         generated_prompt = {"role": "user", "parts": prompt_parts}
     else:
         generated_prompt = {"role": "user", "parts": [{"text": chat_history_str}]}
     response = model.generate_content([generated_prompt])
     response_text = response.text if hasattr(response, "text") else "No response text found."
     if response_text:
-        st.session_state.chat_history.append({"role": "model", "parts":[{"text": response_text}]})
         tts = gTTS(text=response_text, lang='en')
         tts_file = BytesIO()
         tts.write_to_fp(tts_file)
         tts_file.seek(0)
         st.audio(tts_file, format='audio/mp3')
     st.session_state.user_input = ''
     display_chat_history()
-# UI components for user input, file uploader, send and clear buttons
-user_input = st.text_area("Enter your message here:", value="", key="user_input")
-uploaded_files = st.file_uploader("Upload images:", type=["png", "jpg", "jpeg"], accept_multiple_files=True, key="file_uploader_key")
-send_button = st.button("Send", on_click=send_message)
 clear_button = st.button("Clear Conversation", on_click=clear_conversation)
 def download_chat_history():
-    return get_chat_history_str()
-download_button = st.download_button("Download Chat", data=download_chat_history(), file_name="chat_history.txt", mime="text/plain")
 st.markdown(
     """
     <script>
@@ -155,3 +206,4 @@ st.markdown(
     """,
     unsafe_allow_html=True
 )

 import uuid
 from gtts import gTTS
 import google.generativeai as genai
+from io import BytesIO  # Import BytesIO
 # Set your API key
 api_key = "AIzaSyC70u1sN87IkoxOoIj4XCAPw97ae2LZwNM"  # Replace with your actual API key
 # Initialize session state
 if 'chat_history' not in st.session_state:
+    st.session_state['chat_history'] = []
 if 'file_uploader_key' not in st.session_state:
+    st.session_state['file_uploader_key'] = str(uuid.uuid4())
 st.title("Gemini Chatbot")
 # Helper functions for image processing and chat history management
 def get_image_base64(image):
     image = image.convert("RGB")
     return img_str
 def clear_conversation():
+    st.session_state['chat_history'] = []
+    st.session_state['file_uploader_key'] = str(uuid.uuid4())
 def display_chat_history():
+    for entry in st.session_state['chat_history']:
         role = entry["role"]
         parts = entry["parts"][0]
         if 'text' in parts:
     chat_history_str = "\n".join(
         f"{entry['role'].title()}: {part['text']}" if 'text' in part
         else f"{entry['role'].title()}: (Image)"
+        for entry in st.session_state['chat_history']
         for part in entry['parts']
     )
     return chat_history_str
+# Send message function with TTS integration
 def send_message():
     user_input = st.session_state.user_input
+    uploaded_files = st.session_state.uploaded_files
     prompts = []
     prompt_parts = []
+    # Populate the prompts list with the existing chat history
+    for entry in st.session_state['chat_history']:
+        for part in entry['parts']:
+            if 'text' in part:
+                prompts.append(part['text'])
+            elif 'data' in part:
+                # Add the image in base64 format to prompt_parts for vision model
+                prompt_parts.append({"data": part['data'], "mime_type": "image/jpeg"})
+                prompts.append("[Image]")
+    # Append the user input to the prompts list
     if user_input:
         prompts.append(user_input)
+        st.session_state['chat_history'].append({"role": "user", "parts": [{"text": user_input}]})
+        # Also add the user text input to prompt_parts
         prompt_parts.append({"text": user_input})
+    # Handle uploaded files
     if uploaded_files:
         for uploaded_file in uploaded_files:
             base64_image = get_image_base64(Image.open(uploaded_file))
             prompts.append("[Image]")
             prompt_parts.append({"data": base64_image, "mime_type": "image/jpeg"})
+            st.session_state['chat_history'].append({
                 "role": "user",
                 "parts": [{"mime_type": uploaded_file.type, "data": base64_image}]
             })
+    # Determine if vision model should be used
     use_vision_model = any(part.get('mime_type') == 'image/jpeg' for part in prompt_parts)
+    # Set up the model and generate a response
     model_name = 'gemini-pro-vision' if use_vision_model else 'gemini-pro'
     model = genai.GenerativeModel(
         model_name=model_name,
     )
     chat_history_str = "\n".join(prompts)
     if use_vision_model:
+        # Include text and images for vision model
         generated_prompt = {"role": "user", "parts": prompt_parts}
     else:
+        # Include text only for standard model
         generated_prompt = {"role": "user", "parts": [{"text": chat_history_str}]}
     response = model.generate_content([generated_prompt])
     response_text = response.text if hasattr(response, "text") else "No response text found."
+    # After generating the response from the model, append it to the chat history
     if response_text:
+        st.session_state['chat_history'].append({"role": "model", "parts":[{"text": response_text}]})
+        # Convert the response text to speech
         tts = gTTS(text=response_text, lang='en')
         tts_file = BytesIO()
         tts.write_to_fp(tts_file)
         tts_file.seek(0)
         st.audio(tts_file, format='audio/mp3')
+    # Clear the input fields after sending the message
     st.session_state.user_input = ''
+    st.session_state.uploaded_files = []
+    st.session_state.file_uploader_key = str(uuid.uuid4())
+    # Display the updated chat history
     display_chat_history()
+# User input text area
+user_input = st.text_area(
+    "Enter your message here:",
+    value="",
+    key="user_input"
+)
+# File uploader for images
+uploaded_files = st.file_uploader(
+    "Upload images:",
+    type=["png", "jpg", "jpeg"],
+    accept_multiple_files=True,
+    key=st.session_state.file_uploader_key
+)
+# Send message button
+send_button = st.button(
+    "Send",
+    on_click=send_message
+)
+# Clear conversation button
 clear_button = st.button("Clear Conversation", on_click=clear_conversation)
+# Function to download the chat history as a text file
 def download_chat_history():
+    chat_history_str = get_chat_history_str()
+    return chat_history_str
+# Download button for the chat history
+download_button = st.download_button(
+    label="Download Chat",
+    data=download_chat_history(),
+    file_name="chat_history.txt",
+    mime="text/plain"
+)
+# Store the uploader's current files in session state so the send_message callback can read them
+st.session_state.uploaded_files = uploaded_files
+# JavaScript to capture the Ctrl+Enter event and trigger a button click
 st.markdown(
     """
     <script>
     """,
     unsafe_allow_html=True
 )