Spaces:

ProfessorLeVesseur
/

VisionTexts

Sleeping

App Files Community

ProfessorLeVesseur committed on Feb 22, 2024

Commit

61752c9

verified ·

1 Parent(s): 235a4b4

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -77

app.py CHANGED Viewed

@@ -23,9 +23,10 @@ openai.api_key = st.secrets["openai_api_key"]
 uploaded_file = st.file_uploader("Upload an image", type=["jpg", "png", "jpeg"])
 if uploaded_file:
-    # Display the uploaded image
-    with st.expander("Image", expanded = True):
-        st.image(uploaded_file, caption=uploaded_file.name, use_column_width=True)
 # Toggle for showing additional details input
 show_details = st.toggle("Add details about the image", value=False)
@@ -40,79 +41,6 @@ if show_details:
 # Button to trigger the analysis
 analyze_button = st.button("Analyze the Image", type="secondary")
-# # Check if an image has been uploaded, if the API key is available, and if the button has been pressed
-# if uploaded_file is not None and analyze_button:
-#     with st.spinner("Analyzing the image ..."):
-#         # Encode the image
-#         base64_image = encode_image(uploaded_file)
-#         # Optimized prompt for additional clarity and detail
-#         prompt_text = (
-#             "You are a highly knowledgeable accessibility expert. "
-#             "Your task is to examine the following image in detail. "
-#             "Provide a comprehensive, factual, and accurate explanation of what the image depicts. "
-#             "Highlight key elements and their significance, and present your analysis in clear, well-structured paragraph format. "
-#             "Create a detailed image caption in explaining in 150 words or less."
-#         )
-#         if show_details and additional_details:
-#             prompt_text += (
-#                 f"\n\nAdditional Context Provided by the User:\n{additional_details}"
-#             )
-#         # Create the payload for the completion request
-#         messages = [
-#             {
-#                 "role": "user",
-#                 "content": [
-#                     {"type": "text", "text": prompt_text},
-#                     {
-#                         "type": "image_url",
-#                         "image_url": f"data:image/jpeg;base64,{base64_image}",
-#                     },
-#                 ],
-#             }
-#         ]
-#         # Make the request to the OpenAI API
-#         try:
-#             # Without Stream
-#             # response = openai.chat.completions.create(
-#             #     model="gpt-4-vision-preview", messages=messages, max_tokens=500, stream=False
-#             # )
-#             # Stream the response
-#             full_response = ""
-#             message_placeholder = st.empty()
-#             for completion in openai.chat.completions.create(
-#                 model="gpt-4-vision-preview", messages=messages,
-#                 max_tokens=150, stream=True
-#             ):
-#                 # Check if there is content to display
-#                 if completion.choices[0].delta.content is not None:
-#                     full_response += completion.choices[0].delta.content
-#                     message_placeholder.markdown(full_response + "▌")
-#             # Final update to placeholder after the stream ends
-#             message_placeholder.markdown(full_response)
-#             # Display the response in the app
-#             # st.write(response.choices[0].message.content)
-#         except Exception as e:
-#             st.error(f"An error occurred: {e}")
-# else:
-#     # Warnings for user action required
-#     if not uploaded_file and analyze_button:
-#         st.warning("Please upload an image.")
 # Check if an image has been uploaded, if the API key is available, and if the button has been pressed
 if uploaded_file is not None and analyze_button:
@@ -126,7 +54,7 @@ if uploaded_file is not None and analyze_button:
             "Your task is to examine the following image in detail. "
             "Provide a comprehensive, factual, and accurate explanation of what the image depicts. "
             "Highlight key elements and their significance, and present your analysis in clear, well-structured paragraph format. "
-            "Create a detailed image caption in explaining in 150 words or less."
         )
         if show_details and additional_details:
@@ -163,6 +91,13 @@ if uploaded_file is not None and analyze_button:
                 model="gpt-4-vision-preview", messages=messages,
                 max_tokens=150, stream=True
             ):
                 # Check if there is content to display
                 if completion.choices[0].delta.content is not None:
                     full_response += completion.choices[0].delta.content

 uploaded_file = st.file_uploader("Upload an image", type=["jpg", "png", "jpeg"])
 if uploaded_file:
+    # Display the uploaded image with specified width
+    image_width = 300  # Set the desired width in pixels
+    with st.expander("Image", expanded=True):
+        st.image(uploaded_file, caption=uploaded_file.name, width=image_width, use_column_width=False)
 # Toggle for showing additional details input
 show_details = st.toggle("Add details about the image", value=False)
 # Button to trigger the analysis
 analyze_button = st.button("Analyze the Image", type="secondary")
 # Check if an image has been uploaded, if the API key is available, and if the button has been pressed
 if uploaded_file is not None and analyze_button:
             "Your task is to examine the following image in detail. "
             "Provide a comprehensive, factual, and accurate explanation of what the image depicts. "
             "Highlight key elements and their significance, and present your analysis in clear, well-structured paragraph format. "
+            "Create a detailed image caption explaining in 150 words or less, using no bullet points, just one paragraph."
         )
         if show_details and additional_details:
                 model="gpt-4-vision-preview", messages=messages,
                 max_tokens=150, stream=True
             ):
+            #     # Check if there is content to display
+            #     if completion.choices[0].delta.content is not None:
+            #         full_response += completion.choices[0].delta.content
+            #         message_placeholder.markdown(full_response + "▌")
+            # # Final update to placeholder after the stream ends
+            # message_placeholder.markdown(full_response) # stream text
                 # Check if there is content to display
                 if completion.choices[0].delta.content is not None:
                     full_response += completion.choices[0].delta.content