Update app.py

app.py CHANGED
@@ -53,7 +53,14 @@ st.set_page_config(
     }
 )
 
-
+client = OpenAI(api_key=os.getenv('OPENAI_API_KEY'), organization=os.getenv('OPENAI_ORG_ID'))
+MODEL = "gpt-4o-2024-05-13"
+if "openai_model" not in st.session_state:
+    st.session_state["openai_model"] = MODEL
+if "messages" not in st.session_state:
+    st.session_state.messages = []
+if st.button("Clear Session"):
+    st.session_state.messages = []
 
 # HTML5 based Speech Synthesis (Text to Speech in Browser)
 @st.cache_resource
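The block added above wires up the standard Streamlit chat-state idiom: the OpenAI client and model name are created once at module level, and the running message list lives in `st.session_state` so it survives Streamlit's script reruns. A minimal self-contained sketch of that pattern (assuming only `streamlit` and the v1 `openai` package, not the rest of app.py):

```python
# Sketch of the session-state chat pattern this hunk introduces.
import os
import streamlit as st
from openai import OpenAI

client = OpenAI(api_key=os.getenv('OPENAI_API_KEY'))
MODEL = "gpt-4o-2024-05-13"

# session_state persists across reruns, so history survives widget clicks
if "messages" not in st.session_state:
    st.session_state.messages = []
if st.button("Clear Session"):
    st.session_state.messages = []

if prompt := st.chat_input("Say something"):
    st.session_state.messages.append({"role": "user", "content": prompt})
    completion = client.chat.completions.create(
        model=MODEL,
        messages=st.session_state.messages,
    )
    reply = completion.choices[0].message.content
    st.session_state.messages.append({"role": "assistant", "content": reply})
```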
@@ -359,6 +366,19 @@ def display_glossary_grid(roleplaying_glossary):
         st.markdown(f"**{term}** <small>{links_md}</small>", unsafe_allow_html=True)
 
 
+# ChatBot client chat completions ------------------------- !!
+def process_text2(MODEL='gpt-4o-2024-05-13', text_input='What is 2+2 and what is an imaginary number'):
+    if text_input:
+        completion = client.chat.completions.create(
+            model=MODEL,
+            messages=st.session_state.messages
+        )
+        return_text = completion.choices[0].message.content
+        st.write("Assistant: " + return_text)
+        filename = generate_filename(text_input, "md")
+        create_file(filename, text_input, return_text, should_save)
+        return return_text
+
 @st.cache_resource
 def get_table_download_link(file_path):
 
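Worth noting about `process_text2` as added here: the model call sends the whole `st.session_state.messages` history, and the `text_input` argument is only used for the saved filename, so the caller is expected to append the user turn first. A hypothetical call site illustrating that contract:

```python
# Hypothetical usage of process_text2 (the ordering is the point, not app.py code).
prompt = "What is 2+2 and what is an imaginary number"
st.session_state.messages.append({"role": "user", "content": prompt})
response = process_text2(text_input=prompt)  # model reads the history just appended
```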
@@ -576,10 +596,26 @@ def FileSidebar():
 
     if next_action=='md':
         st.markdown(file_contents)
+        SpeechSynthesis(file_contents)
+
         buttonlabel = '🏃Run'
         if st.button(key='Runmd', label = buttonlabel):
-
-
+            MODEL = "gpt-4o-2024-05-13"
+            openai.api_key = os.getenv('OPENAI_API_KEY')
+            openai.organization = os.getenv('OPENAI_ORG_ID')
+            client = OpenAI(api_key=os.getenv('OPENAI_API_KEY'), organization=os.getenv('OPENAI_ORG_ID'))
+            st.session_state.messages.append({"role": "user", "content": transcript})
+            with st.chat_message("user"):
+                st.markdown(transcript)
+            with st.chat_message("assistant"):
+                completion = client.chat.completions.create(
+                    model=MODEL,
+                    messages = st.session_state.messages,
+                    stream=True
+                )
+                response = process_text2(text_input=prompt)
+                st.session_state.messages.append({"role": "assistant", "content": response})
+            #try:
             #search_glossary(file_contents)
             #except:
             #st.markdown('GPT is sleeping. Restart ETA 30 seconds.')
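As committed, the `Runmd` branch requests `stream=True` but never iterates the returned stream, and `transcript`/`prompt` must already exist in the enclosing scope. For reference, a sketch of how a streamed completion is usually drained in Streamlit (assumes the `client` and `MODEL` from this commit, and Streamlit >= 1.31 for `st.write_stream`):

```python
# Sketch: consuming a streamed chat completion chunk by chunk.
with st.chat_message("assistant"):
    stream = client.chat.completions.create(
        model=MODEL,
        messages=st.session_state.messages,
        stream=True,  # yields incremental chunks instead of one message
    )
    # delta.content is None on some chunks (e.g. the final one), hence `or ""`
    response = st.write_stream(
        chunk.choices[0].delta.content or "" for chunk in stream
    )
st.session_state.messages.append({"role": "assistant", "content": response})
```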
@@ -1241,79 +1277,6 @@ def get_audio_download_link(file_path):
 
 
 
-# 🎵 Wav Audio files - Transcription History in Wav
-audio_files = glob.glob("*.wav")
-audio_files = [file for file in audio_files if len(os.path.splitext(file)[0]) >= 10]  # exclude files with short names
-audio_files.sort(key=lambda x: (os.path.splitext(x)[1], x), reverse=True)  # sort by file type and file name in descending order
-
-# 🖼 PNG Image files
-image_files = glob.glob("*.png")
-image_files = [file for file in image_files if len(os.path.splitext(file)[0]) >= 10]  # exclude files with short names
-image_files.sort(key=lambda x: (os.path.splitext(x)[1], x), reverse=True)  # sort by file type and file name in descending order
-
-# 🎥 MP4 Video files
-video_files = glob.glob("*.mp4")
-video_files = [file for file in video_files if len(os.path.splitext(file)[0]) >= 10]  # exclude files with short names
-video_files.sort(key=lambda x: (os.path.splitext(x)[1], x), reverse=True)  # sort by file type and file name in descending order
-
-# Delete All button for each file type
-if st.sidebar.button("🗑 Delete All Audio"):
-    for file in audio_files:
-        os.remove(file)
-    st.rerun()
-
-if st.sidebar.button("🗑 Delete All Images"):
-    for file in image_files:
-        os.remove(file)
-    st.rerun()
-
-if st.sidebar.button("🗑 Delete All Videos"):
-    for file in video_files:
-        os.remove(file)
-    st.rerun()
-
-# Display and handle audio files
-for file in audio_files:
-    col1, col2 = st.sidebar.columns([6, 1])  # adjust the ratio as needed
-    with col1:
-        st.markdown(file)
-        if st.button("🎵", key="play_" + file):  # play emoji button
-            audio_file = open(file, 'rb')
-            audio_bytes = audio_file.read()
-            st.audio(audio_bytes, format='audio/wav')
-    with col2:
-        if st.button("🗑", key="delete_" + file):
-            os.remove(file)
-            st.rerun()
-
-# Display and handle image files
-for file in image_files:
-    col1, col2 = st.sidebar.columns([6, 1])  # adjust the ratio as needed
-    with col1:
-        st.markdown(file)
-        if st.button("🖼", key="show_" + file):  # show emoji button
-            image = open(file, 'rb').read()
-            st.image(image)
-    with col2:
-        if st.button("🗑", key="delete_" + file):
-            os.remove(file)
-            st.rerun()
-
-# Display and handle video files
-for file in video_files:
-    col1, col2 = st.sidebar.columns([6, 1])  # adjust the ratio as needed
-    with col1:
-        st.markdown(file)
-        if st.button("🎥", key="play_" + file):  # play emoji button
-            video_file = open(file, 'rb')
-            video_bytes = video_file.read()
-            st.video(video_bytes)
-    with col2:
-        if st.button("🗑", key="delete_" + file):
-            os.remove(file)
-            st.rerun()
-
-
 
 GiveFeedback=False
 if GiveFeedback:
@@ -1380,18 +1343,6 @@ def transcribe_canary(filename):
     st.write(result)
     return result
 
-# ChatBot client chat completions ------------------------- !!
-def process_text2(MODEL='gpt-4o-2024-05-13', text_input='What is 2+2 and what is an imaginary number'):
-    if text_input:
-        completion = client.chat.completions.create(
-            model=MODEL,
-            messages=st.session_state.messages
-        )
-        return_text = completion.choices[0].message.content
-        st.write("Assistant: " + return_text)
-        filename = generate_filename(text_input, "md")
-        create_file(filename, text_input, return_text, should_save)
-        return return_text
 
 # Transcript to arxiv and client chat completion ------------------------- !!
 filename = save_and_play_audio(audio_recorder)
@@ -1441,12 +1392,12 @@ if example_input:
     for example_input in session_state["search_queries"]:
         st.write(example_input)
 
-    if st.button("Run Prompt", help="Click to run."):
-        try:
-            response=StreamLLMChatResponse(example_input)
-            create_file(filename, example_input, response, should_save)
-        except:
-            st.write('model is asleep. Starting now on A10 GPU. Please wait one minute then retry. KEDA triggered.')
+    #if st.button("Run Prompt", help="Click to run."):
+    #    try:
+    #        response=StreamLLMChatResponse(example_input)
+    #        create_file(filename, example_input, response, should_save)
+    #    except:
+    #        st.write('model is asleep. Starting now on A10 GPU. Please wait one minute then retry. KEDA triggered.')
 
 openai.api_key = os.getenv('OPENAI_API_KEY')
 if openai.api_key == None: openai.api_key = st.secrets['OPENAI_API_KEY']
@@ -1490,7 +1441,7 @@ if AddAFileForContext:
         st.sidebar.markdown(get_table_download_link(filename), unsafe_allow_html=True)
 
 
-# documentation
+# GPT4o documentation
 # 1. Cookbook: https://cookbook.openai.com/examples/gpt4o/introduction_to_gpt4o
 # 2. Configure your Project and Orgs to limit/allow Models: https://platform.openai.com/settings/organization/general
 # 3. Watch your Billing! https://platform.openai.com/settings/organization/billing/overview
@@ -1531,11 +1482,6 @@ def process_text(text_input):
 
     #st.write("Assistant: " + completion.choices[0].message.content)
 
-
-
-
-
-
 def create_file(filename, prompt, response, is_image=False):
     with open(filename, "w", encoding="utf-8") as f:
         f.write(prompt + "\n\n" + response)
@@ -1607,12 +1553,13 @@ def process_image(image_input, user_prompt):
 
     return image_response
 
-def
-
-
-
-
-
+def create_audio_file(filename, audio_data, should_save):
+    if should_save:
+        with open(filename, "wb") as file:
+            file.write(audio_data.getvalue())
+        st.success(f"Audio file saved as {filename}")
+    else:
+        st.warning("Audio file not saved.")
 
 def process_audio(audio_input, text_input):
     if audio_input:
@@ -1620,15 +1567,20 @@ def process_audio(audio_input, text_input):
             model="whisper-1",
             file=audio_input,
         )
-
-
-
-
-
-
-
-
-
+        st.session_state.messages.append({"role": "user", "content": transcription.text})
+        with st.chat_message("assistant"):
+            st.markdown(transcription.text)
+
+        SpeechSynthesis(transcription.text)
+        filename = generate_filename(transcription.text, "wav")
+
+        create_audio_file(filename, audio_input, should_save)
+
+        #SpeechSynthesis(transcription.text)
+
+        filename = generate_filename(transcription.text, "md")
+        create_file(filename, transcription.text, transcription.text, should_save)
+        #st.markdown(response.choices[0].message.content)
 
 def process_audio_for_video(video_input):
     if video_input:
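The hunk above extends `process_audio` after the Whisper call; the call itself is clipped to its keyword arguments in the diff. A sketch of the usual full shape (openai-python v1; `transcription.text` is what the added lines consume):

```python
# Sketch of the transcription call the added lines hang off of.
def process_audio(audio_input, text_input):
    if audio_input:
        # Streamlit's UploadedFile is file-like, so it can be passed directly
        transcription = client.audio.transcriptions.create(
            model="whisper-1",
            file=audio_input,
        )
        st.session_state.messages.append({"role": "user", "content": transcription.text})
```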
@@ -1733,55 +1685,134 @@ def main():
         image_input = st.file_uploader("Upload an image", type=["jpg", "jpeg", "png"])
         image_response = process_image(image_input, text_input)
 
-
-
     elif option == "Audio":
-        text = "
-
+        text = "You are generating a transcript summary. Create a summary of the provided transcription. Respond in Markdown."
+        text_input = st.text_input(label="Enter text prompt to use with Audio context.", value=text)
+        uploaded_files = st.file_uploader("Upload an audio file", type=["mp3", "wav"], accept_multiple_files=True)
+
+        for audio_input in uploaded_files:
+            st.write(audio_input.name)
+            if audio_input is not None:
+                process_audio(audio_input, text_input)
+
+    elif option == "Audio old":
+        #text = "Transcribe and answer questions as a helpful audio music and speech assistant. "
+        text = "You are generating a transcript summary. Create a summary of the provided transcription. Respond in Markdown."
         text_input = st.text_input(label="Enter text prompt to use with Audio context.", value=text)
 
-
-
+        uploaded_files = st.file_uploader("Upload an audio file", type=["mp3", "wav"], accept_multiple_files=True)
+        for audio_input in uploaded_files:
+            st.write(audio_input.name)
+
+            if audio_input is not None:
+                # To read file as bytes:
+                bytes_data = uploaded_file.getvalue()
+                #st.write(bytes_data)
+
+                # To convert to a string based IO:
+                #stringio = StringIO(uploaded_file.getvalue().decode("utf-8"))
+                #st.write(stringio)
+
+                # To read file as string:
+                #string_data = stringio.read()
+                #st.write(string_data)
+
+                process_audio(audio_input, text_input)
 
     elif option == "Video":
         video_input = st.file_uploader("Upload a video file", type=["mp4"])
         process_audio_and_video(video_input)
 
-    # Image and Video Galleries
-    num_columns_images=st.slider(key="num_columns_images", label="Choose Number of Image Columns", min_value=1, max_value=15, value=5)
-    display_images_and_wikipedia_summaries(num_columns_images)  # Image Jump Grid
 
-
-
+    # Enter the GPT-4o omni model in streamlit chatbot
+    current_messages=[]
+    for message in st.session_state.messages:
+        with st.chat_message(message["role"]):
+            current_messages.append(message)
+            st.markdown(message["content"])
 
 
-    # Optional UI's
-    showExtendedTextInterface=False
-    if showExtendedTextInterface:
-        display_glossary_grid(roleplaying_glossary)  # Word Glossary Jump Grid - Dynamically calculates columns based on details length to keep topic together
-        num_columns_text=st.slider(key="num_columns_text", label="Choose Number of Text Columns", min_value=1, max_value=15, value=4)
-        display_buttons_with_scores(num_columns_text)  # Feedback Jump Grid
-        st.markdown(personality_factors)
 
+# 🎵 Wav Audio files - Transcription History in Wav
+audio_files = glob.glob("*.wav")
+audio_files = [file for file in audio_files if len(os.path.splitext(file)[0]) >= 10]  # exclude files with short names
+audio_files.sort(key=lambda x: (os.path.splitext(x)[1], x), reverse=True)  # sort by file type and file name in descending order
+
+# 🖼 PNG Image files
+image_files = glob.glob("*.png")
+image_files = [file for file in image_files if len(os.path.splitext(file)[0]) >= 10]  # exclude files with short names
+image_files.sort(key=lambda x: (os.path.splitext(x)[1], x), reverse=True)  # sort by file type and file name in descending order
+
+# 🎥 MP4 Video files
+video_files = glob.glob("*.mp4")
+video_files = [file for file in video_files if len(os.path.splitext(file)[0]) >= 10]  # exclude files with short names
+video_files.sort(key=lambda x: (os.path.splitext(x)[1], x), reverse=True)  # sort by file type and file name in descending order
 
 
 
-# st.title("GPT-4o ChatBot")
 
-
-
-
-
-
-
-
-
+main()
+
+# Delete All button for each file type
+if st.sidebar.button("🗑 Delete All Audio"):
+    for file in audio_files:
+        os.remove(file)
+    st.rerun()
+
+if st.sidebar.button("🗑 Delete All Images"):
+    for file in image_files:
+        os.remove(file)
+    st.rerun()
+
+if st.sidebar.button("🗑 Delete All Videos"):
+    for file in video_files:
+        os.remove(file)
+    st.rerun()
+
+# Display and handle audio files
+for file in audio_files:
+    col1, col2 = st.sidebar.columns([6, 1])  # adjust the ratio as needed
+    with col1:
+        st.markdown(file)
+        if st.button("🎵", key="play_" + file):  # play emoji button
+            audio_file = open(file, 'rb')
+            audio_bytes = audio_file.read()
+            st.audio(audio_bytes, format='audio/wav')
+    with col2:
+        if st.button("🗑", key="delete_" + file):
+            os.remove(file)
+            st.rerun()
+
+# Display and handle image files
+for file in image_files:
+    col1, col2 = st.sidebar.columns([6, 1])  # adjust the ratio as needed
+    with col1:
+        st.markdown(file)
+        if st.button("🖼", key="show_" + file):  # show emoji button
+            image = open(file, 'rb').read()
+            st.image(image)
+    with col2:
+        if st.button("🗑", key="delete_" + file):
+            os.remove(file)
+            st.rerun()
+
+# Display and handle video files
+for file in video_files:
+    col1, col2 = st.sidebar.columns([6, 1])  # adjust the ratio as needed
+    with col1:
+        st.markdown(file)
+        if st.button("🎥", key="play_" + file):  # play emoji button
+            video_file = open(file, 'rb')
+            video_bytes = video_file.read()
+            st.video(video_bytes)
+    with col2:
+        if st.button("🗑", key="delete_" + file):
+            os.remove(file)
+            st.rerun()
+
+
+
 
-current_messages=[]
-for message in st.session_state.messages:
-    with st.chat_message(message["role"]):
-        current_messages.append(message)
-        st.markdown(message["content"])
 
 # ChatBot Entry
 if prompt := st.chat_input("GPT-4o Multimodal ChatBot - What can I help you with?"):
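One caveat in the "Audio old" branch above: the loop variable is `audio_input`, but the bytes are read from `uploaded_file`, which is not defined in that loop (it reads like residue from the Streamlit file-uploader docs) and would raise a NameError if the branch ran, unless the name exists elsewhere in app.py. The likely intent, as an assumption rather than anything in this commit:

```python
# Presumed fix for the undefined name in the "Audio old" branch.
bytes_data = audio_input.getvalue()  # read the uploaded file as bytes
```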
@@ -1797,5 +1828,28 @@ if prompt := st.chat_input("GPT-4o Multimodal ChatBot - What can I help you with
         response = process_text2(text_input=prompt)
         st.session_state.messages.append({"role": "assistant", "content": response})
 
-
-
+
+
+
+
+# Image and Video Galleries
+num_columns_images=st.slider(key="num_columns_images", label="Choose Number of Image Columns", min_value=1, max_value=15, value=3)
+display_images_and_wikipedia_summaries(num_columns_images)  # Image Jump Grid
+
+num_columns_video=st.slider(key="num_columns_video", label="Choose Number of Video Columns", min_value=1, max_value=15, value=3)
+display_videos_and_links(num_columns_video)  # Video Jump Grid
+
+
+# Optional UI's
+showExtendedTextInterface=False
+if showExtendedTextInterface:
+    display_glossary_grid(roleplaying_glossary)  # Word Glossary Jump Grid - Dynamically calculates columns based on details length to keep topic together
+    num_columns_text=st.slider(key="num_columns_text", label="Choose Number of Text Columns", min_value=1, max_value=15, value=4)
+    display_buttons_with_scores(num_columns_text)  # Feedback Jump Grid
+    st.markdown(personality_factors)
+
+
+
+
+#if __name__ == "__main__":
+