Spaces:

hanchraizedai
/

semsearch

Running

App Files Files

hanoch.rahimi@gmail committed on Nov 15, 2023

Commit

e54b3e0

1 Parent(s): 6a2ae7a

Added conversation

Browse files

Files changed (4) hide show

app.py +7 -0
openai_utils.py +28 -0
semsearch.pyproj +1 -0
utils.py +27 -3

app.py CHANGED Viewed

@@ -4,6 +4,7 @@ from langchain.chains import RetrievalQA
 from langchain.embeddings.openai import OpenAIEmbeddings
 from langchain.prompts import PromptTemplate
 from langchain.vectorstores import Pinecone
 import openai
 import pinecone
 import streamlit as st
@@ -42,8 +43,14 @@ def init_models():
     #reader = pipeline(tokenizer=model_name, model=model_name, task='question-answering')
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     #vectorstore = Pinecone(st.session_state.index, embed.embed_query, text_field)
     return retriever, tokenizer#, vectorstore
 retriever, tokenizer = init_models()
 #st.session_state.messages = [{"role":"system", "content":"You are an assistant who helps users find startups to invest in."}]

 from langchain.embeddings.openai import OpenAIEmbeddings
 from langchain.prompts import PromptTemplate
 from langchain.vectorstores import Pinecone
+from streamlit.runtime.state import session_state
 import openai
 import pinecone
 import streamlit as st
     #reader = pipeline(tokenizer=model_name, model=model_name, task='question-answering')
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     #vectorstore = Pinecone(st.session_state.index, embed.embed_query, text_field)
+    st.session_state.openai_client = openai.OpenAI(api_key = OPENAI_API_KEY,organization='org-EEpryZYLlh0mZJOGxVko32qP')
+    # client.beta.assistants.create(
+    #     instructions=utils.assistant_instructions,
+    #     model="gpt-4-1106-preview",
+    #     tools=[{"type": "code_interpreter"}])
     return retriever, tokenizer#, vectorstore
 retriever, tokenizer = init_models()
 #st.session_state.messages = [{"role":"system", "content":"You are an assistant who helps users find startups to invest in."}]

openai_utils.py ADDED Viewed

	@@ -0,0 +1,28 @@

+import time
+import streamlit as st
+def send_message(role, content):
+    message = st.session_state.openai_client.beta.threads.messages.create(
+        thread_id=st.session_state.assistant_thread.id,
+        role=role,
+        content=content
+    )
+def start_conversation():
+    st.session_state.assistant_thread = st.session_state.openai_client.beta.threads.create()
+def run_assistant():
+    run = st.session_state.openai_client.beta.threads.runs.create(
+        thread_id=st.session_state.assistant_thread.id,
+        assistant_id=st.session_state.assistant.id,
+    )
+    while run.status == "queued" or run.status == "in_progress":
+        run = st.session_state.openai_client.beta.threads.runs.retrieve(
+            thread_id=st.session_state.assistant_thread.id,
+            run_id=run.id,
+        )
+        time.sleep(0.5)
+    return run

semsearch.pyproj CHANGED Viewed

@@ -38,6 +38,7 @@
   </ItemGroup>
   <ItemGroup>
     <Compile Include="app.py" />
     <Compile Include="utils.py" />
   </ItemGroup>
   <ItemGroup>

   </ItemGroup>
   <ItemGroup>
     <Compile Include="app.py" />
+    <Compile Include="openai_utils.py" />
     <Compile Include="utils.py" />
   </ItemGroup>
   <ItemGroup>

utils.py CHANGED Viewed

@@ -21,17 +21,18 @@ import openai
 def call_openai(prompt, engine="gpt-3.5-turbo", temp=0, top_p=1.0, max_tokens=4048):
     try:
-        response = openai.ChatCompletion.create(
             model=engine,
             messages=st.session_state.messages,
             temperature=temp,
             max_tokens=max_tokens
         )
         print(f"Open AI response\n {response}")
-        text = response.choices[0].message["content"].strip()
         st.session_state.messages.append({"role": "system", "content": text})
         return text
-    except openai.error.OpenAIError as e:
         print(f"An error occurred: {str(e)}")
     return "Failed to generate a response."
@@ -80,6 +81,29 @@ def get_prompt(title):
     # print(f"Results getting {title}")
     # return res
 # default_prompt = """
 # summarize the outcome of this search. The context is a list of company names followed by the company's description and a relevance score to the user query.
 # the report should mention the most important companies and how they compare to each other and contain the following sections:

 def call_openai(prompt, engine="gpt-3.5-turbo", temp=0, top_p=1.0, max_tokens=4048):
     try:
+        response = st.session_state.openai_client.chat.completions.create(
             model=engine,
             messages=st.session_state.messages,
             temperature=temp,
             max_tokens=max_tokens
         )
         print(f"Open AI response\n {response}")
+        text = response.choices[0].message.content.strip()
         st.session_state.messages.append({"role": "system", "content": text})
         return text
+    except Exception as e:
+    #except openai.error.OpenAIError as e:
         print(f"An error occurred: {str(e)}")
     return "Failed to generate a response."
     # print(f"Results getting {title}")
     # return res
+# Instruction text for the OpenAI assistant. It is referenced as
+# ``utils.assistant_instructions`` by the (currently commented-out)
+# ``assistants.create`` call in app.py. The text is sent verbatim, so edits
+# here change what the assistant is told to do.
+assistant_instructions = """Start like this:
+Please find here a list of startups that match the criteria you gave me (right now make a list up, later we will retrieve the list in a step before this).
+I like you to present a list view with the option to open up a more detailed view per startup including the location of the startup, the founders and the founding year.
+Ask the user to select startups that are of interest for them (just indicate the numbers).
+Also invite users to think of other criteria that could help them qualify the startups further such as
+1) founder and team characteristics:
+- serial entrepreneurs in the team
+- strong tech capabilities in the team
+- female founders or younger / older founders in the team
+- founders who graduated from top 100 universities
+ask the user if they would like to use those criteria for filtering (with the downside of seeing potentially very few startups) or rather apply it for ranking the companies (with the downside that there will be a lot of companies at the bottom of the list that are not a match at all).
+Invite users to name other criteria even if we are currently not able to provide such features. Ideally, they are possible to extract from a company's website or public founder profiles on social media.
+Output a json that specifies the filter criteria important to a user with the output variable.
+Also name the ranking criteria and suggest how to combine them to best meet the user's preferences.
+"""
 # default_prompt = """
 # summarize the outcome of this search. The context is a list of company names followed by the company's description and a relevance score to the user query.
 # the report should mention the most important companies and how they compare to each other and contain the following sections: