Spaces:

pseudotensor
/

open-strawberry

Running

App Files Community

pseudotensor committed on Sep 22, 2024

Commit

046eafc

1 Parent(s): 56980e9

fix secrets handling

Browse files

Files changed (4) hide show

app.py +4 -0
cli.py +2 -0
models.py +21 -17
open_strawberry.py +5 -2

app.py CHANGED Viewed

@@ -50,6 +50,8 @@ if "verbose" not in st.session_state:
     st.session_state.verbose = verbose
 if "max_tokens" not in st.session_state:
     st.session_state.max_tokens = max_tokens
 if "temperature" not in st.session_state:
     st.session_state.temperature = temperature
 if "next_prompts" not in st.session_state:
@@ -272,6 +274,8 @@ try:
                 num_turns=st.session_state.num_turns,
                 temperature=st.session_state.temperature,
                 max_tokens=st.session_state.max_tokens,
                 verbose=st.session_state.verbose,
             )
         chunk = next(st.session_state.generator)

     st.session_state.verbose = verbose
 if "max_tokens" not in st.session_state:
     st.session_state.max_tokens = max_tokens
+if "seed" not in st.session_state:
+    st.session_state.seed = 0
 if "temperature" not in st.session_state:
     st.session_state.temperature = temperature
 if "next_prompts" not in st.session_state:
                 num_turns=st.session_state.num_turns,
                 temperature=st.session_state.temperature,
                 max_tokens=st.session_state.max_tokens,
+                seed=st.session_state.seed,
+                secrets=st.session_state.secrets,
                 verbose=st.session_state.verbose,
             )
         chunk = next(st.session_state.generator)

cli.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import argparse
 import time
 from src.open_strawberry import get_defaults, manage_conversation
@@ -54,6 +55,7 @@ def go_cli():
                                     temperature=args.temperature,
                                     max_tokens=args.max_tokens,
                                     seed=args.seed,
                                     cli_mode=True)
     response = ''
     conversation_history = []

 import argparse
+import os
 import time
 from src.open_strawberry import get_defaults, manage_conversation
                                     temperature=args.temperature,
                                     max_tokens=args.max_tokens,
                                     seed=args.seed,
+                                    secrets=dict(os.environ),
                                     cli_mode=True)
     response = ''
     conversation_history = []

models.py CHANGED Viewed

@@ -25,6 +25,7 @@ def get_anthropic(model: str,
                   max_tokens: int = 4096,
                   system: str = '',
                   chat_history: List[Dict] = None,
                   verbose=False) -> \
         Generator[dict, None, None]:
     model = model.replace('anthropic:', '')
@@ -32,7 +33,7 @@ def get_anthropic(model: str,
     # https://docs.anthropic.com/en/docs/build-with-claude/prompt-caching
     import anthropic
-    clawd_key = os.getenv('ANTHROPIC_API_KEY')
     clawd_client = anthropic.Anthropic(api_key=clawd_key) if clawd_key else None
     if chat_history is None:
@@ -118,16 +119,16 @@ def get_openai(model: str,
                max_tokens: int = 4096,
                system: str = '',
                chat_history: List[Dict] = None,
                verbose=False) -> Generator[dict, None, None]:
-    anthropic_models, openai_models, google_models, groq_models, azure_models, ollama = get_model_names()
-    if model in ollama:
         model = model.replace('ollama:', '')
-        openai_key = os.getenv('OLLAMA_OPENAI_API_KEY')
-        openai_base_url = os.getenv('OLLAMA_OPENAI_BASE_URL', 'http://localhost:11434/v1/')
     else:
         model = model.replace('openai:', '')
-        openai_key = os.getenv('OPENAI_API_KEY')
-        openai_base_url = os.getenv('OPENAI_BASE_URL', 'https://api.openai.com/v1')
     from openai import OpenAI
@@ -206,12 +207,13 @@ def get_google(model: str,
                max_tokens: int = 4096,
                system: str = '',
                chat_history: List[Dict] = None,
                verbose=False) -> Generator[dict, None, None]:
     model = model.replace('google:', '').replace('gemini:', '')
     import google.generativeai as genai
-    gemini_key = os.getenv("GEMINI_API_KEY")
     genai.configure(api_key=gemini_key)
     # Create the model
     generation_config = {
@@ -308,12 +310,13 @@ def get_groq(model: str,
              max_tokens: int = 4096,
              system: str = '',
              chat_history: List[Dict] = None,
              verbose=False) -> Generator[dict, None, None]:
     model = model.replace('groq:', '')
     from groq import Groq
-    groq_key = os.getenv("GROQ_API_KEY")
     client = Groq(api_key=groq_key)
     if chat_history is None:
@@ -352,15 +355,16 @@ def get_openai_azure(model: str,
                      max_tokens: int = 4096,
                      system: str = '',
                      chat_history: List[Dict] = None,
                      verbose=False) -> Generator[dict, None, None]:
     model = model.replace('azure:', '').replace('openai_azure:', '')
     from openai import AzureOpenAI
-    azure_endpoint = os.getenv("AZURE_OPENAI_ENDPOINT")  # e.g. https://project.openai.azure.com
-    azure_key = os.getenv("AZURE_OPENAI_API_KEY")
-    azure_deployment = os.getenv("AZURE_OPENAI_DEPLOYMENT")  # i.e. deployment name with some models deployed
-    azure_api_version = os.getenv('AZURE_OPENAI_API_VERSION', '2024-07-01-preview')
     assert azure_endpoint is not None, "Azure OpenAI endpoint not set"
     assert azure_key is not None, "Azure OpenAI API key not set"
     assert azure_deployment is not None, "Azure OpenAI deployment not set"
@@ -420,15 +424,15 @@ def get_model_names(secrets, on_hf_spaces=False):
     else:
         anthropic_models = []
     if secrets.get('OPENAI_API_KEY'):
-        if os.getenv('OPENAI_MODEL_NAME'):
-            openai_models = to_list(os.getenv('OPENAI_MODEL_NAME'))
         else:
             openai_models = ['gpt-4o', 'gpt-4-turbo-2024-04-09', 'gpt-4o-mini']
     else:
         openai_models = []
     if secrets.get('AZURE_OPENAI_API_KEY'):
-        if os.getenv('AZURE_OPENAI_MODEL_NAME'):
-            azure_models = to_list(os.getenv('AZURE_OPENAI_MODEL_NAME'))
         else:
             azure_models = ['gpt-4o', 'gpt-4-turbo-2024-04-09', 'gpt-4o-mini']
     else:

                   max_tokens: int = 4096,
                   system: str = '',
                   chat_history: List[Dict] = None,
+                  secrets: Dict = {},
                   verbose=False) -> \
         Generator[dict, None, None]:
     model = model.replace('anthropic:', '')
     # https://docs.anthropic.com/en/docs/build-with-claude/prompt-caching
     import anthropic
+    clawd_key = secrets.get('ANTHROPIC_API_KEY')
     clawd_client = anthropic.Anthropic(api_key=clawd_key) if clawd_key else None
     if chat_history is None:
                max_tokens: int = 4096,
                system: str = '',
                chat_history: List[Dict] = None,
+               secrets: Dict = {},
                verbose=False) -> Generator[dict, None, None]:
+    if model.startswith('ollama:'):
         model = model.replace('ollama:', '')
+        openai_key = secrets.get('OLLAMA_OPENAI_API_KEY')
+        openai_base_url = secrets.get('OLLAMA_OPENAI_BASE_URL', 'http://localhost:11434/v1/')
     else:
         model = model.replace('openai:', '')
+        openai_key = secrets.get('OPENAI_API_KEY')
+        openai_base_url = secrets.get('OPENAI_BASE_URL', 'https://api.openai.com/v1')
     from openai import OpenAI
                max_tokens: int = 4096,
                system: str = '',
                chat_history: List[Dict] = None,
+               secrets: Dict = {},
                verbose=False) -> Generator[dict, None, None]:
     model = model.replace('google:', '').replace('gemini:', '')
     import google.generativeai as genai
+    gemini_key = secrets.get("GEMINI_API_KEY")
     genai.configure(api_key=gemini_key)
     # Create the model
     generation_config = {
              max_tokens: int = 4096,
              system: str = '',
              chat_history: List[Dict] = None,
+             secrets: Dict = {},
              verbose=False) -> Generator[dict, None, None]:
     model = model.replace('groq:', '')
     from groq import Groq
+    groq_key = secrets.get("GROQ_API_KEY")
     client = Groq(api_key=groq_key)
     if chat_history is None:
                      max_tokens: int = 4096,
                      system: str = '',
                      chat_history: List[Dict] = None,
+                     secrets: Dict = {},
                      verbose=False) -> Generator[dict, None, None]:
     model = model.replace('azure:', '').replace('openai_azure:', '')
     from openai import AzureOpenAI
+    azure_endpoint = secrets.get("AZURE_OPENAI_ENDPOINT")  # e.g. https://project.openai.azure.com
+    azure_key = secrets.get("AZURE_OPENAI_API_KEY")
+    azure_deployment = secrets.get("AZURE_OPENAI_DEPLOYMENT")  # i.e. deployment name with some models deployed
+    azure_api_version = secrets.get('AZURE_OPENAI_API_VERSION', '2024-07-01-preview')
     assert azure_endpoint is not None, "Azure OpenAI endpoint not set"
     assert azure_key is not None, "Azure OpenAI API key not set"
     assert azure_deployment is not None, "Azure OpenAI deployment not set"
     else:
         anthropic_models = []
     if secrets.get('OPENAI_API_KEY'):
+        if secrets.get('OPENAI_MODEL_NAME'):
+            openai_models = to_list(secrets.get('OPENAI_MODEL_NAME'))
         else:
             openai_models = ['gpt-4o', 'gpt-4-turbo-2024-04-09', 'gpt-4o-mini']
     else:
         openai_models = []
     if secrets.get('AZURE_OPENAI_API_KEY'):
+        if secrets.get('AZURE_OPENAI_MODEL_NAME'):
+            azure_models = to_list(secrets.get('AZURE_OPENAI_MODEL_NAME'))
         else:
             azure_models = ['gpt-4o', 'gpt-4-turbo-2024-04-09', 'gpt-4o-mini']
     else:

open_strawberry.py CHANGED Viewed

@@ -290,7 +290,8 @@ def manage_conversation(model: str,
                         temperature: float = 0.3,
                         max_tokens: int = 4096,
                         seed: int = 1234,
-                        verbose: bool = False
                         ) -> Generator[Dict, None, list]:
     if seed == 0:
         seed = random.randint(0, 1000000)
@@ -344,7 +345,9 @@ def manage_conversation(model: str,
         thinking_time = time.time()
         response_text = ''
         for chunk in get_model_func(model, prompt, system=system, chat_history=chat_history,
-                                    temperature=temperature, max_tokens=max_tokens, verbose=verbose):
             if 'text' in chunk and chunk['text']:
                 response_text += chunk['text']
                 yield {"role": "assistant", "content": chunk['text'], "streaming": True, "chat_history": chat_history,

                         temperature: float = 0.3,
                         max_tokens: int = 4096,
                         seed: int = 1234,
+                        secrets: Dict = {},
+                        verbose: bool = False,
                         ) -> Generator[Dict, None, list]:
     if seed == 0:
         seed = random.randint(0, 1000000)
         thinking_time = time.time()
         response_text = ''
         for chunk in get_model_func(model, prompt, system=system, chat_history=chat_history,
+                                    temperature=temperature, max_tokens=max_tokens,
+                                    secrets=secrets,
+                                    verbose=verbose):
             if 'text' in chunk and chunk['text']:
                 response_text += chunk['text']
                 yield {"role": "assistant", "content": chunk['text'], "streaming": True, "chat_history": chat_history,