Spaces:

pseudotensor
/

open-strawberry

Running

App Files Files Community

pseudotensor committed on Sep 22

Commit

6f2c714

•

1 Parent(s): 046eafc

cerebras and assert

Browse files

Files changed (2) hide show

app.py +6 -4
models.py +56 -8

app.py CHANGED Viewed

@@ -2,11 +2,12 @@ import os
 import streamlit as st
 import time
 try:
-    from src.models import get_all_model_names
     from src.open_strawberry import get_defaults, manage_conversation
 except (ModuleNotFoundError, ImportError):
-    from models import get_all_model_names
     from open_strawberry import get_defaults, manage_conversation
 (model, system_prompt, initial_prompt, expected_answer,
@@ -158,6 +159,7 @@ if 'secrets' not in st.session_state:
                                         GEMINI_API_KEY='',
                                         # MISTRAL_API_KEY='',
                                         GROQ_API_KEY='',
                                         ANTHROPIC_API_KEY='',
                                         )
@@ -166,7 +168,7 @@ if 'secrets' not in st.session_state:
 def update_model_selection():
-    visible_models1 = get_all_model_names(st.session_state.secrets, on_hf_spaces)
     if visible_models1 and "model_name" in st.session_state:
         if st.session_state.model_name not in visible_models1:
             st.session_state.model_name = visible_models1[0]
@@ -177,7 +179,7 @@ if 'model_name' not in st.session_state or not st.session_state.model_name:
     update_model_selection()
 # Model selection
-visible_models = get_all_model_names(st.session_state.secrets, on_hf_spaces)
 st.sidebar.selectbox("Select Model", visible_models, key="model_name",
                      disabled=st.session_state.conversation_started)
 st.sidebar.checkbox("Show Next", value=show_next, key="show_next", disabled=st.session_state.conversation_started)

 import streamlit as st
 import time
 try:
+    from src.models import get_model_names
     from src.open_strawberry import get_defaults, manage_conversation
 except (ModuleNotFoundError, ImportError):
+    from models import get_model_names
     from open_strawberry import get_defaults, manage_conversation
 (model, system_prompt, initial_prompt, expected_answer,
                                         GEMINI_API_KEY='',
                                         # MISTRAL_API_KEY='',
                                         GROQ_API_KEY='',
+                                        CEREBRAS_OPENAI_API_KEY='',
                                         ANTHROPIC_API_KEY='',
                                         )
 def update_model_selection():
+    visible_models1 = get_model_names(st.session_state.secrets, on_hf_spaces)
     if visible_models1 and "model_name" in st.session_state:
         if st.session_state.model_name not in visible_models1:
             st.session_state.model_name = visible_models1[0]
     update_model_selection()
 # Model selection
+visible_models = get_model_names(st.session_state.secrets, on_hf_spaces)
 st.sidebar.selectbox("Select Model", visible_models, key="model_name",
                      disabled=st.session_state.conversation_started)
 st.sidebar.checkbox("Show Next", value=show_next, key="show_next", disabled=st.session_state.conversation_started)

models.py CHANGED Viewed

@@ -349,6 +349,52 @@ def get_groq(model: str,
     yield dict(output_tokens=output_tokens, input_tokens=input_tokens)
 def get_openai_azure(model: str,
                      prompt: str,
                      temperature: float = 0,
@@ -449,6 +495,10 @@ def get_model_names(secrets, on_hf_spaces=False):
                        'mixtral-8x7b-32768']
     else:
         groq_models = []
     if secrets.get('OLLAMA_OPENAI_API_KEY'):
         ollama_model = os.environ['OLLAMA_OPENAI_MODEL_NAME']
         ollama_model = to_list(ollama_model)
@@ -456,22 +506,18 @@ def get_model_names(secrets, on_hf_spaces=False):
         ollama_model = []
     groq_models = ['groq:' + x for x in groq_models]
     azure_models = ['azure:' + x for x in azure_models]
     openai_models = ['openai:' + x for x in openai_models]
     google_models = ['google:' + x for x in google_models]
     anthropic_models = ['anthropic:' + x for x in anthropic_models]
     ollama = ['ollama:' + x if 'ollama:' not in x else x for x in ollama_model]
-    return anthropic_models, openai_models, google_models, groq_models, azure_models, ollama
-def get_all_model_names(secrets, on_hf_spaces=False):
-    anthropic_models, openai_models, google_models, groq_models, azure_models, ollama = get_model_names(secrets,
-                                                                                                        on_hf_spaces=on_hf_spaces)
-    return anthropic_models + openai_models + google_models + groq_models + azure_models + ollama
 def get_model_api(model: str):
     if model.startswith('anthropic:'):
         return get_anthropic
     elif model.startswith('openai:') or model.startswith('ollama:'):
@@ -480,8 +526,10 @@ def get_model_api(model: str):
         return get_google
     elif model.startswith('groq:'):
         return get_groq
     elif model.startswith('azure:'):
         return get_openai_azure
     else:
         raise ValueError(
-            f"Unsupported model: {model}.  Ensure to add prefix (e.g. openai:, google:, groq:, azure:, ollama:, anthropic:)")

     yield dict(output_tokens=output_tokens, input_tokens=input_tokens)
def get_cerebras(model: str,
                 prompt: str,
                 temperature: float = 0,
                 max_tokens: int = 4096,
                 system: str = '',
                 chat_history: List[Dict] = None,
                 secrets: Dict = {},
                 verbose=False) -> Generator[dict, None, None]:
    """Stream a chat completion through the Cerebras SDK client.

    Yields ``dict(text=...)`` for every non-empty content delta received from
    the stream, then one final ``dict(output_tokens=..., input_tokens=...)``
    holding the last usage counts seen on the stream (both 0 if no chunk
    reported usage).

    Args:
        model: Model name; a leading ``'cerebras:'`` prefix is stripped.
        prompt: Text sent as the final ``user`` message.
        temperature: Passed through to the completion call.
        max_tokens: Passed through to the completion call.
        system: Content of the leading ``system`` message.
        chat_history: Messages placed between the system and user messages;
            ``None`` is treated as an empty history. The list is not modified.
        secrets: Mapping read for ``"CEREBRAS_OPENAI_API_KEY"``. Only read
            here, never mutated, so the shared default dict is left as is.
        verbose: When true, print the token counts after the stream ends.
    """
    # Original author's note: context_length is only 8207
    prefix = 'cerebras:'
    # Strip only a leading routing prefix, not occurrences elsewhere in the name.
    if model.startswith(prefix):
        model = model[len(prefix):]

    # Imported at call time, so the module is only needed when this function runs.
    from cerebras.cloud.sdk import Cerebras
    client = Cerebras(api_key=secrets.get("CEREBRAS_OPENAI_API_KEY"))

    # Build a fresh list so the caller's chat_history is never touched.
    messages = [{"role": "system", "content": system}]
    messages.extend(chat_history or [])
    messages.append({"role": "user", "content": prompt})

    stream = openai_completion_with_backoff(client,
                                            messages=messages,
                                            model=model,
                                            temperature=temperature,
                                            max_tokens=max_tokens,
                                            stream=True,
                                            )

    output_tokens = 0
    input_tokens = 0
    for chunk in stream:
        # Guard against chunks with an empty `choices` list (e.g. a chunk that
        # only reports usage); indexing [0] on those would raise IndexError
        # and lose the usage counts read below.
        if chunk.choices:
            text = chunk.choices[0].delta.content
            if text:
                yield dict(text=text)
        usage = getattr(chunk, 'usage', None)
        if usage:
            output_tokens = usage.completion_tokens
            input_tokens = usage.prompt_tokens

    if verbose:
        print(f"Output tokens: {output_tokens}")
        print(f"Input tokens: {input_tokens}")
    yield dict(output_tokens=output_tokens, input_tokens=input_tokens)
 def get_openai_azure(model: str,
                      prompt: str,
                      temperature: float = 0,
                        'mixtral-8x7b-32768']
     else:
         groq_models = []
+    if secrets.get('CEREBRAS_OPENAI_API_KEY'):
+        cerebras_models = ['llama3.1-70b', 'llama3.1-8b']
+    else:
+        cerebras_models = []
     if secrets.get('OLLAMA_OPENAI_API_KEY'):
         ollama_model = os.environ['OLLAMA_OPENAI_MODEL_NAME']
         ollama_model = to_list(ollama_model)
         ollama_model = []
     groq_models = ['groq:' + x for x in groq_models]
+    cerebras_models = ['cerebras:' + x for x in cerebras_models]
     azure_models = ['azure:' + x for x in azure_models]
     openai_models = ['openai:' + x for x in openai_models]
     google_models = ['google:' + x for x in google_models]
     anthropic_models = ['anthropic:' + x for x in anthropic_models]
     ollama = ['ollama:' + x if 'ollama:' not in x else x for x in ollama_model]
+    return anthropic_models + openai_models + google_models + groq_models + cerebras_models + azure_models + ollama
 def get_model_api(model: str):
+    assert model not in ['', None], "Model not set, need to add API key to have models appear and select one."
     if model.startswith('anthropic:'):
         return get_anthropic
     elif model.startswith('openai:') or model.startswith('ollama:'):
         return get_google
     elif model.startswith('groq:'):
         return get_groq
+    elif model.startswith('cerebras:'):
+        return get_cerebras
     elif model.startswith('azure:'):
         return get_openai_azure
     else:
         raise ValueError(
+            f"Unsupported model: {model}.  Ensure to add prefix (e.g. openai:, google:, groq:, cerebras:, azure:, ollama:, anthropic:)")