Spaces:
Sleeping
Sleeping
import streamlit as st | |
import chromadb | |
from chromadb.utils import embedding_functions | |
from sentence_transformers import SentenceTransformer | |
from openai import OpenAI | |
# CONSTANTS | |
client = chromadb.PersistentClient(path="./chromadb_linux/") | |
MODEL_NAME: str = "mixedbread-ai/mxbai-embed-large-v1" # ~ 0.5 gb | |
COLLECTION_NAME: str = "scheme" | |
EMBEDDING_FUNC = embedding_functions.SentenceTransformerEmbeddingFunction( | |
model_name=MODEL_NAME | |
) | |
schemer = client.get_collection( | |
name=COLLECTION_NAME, | |
embedding_function=EMBEDDING_FUNC, | |
) | |
DATA_AVAL: bool = schemer.count() > 0 | |
APP_NAME: str = "Groove-GPT" | |
history = [] | |
# INFO | |
st.title(APP_NAME) | |
st.header("What is Groovy-GPT?") | |
st.write( | |
"Groovy-GPT is a RAG (Retrieval-Augmented Generation) model that uses ChromaDB to retrieve relevant documents and then uses OpenAI's models to generate a response." | |
) | |
st.write( | |
"The model is trained on the MIT Scheme textbook and a handful of Discrete Math and Paradigms related content that Professor Troeger posted" | |
) | |
st.write("Data Avaliable: ", DATA_AVAL) | |
# INPUTS | |
user_question: str = st.text_area("Enter your groovy questions here") | |
remember_chat_history = st.toggle("Remember This Chat's History") | |
temperature = st.slider( | |
label="Creativity of Model", min_value=0.0, max_value=2.0, value=0.8 | |
) | |
st.markdown("*High creativity will make it go crazy - keep it low*") | |
num_samples = st.slider( | |
label="Amount of References to Give to Model", min_value=10, max_value=100, value=10 | |
) | |
st.markdown( | |
"*High amount will make it slow and expensive (and may not be relevant) - keep it low*" | |
) | |
access_key: str = st.text_input("Enter your gpt key here", type="password") | |
st.markdown( | |
"*For more information about how to get an access key, read [this article](https://platform.openai.com/api-keys). Make sure it has money in it ☠️*", | |
unsafe_allow_html=True, | |
) | |
gpt_type: str = st.selectbox( | |
label="Choose GPT Type", | |
options=[ | |
"gpt-3.5-turbo", | |
"gpt-3.5-turbo-1106", | |
"gpt-3.5-turbo-0125", | |
"gpt-4-32k-0613", | |
"gpt-4-0613", | |
"gpt-4-0125-preview", | |
], | |
index=0, | |
) | |
st.markdown( | |
"*For more information about GPT types, read [this article](https://platform.openai.com/docs/models).*", | |
unsafe_allow_html=True, | |
) | |
st.divider() | |
# ON BUTTON CLICK | |
if st.button("Start Scheming") & (access_key != "") & (user_question != ""): | |
openai_client = OpenAI(api_key=access_key) | |
with st.spinner("Loading..."): | |
# Perform the Chromadb query. | |
results = schemer.query( | |
query_texts=[user_question], n_results=num_samples, include=["documents"] | |
) | |
documents = results["documents"] | |
response = openai_client.chat.completions.create( | |
model="gpt-3.5-turbo", | |
messages=[ | |
{ | |
"role": "system", | |
"content": "You are an expert in functional programming in R5RS, with great knowledge on programming paradigms. You wish to teach the user everything you know about programming paradigms in R5RS - so you explain everything thoroughly. Surround Latex equations in dollar signs as such Inline equation: $equation$ & Display equation: $$equation$$. You will focus your examples to work exclusively in interative and recursive apporaches", | |
}, | |
{"role": "user", "content": user_question}, | |
{"role": "assistant", "content": str(documents)}, | |
{"role": "user", "content": f"Conversation History: {history}"}, | |
], | |
temperature=temperature, | |
stream=True, | |
) | |
# history.append({user_question : response.choices[0].message.content} if remember_chat_history else {}) | |
st.header("The Mega Schemer Says ...") | |
text_placeholder = st.empty() | |
content = "" | |
for i, chunk in enumerate(response): | |
if chunk.choices[0].delta.content is not None: | |
# Append the chunk content to the string | |
content += chunk.choices[0].delta.content | |
text_placeholder.markdown(content) | |
else: | |
st.write("Please provide an input and (valid) API key") | |