Kryko7 committed on
Commit
144690a
1 Parent(s): 81d98d1

updated requirements

Browse files
Files changed (2) hide show
  1. app.py +34 -3
  2. requirements.txt +4 -4
app.py CHANGED
@@ -6,6 +6,8 @@ from langchain.document_loaders import GutenbergLoader
6
 
7
 
8
  import langchain
 
 
9
 
10
  from langchain.text_splitter import RecursiveCharacterTextSplitter
11
 
@@ -35,6 +37,21 @@ llm = Replicate(
35
  )
36
 
37
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
38
 
39
  # Function to search for a book by name and return the best match URL
40
  def search_book_by_name(book_name):
@@ -100,8 +117,7 @@ def create_book_embeddings(book_content):
100
  text_splitter = RecursiveCharacterTextSplitter(chunk_size = Configuration.split_chunk_size,
101
  chunk_overlap = Configuration.split_overlap)
102
  texts = text_splitter.split_documents(book_content)
103
- instructor_embeddings = HuggingFaceInstructEmbeddings(model_name = Configuration.embeddings_model_repo,
104
- model_kwargs = {"device": "cuda"})
105
 
106
  vectordb = None
107
  try:
@@ -173,4 +189,19 @@ def generate_answer_from_embeddings(query, book_embeddings):
173
  llm_response = qa_chain(query)
174
  ans = process_llm_response(llm_response)
175
 
176
- return ans
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
 
7
 
8
  import langchain
9
+ from fastapi import FastAPI
10
+
11
 
12
  from langchain.text_splitter import RecursiveCharacterTextSplitter
13
 
 
37
  )
38
 
39
 
40
class Configuration:
    """Central settings for the book Q&A app.

    Groups the LLM sampling parameters, the text-splitting sizes, the
    embeddings model, and the Chroma vector-store locations in one place.
    """

    # LLM identifier and sampling parameters.
    model_name = 'llama2-13b'
    temperature = 0.5
    top_p = 0.95
    repetition_penalty = 1.15

    # Chunking parameters fed to RecursiveCharacterTextSplitter.
    split_chunk_size = 1000
    split_overlap = 100

    # HuggingFace repo of the embeddings model used to vectorize chunks.
    embeddings_model_repo = 'hkunlp/instructor-large'

    # Number of nearest chunks retrieved per query.
    k = 3

    # Vector-store locations; presumably load path vs. persist path —
    # NOTE(review): confirm why one is absolute and one relative.
    Embeddings_path = '/book-vectordb-chroma'
    Persist_directory = './book-vectordb-chroma'
55
 
56
  # Function to search for a book by name and return the best match URL
57
  def search_book_by_name(book_name):
 
117
  text_splitter = RecursiveCharacterTextSplitter(chunk_size = Configuration.split_chunk_size,
118
  chunk_overlap = Configuration.split_overlap)
119
  texts = text_splitter.split_documents(book_content)
120
+
 
121
 
122
  vectordb = None
123
  try:
 
189
  llm_response = qa_chain(query)
190
  ans = process_llm_response(llm_response)
191
 
192
+ return ans
193
+
194
+
195
+
196
+
197
+
198
# Module-level application wiring: the HTTP app, the chat LLM, and the
# embedding model used to vectorize book chunks.
app = FastAPI()

# Hosted Llama-2 70B chat model served through Replicate.
llm = Replicate(
    model="replicate/llama-2-70b-chat:2796ee9483c3fd7aa2e171d38f4ca12251a30609463dcfd4cd76703f22e96cdf",
    input={"temperature": 0.75, "max_length": 500, "top_p": 1},
)

# Instructor embeddings, run locally on CPU (downloads the model on first use).
instructor_embeddings = HuggingFaceInstructEmbeddings(
    model_name=Configuration.embeddings_model_repo,
    model_kwargs={"device": "cpu"},
)
requirements.txt CHANGED
@@ -11,9 +11,9 @@ xformers
11
  einops
12
  replicate
13
  beautifulsoup4
14
- fastapi==0.74.*
15
- requests==2.27.*
16
- uvicorn==0.17.*
17
  sentencepiece
18
- torch==1.11.*
19
 
 
11
  einops
12
  replicate
13
  beautifulsoup4
14
+ fastapi
15
+ requests
16
+ uvicorn
17
  sentencepiece
18
+ torch
19