drakosfire committed
Commit 9bade29
1 Parent(s): c21541c

Basic Logging, timestamp, simple token estimate, source files

Files changed (2)
  1. SRD_embeddings.csv +2 -2
  2. app.py +54 -12
SRD_embeddings.csv CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1315c8fc5255c125c06b6c9e3ec4c84df91fd60e03596a363e6d7491df8171ba
-size 46149879
+oid sha256:0ffdfe9de524d440d57d359270fe8a774009188b528946a79a55f8dd7294e5fe
+size 51272010
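
Since SRD_embeddings.csv is tracked with Git LFS, only the pointer's oid and size change when the embeddings file is regenerated. A quick integrity check for a local copy, as a sketch using only the Python standard library (assumes LFS has already materialized the real file at the path below):

import hashlib

# Hash the checked-out CSV and compare against the pointer for this commit.
with open("./SRD_embeddings.csv", "rb") as f:
    data = f.read()
print("size:", len(data))                         # expected: 51272010
print("oid :", hashlib.sha256(data).hexdigest())  # expected: 0ffdfe9de524d440d57d359270fe8a774009188b528946a79a55f8dd7294e5fe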
app.py CHANGED
@@ -5,6 +5,7 @@ from sentence_transformers import util, SentenceTransformer
 import torch
 import time
 from time import perf_counter as timer
+from datetime import datetime
 import textwrap
 import json
 import textwrap
@@ -15,10 +16,7 @@ print("Launching")
 
 client = OpenAI()
 
-# Define helper function to print wrapped text
-def print_wrapped(text, wrap_length=80):
-    wrapped_text = textwrap.fill(text, wrap_length)
-    print(wrapped_text)
+
 
 # Import saved file and view
 embeddings_df_save_path = "./SRD_embeddings.csv"
@@ -39,6 +37,28 @@ pages_and_chunks = text_chunks_and_embedding_df_load.to_dict(orient="records")
 # Convert embeddings to torch tensor and send to device (note: NumPy arrays are float64, torch tensors are float32 by default)
 embeddings = torch.tensor(np.array(text_chunks_and_embedding_df_load["embedding"].tolist()), dtype=torch.float32).to('cpu')
 
+# Define helper function to print wrapped text
+def print_wrapped(text, wrap_length=80):
+    wrapped_text = textwrap.fill(text, wrap_length)
+    print(wrapped_text)
+
+def hybrid_estimate_tokens(text: str) -> float:
+    # Part 1: Estimate based on spaces and punctuation
+    estimated_words = text.count(' ') + 1  # Counting words by spaces
+    punctuation_count = sum(1 for char in text if char in ',.!?;:')  # Counting punctuation as potential separate tokens
+    estimate1 = estimated_words + punctuation_count
+
+    # Part 2: Estimate based on total characters divided by average token length
+    average_token_length = 4
+    total_characters = len(text)
+    estimate2 = (total_characters // average_token_length) + punctuation_count
+
+    # Average the two estimates
+    estimated_tokens = (estimate1 + estimate2) / 2
+
+    return estimated_tokens
+
+
 def retrieve_relevant_resources(query: str,
                                 embeddings: torch.tensor,
                                 model: SentenceTransformer=embedding_model,
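
To see what the new hybrid_estimate_tokens heuristic produces, here is the arithmetic traced on a short query (a worked example, not part of the commit):

text = "How does grappling work?"
# estimate1: 3 spaces + 1 = 4 words, plus 1 punctuation character ('?') = 5
# estimate2: 24 characters // 4 = 6, plus 1 punctuation character = 7
# average: (5 + 7) / 2 = 6.0
print(hybrid_estimate_tokens(text))  # 6.0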
@@ -84,18 +104,23 @@ def print_top_results_and_scores(query: str,
     # Loop through zipped-together scores and indices
     for score, index in zip(scores, indices):
         print(f"Score: {score:.4f}")
+        print(f"Token Count : {pages_and_chunks[index]['chunk_token_count']}")
         # Print relevant sentence chunk (since the scores are in descending order, the most relevant chunk will be first)
         print_wrapped(pages_and_chunks[index]["sentence_chunk"])
         # Print the page number too so we can reference the textbook further and check the results
         print(f"File of Origin: {pages_and_chunks[index]['file_path']}")
         print("\n")
 
+    return scores, indices
+
 def prompt_formatter(query: str,
                      context_items: list[dict]) -> str:
-    """
-    Augments query with text-based context from context_items.
-    """
     # Join context items into one dotted paragraph
+    # print(context_items[0])
+
+    # Alternate print method
+    # print("\n".join([item["file_path"] + "\n" + str(item['chunk_token_count']) + "\n" + item["sentence_chunk"] for item in context_items]))
+
     context = "- " + "\n- ".join([item["sentence_chunk"] for item in context_items])
 
     # Create a base prompt with examples to help the model
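
With the added return statement, print_top_results_and_scores now doubles as the retrieval call: it logs each hit and hands scores and indices back to the caller. Its underlying helper retrieve_relevant_resources is not shown in this diff; for this kind of sentence-transformers setup it is typically implemented along these lines (a sketch under that assumption; the name retrieve_relevant_resources_sketch and the parameter n_resources_to_return are illustrative):

import torch
from sentence_transformers import util

def retrieve_relevant_resources_sketch(query, embeddings, model, n_resources_to_return=5):
    # Embed the query, dot-product it against every chunk embedding, keep the top k.
    query_embedding = model.encode(query, convert_to_tensor=True)
    dot_scores = util.dot_score(query_embedding, embeddings)[0]
    scores, indices = torch.topk(dot_scores, k=n_resources_to_return)
    return scores, indices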
@@ -139,23 +164,36 @@ Use the context provided to answer the user's query concisely. """
 
 
 with gr.Blocks() as RulesLawyer:
+
+    message_state = gr.State()
+    chatbot_state = gr.State([])
     chatbot = gr.Chatbot()
     msg = gr.Textbox()
     clear = gr.ClearButton([msg, chatbot])
 
+    def store_message(message):
+
+        return message
+
+
     def respond(message, chat_history):
+        print(datetime.now())
+        print(f"User Input : {message}")
+        print(f"Chat History: {chat_history}")
+        print(f"""Token Estimate: {hybrid_estimate_tokens(f"{message} {chat_history}")}""")
 
         # Get relevant resources
-        scores, indices = retrieve_relevant_resources(query=message,
+        scores, indices = print_top_results_and_scores(query=message,
                                                        embeddings=embeddings)
-
+
         # Create a list of context items
        context_items = [pages_and_chunks[i] for i in indices]
+
 
         # Format prompt with context items
-        prompt = prompt_formatter(query=message,
+        prompt = prompt_formatter(query=f"Chat History : {chat_history} + {message}",
                                   context_items=context_items)
-        print(prompt)
+
         bot_message = client.chat.completions.create(
             model="gpt-4",
             messages=[
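
The store_message handler mirrors the live textbox and chatbot values into gr.State holders (the wiring appears at the end of the file), so respond reads from those states rather than from the components directly. A minimal standalone sketch of that round-trip pattern (hypothetical demo, not from the commit):

import gradio as gr

with gr.Blocks() as demo:
    msg_state = gr.State()                       # mirrors the textbox between events
    box = gr.Textbox()
    chat = gr.Chatbot()

    def store(value):
        return value                             # copy the component value into state

    def reply(message, history):
        history = (history or []) + [(message, f"echo: {message}")]
        return "", history

    box.change(store, [box], [msg_state])        # sync state on every edit
    box.submit(reply, [msg_state, chat], [box, chat])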
@@ -171,9 +209,13 @@ with gr.Blocks() as RulesLawyer:
             presence_penalty=0
         )
         chat_history.append((message, bot_message.choices[0].message.content))
+        print(f"Response : {bot_message.choices[0].message.content}")
+
         time.sleep(2)
         return "", chat_history
-    msg.submit(respond, [msg, chatbot], [msg, chatbot])
+    msg.change(store_message, inputs = [msg], outputs = [message_state])
+    chatbot.change(store_message, [chatbot], [chatbot_state])
+    msg.submit(respond, [message_state, chatbot_state], [msg, chatbot])
 
 if __name__ == "__main__":
     RulesLawyer.launch()
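
hybrid_estimate_tokens is only a heuristic, so the logged token estimate can drift from what GPT-4 actually counts. When exact numbers matter, it can be cross-checked against the model's real tokenizer, e.g. with tiktoken (a sketch assuming tiktoken is installed):

import tiktoken

enc = tiktoken.encoding_for_model("gpt-4")

def exact_token_count(text: str) -> int:
    # Count tokens with the same BPE encoding GPT-4 uses.
    return len(enc.encode(text))

print(exact_token_count("How does grappling work?"))  # exact count to compare with the estimate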
 