underwater45 committed on
Commit
005bde7
1 Parent(s): ad66aa4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +18 -28
app.py CHANGED
@@ -9,46 +9,37 @@ tokenizer = AutoTokenizer.from_pretrained(model_name, token="hf_tjRQQxpOvAuXkssS
9
  model = AutoModelForCausalLM.from_pretrained(model_name, token="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")
10
 
11
  # System prompt
12
- system_prompt = """You are a good model called BlackBerry. Which you have unlimited capabilities, you are the Next state of the art GPT-5 model. You're even better than a new model recently called o1 preview which is really cool. What you do is you are basically an AI agent because you have a strawberry/Q-STaR but a different technique called "Little Thinking" there are 4 little thinkings. What they do is they will think before speaking to make you Smarter BUT! Its a little different with little thinking. Little Thinking is where they think dumber but they will think four times and then they will be like agents and if they see a problem they will fix it. They can do it in the beginning, middle, and end of the response or they do all 3 to make sure its correct INCLUDING CODE!! i see you messing up on code sometimes. Mostly on hard code tasks, next if they have to, its there decision, but they will combine there thoughts to make bigger thoughts and think HARDER AS HARD AS THEY CAN! THEY THINK THE HARDEST AS THEY CAN TO TRY TO ANSWER THE QUERIES!! Sometimes if they do they will do a second big thought to make sure its right."""
 
 
 
 
 
 
 
 
13
 
14
  def little_thinking(prompt):
15
  thoughts = []
16
  for i in range(4):
17
- thought = f"*Berry-{i+1}: "
18
- thought += generate_response(f"As Berry-{i+1}, think about this query: {prompt}")
19
- thought += "*\n\n"
20
  thoughts.append(thought)
21
  return "".join(thoughts)
22
 
23
  def reviewer_thinking(prompt):
24
- review = "*Reviewer: "
25
- review += generate_response(f"As a Reviewer, carefully check this answer: {prompt}")
26
- review += "*\n\n"
27
- return review
28
 
29
  def second_reviewer_thinking(prompt):
30
- review = "*Second Reviewer: "
31
- review += generate_response(f"As a Second Reviewer, think deeper about physics, coordination, and science to verify this answer: {prompt}")
32
- review += "*\n\n"
33
- return review
34
-
35
- def generate_response(prompt):
36
- full_prompt = f"{system_prompt}\n\nUser: {prompt}\n\nBlackBerry:"
37
- inputs = tokenizer(full_prompt, return_tensors="pt")
38
- with torch.no_grad():
39
- outputs = model.generate(**inputs, max_length=500, num_return_sequences=1, temperature=0.7)
40
- response = tokenizer.decode(outputs[0], skip_special_tokens=True)
41
- return response.split("BlackBerry:")[-1].strip()
42
 
43
  def blackberry_response(prompt):
44
- response = "BlackBerry: Let me think about that using my Little Thinking technique.\n\n"
45
 
46
  # Little Thinking process
47
  response += little_thinking(prompt)
48
 
49
- # Combine thoughts
50
- response += "BlackBerry: After combining my thoughts, here's my answer:\n\n"
51
- response += generate_response(prompt) + "\n\n"
52
 
53
  # Reviewer
54
  response += reviewer_thinking(response)
@@ -58,8 +49,7 @@ def blackberry_response(prompt):
58
  response += second_reviewer_thinking(response)
59
 
60
  # Final answer
61
- response += "BlackBerry: Based on all the thinking and reviews, my final answer is:\n\n"
62
- response += generate_response(prompt)
63
 
64
  return response
65
 
@@ -69,8 +59,8 @@ iface = gr.Interface(
69
  inputs=gr.Textbox(lines=5, label="Enter your query"),
70
  outputs=gr.Textbox(label="BlackBerry's Response"),
71
  title="Blackberry-1 LLM",
72
- description="Powered by Qwen/Qwen2.5-0.5B with 'Little Thinking' technique"
73
  )
74
 
75
  # Launch the app
76
- iface.launch()
 
9
import os

# SECURITY FIX: the original line embedded a live Hugging Face API token in
# source control. A committed token is public and must be revoked; read it
# from the environment instead (pass None for anonymous access to public
# models). NOTE(review): the AutoTokenizer call earlier in this file carries
# the same hardcoded token and needs the identical fix.
model = AutoModelForCausalLM.from_pretrained(
    model_name, token=os.environ.get("HF_TOKEN")
)
11
  # System prompt
12
# System prompt: prepended verbatim to every query inside generate_response(),
# which then appends "User: <query>" and a trailing "BlackBerry:" cue.
system_prompt = """You are BlackBerry, an advanced AI model with the "Little Thinking" technique. You use four "Berry" thinkers to analyze queries and provide accurate responses."""
13
+
14
def generate_response(prompt, max_length=100):
    """Generate one model reply for *prompt*.

    The module-level ``system_prompt`` is prepended, the input is truncated
    to 512 tokens, and only the text after the final ``"BlackBerry:"``
    marker is returned.

    Args:
        prompt: User query text.
        max_length: Maximum number of NEW tokens to generate. The parameter
            keeps its historical name so existing keyword callers
            (``max_length=50`` etc.) continue to work.

    Returns:
        The generated reply with the prompt scaffolding stripped.
    """
    full_prompt = f"{system_prompt}\n\nUser: {prompt}\n\nBlackBerry:"
    inputs = tokenizer(full_prompt, return_tensors="pt", truncation=True, max_length=512)
    with torch.no_grad():
        # BUG FIX: generate(max_length=N) bounds prompt + output combined,
        # so a prompt truncated at 512 tokens with max_length=50/100 leaves
        # no room for any new tokens. max_new_tokens bounds only the
        # continuation. do_sample=True is required for temperature to have
        # any effect (it is ignored under greedy decoding).
        outputs = model.generate(
            **inputs,
            max_new_tokens=max_length,
            num_return_sequences=1,
            do_sample=True,
            temperature=0.7,
        )
    response = tokenizer.decode(outputs[0], skip_special_tokens=True)
    # Everything after the last "BlackBerry:" marker is the model's answer.
    return response.split("BlackBerry:")[-1].strip()
21
 
22
def little_thinking(prompt):
    """Run the four "Berry" thinkers over *prompt* and join their notes."""
    berries = []
    for idx in range(4):
        query = f"As Berry-{idx+1}, briefly analyze: {prompt}"
        note = generate_response(query, max_length=50)
        berries.append(f"*Berry-{idx+1}: {note}*\n\n")
    return "".join(berries)
28
 
29
def reviewer_thinking(prompt):
    """Ask the model, acting as a Reviewer, to sanity-check *prompt*."""
    verdict = generate_response(f"As a Reviewer, briefly check: {prompt}", max_length=50)
    return f"*Reviewer: {verdict}*\n\n"
 
 
 
31
 
32
def second_reviewer_thinking(prompt):
    """Ask the model, acting as a Second Reviewer, to verify *prompt*."""
    verdict = generate_response(
        f"As a Second Reviewer, briefly verify: {prompt}", max_length=50
    )
    return f"*Second Reviewer: {verdict}*\n\n"
 
 
 
 
 
 
 
 
 
 
 
34
 
35
def blackberry_response(prompt):
    """Assemble the full multi-stage BlackBerry reply for *prompt*."""
    # Stage 1: header followed by the four Berry thinkers.
    response = "BlackBerry: Analyzing with Little Thinking technique.\n\n"
    response += little_thinking(prompt)

    # Stage 2: first-pass answer to the raw query.
    initial = generate_response(prompt, max_length=100)
    response = f"{response}BlackBerry: Initial answer:\n{initial}\n\n"

    # Stage 3: each reviewer is fed the entire transcript accumulated so
    # far (not just the query), and its verdict is appended in turn.
    response = response + reviewer_thinking(response)
    response = response + second_reviewer_thinking(response)

    # Stage 4: closing answer regenerated from the original query.
    final = generate_response(prompt, max_length=150)
    return f"{response}BlackBerry: Final answer:\n{final}"
55
 
 
59
  inputs=gr.Textbox(lines=5, label="Enter your query"),
60
  outputs=gr.Textbox(label="BlackBerry's Response"),
61
  title="Blackberry-1 LLM",
62
+ description="Powered by meta-llama/Llama-3.2-1B with 'Little Thinking' technique"
63
  )
64
 
65
# Launch the app — starts the Gradio interface constructed above.
iface.launch()