Spaces:
Runtime error
Runtime error
File size: 3,900 Bytes
228c64d 506ffe2 228c64d 777d688 228c64d ff2dfa9 228c64d 777d688 228c64d 777d688 db92ed0 777d688 506ffe2 a79caca 228c64d 506ffe2 777d688 506ffe2 228c64d 4568132 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 |
from __future__ import annotations
from typing import Iterable
import gradio as Gradio
from gradio.themes.utils import colors, fonts, sizes
from gradio.themes import Base
from llama_cpp import Llama
from huggingface_hub import hf_hub_download
# Hugging Face repository and file name of the GGUF model served by this app.
MODEL_REPO = "TheBloke/dolphin-2_6-phi-2-GGUF"
MODEL_FILE = "dolphin-2_6-phi-2.Q5_K_S.gguf"

# Place the model file in the current working directory (local_dir=".").
hf_hub_download(repo_id=MODEL_REPO, filename=MODEL_FILE, local_dir=".")

# Load the file fetched above with a 1024-token context window.
llm = Llama(model_path=f"./{MODEL_FILE}", n_ctx=1024)

# Prompt template: the user's text replaces {question} via str.format, and the
# template ends right after the assistant marker so the model writes the reply.
ins = (
    "<|im_start|>user\n"
    "{question}<|im_end|>\n"
    "<|im_start|>assistant\n"
)
# Default font stacks for BlueTheme: a Google font first, then generic fallbacks.
_BLUE_THEME_FONT = (
    fonts.GoogleFont("Space Grotesk"),
    "ui-sans-serif",
    "sans-serif",
)
_BLUE_THEME_FONT_MONO = (
    fonts.GoogleFont("Space Mono"),
    "ui-monospace",
    "monospace",
)


class BlueTheme(Gradio.themes.Soft):
    """Variant of Gradio's ``Soft`` theme with gradient primary buttons.

    Every constructor argument is keyword-only and is forwarded unchanged to
    ``Soft.__init__``; the defaults select purple/blue/neutral hues, medium
    spacing and radius, and the "Space Grotesk" / "Space Mono" font stacks.
    After the base theme is initialised, a fixed set of button, block and
    input style variables is overridden through ``set``.
    """

    def __init__(
        self,
        *,
        primary_hue: colors.Color | str = colors.purple,
        secondary_hue: colors.Color | str = colors.blue,
        neutral_hue: colors.Color | str = colors.neutral,
        spacing_size: sizes.Size | str = sizes.spacing_md,
        radius_size: sizes.Size | str = sizes.radius_md,
        font: fonts.Font | str | Iterable[fonts.Font | str] = _BLUE_THEME_FONT,
        font_mono: fonts.Font | str | Iterable[fonts.Font | str] = _BLUE_THEME_FONT_MONO,
    ):
        # Palette, sizing and fonts are handled entirely by the parent theme.
        base_options = {
            "primary_hue": primary_hue,
            "secondary_hue": secondary_hue,
            "neutral_hue": neutral_hue,
            "spacing_size": spacing_size,
            "radius_size": radius_size,
            "font": font,
            "font_mono": font_mono,
        }
        super().__init__(**base_options)

        # Style variables overridden on top of the parent theme; values that
        # start with "*" refer to other theme variables.
        overrides = {
            "button_primary_background_fill": "linear-gradient(90deg, *primary_300, *secondary_400)",
            "button_primary_background_fill_hover": "linear-gradient(90deg, *primary_200, *secondary_300)",
            "button_primary_text_color": "white",
            "button_primary_background_fill_dark": "linear-gradient(90deg, *primary_600, *secondary_800)",
            "block_shadow": "*shadow_drop_lg",
            "button_shadow": "*shadow_drop_lg",
            "input_background_fill": "zinc",
            "input_border_color": "*secondary_300",
            "input_shadow": "*shadow_drop",
            "input_shadow_focus": "*shadow_drop_lg",
        }
        super().set(**overrides)
# Theme instance built with BlueTheme's default arguments; handed to Gradio.Blocks as `theme`.
custom_theme = BlueTheme()
def generate(instruction: str) -> Iterable[str]:
    """Stream the model's answer to ``instruction``.

    The text is substituted into the module-level ``ins`` prompt template and
    sent to ``llm`` in streaming mode. After each streamed chunk the response
    accumulated so far is yielded, so a consumer can display the answer as it
    grows.

    Args:
        instruction: The user's question; inserted for ``{question}`` in the
            prompt template.

    Yields:
        The cumulative response text after each streamed chunk. Nothing is
        yielded if the model produces no chunks.
    """
    prompt = ins.format(question=instruction)
    stream = llm.create_completion(
        prompt,
        stream=True,
        # llama-cpp-python's create_completion defaults to max_tokens=16,
        # which cuts answers off after a few words. A non-positive value lets
        # generation continue until a stop sequence is produced or the
        # context window is exhausted.
        max_tokens=-1,
        stop=['<|im_start|>user', '<|im_end|>'],
        repeat_penalty=1.1,
    )
    result = ""
    for chunk in stream:
        result += chunk['choices'][0]['text']
        yield result
# Sample questions shown in the UI's examples widget.
examples = [
    "How do dogs bark?",
    "Why are apples red?",
    "How do I make a campfire?",
    "Why do cats love to chirp at something?",
]
def process_example(args: str) -> str:
    """Run ``generate`` to completion and return only the final text.

    Args:
        args: The prompt text, passed straight through to ``generate``.

    Returns:
        The last value yielded by ``generate(args)``, or an empty string when
        the generator yields nothing.
    """
    # Start from "" so an empty stream returns a value instead of raising
    # UnboundLocalError on a loop variable that was never assigned.
    final_text = ""
    for final_text in generate(args):
        pass
    return final_text
# Custom CSS: hide any element carrying the `generating` class
# (presumably Gradio's in-progress indicator - confirm against the Gradio version in use).
css = ".generating {visibility: hidden}"

# NOTE(review): the original indentation was lost, so the nesting of the layout
# containers below is a reconstruction - confirm it matches the intended layout.
with Gradio.Blocks(theme=custom_theme, analytics_enabled=False, css=css) as demo:
    with Gradio.Column():
        Gradio.Markdown(
            """ # 𓄿 [Corvus] Dolphin-2.6 (Phi-2)
Type in the box below and click the button to generate answers to your most pressing questions!
""")
        with Gradio.Tabs():
            with Gradio.Tab(label="Prompt"):
                usr_prompt = Gradio.components.Textbox(
                    placeholder="Why do cats meow?",
                    label="Prompt",
                    info="What things do you want to ask the chat assistant?",
                )
            # These sliders are displayed but are not passed to `generate`
            # (the click handler below only receives `usr_prompt`), matching
            # the "(disabled)" tab label.
            with Gradio.Tab(label="Configuration (disabled)"):
                top_p = Gradio.components.Slider(
                    value=0.4,
                    maximum=1,
                    interactive=True,
                    label="Top-P (Nucleus sampling)",
                    info="Represents the token diversity threshold for CogniForge.",
                )
                top_k = Gradio.components.Slider(
                    value=40,
                    maximum=100,
                    interactive=True,
                    label="Top-K sampling",
                    info="Represents the token probability threshold for CogniForge.",
                )
                temp = Gradio.components.Slider(
                    value=0.7,
                    maximum=2,
                    interactive=True,
                    label="Temperature",
                    info="Represents the creativity threshold for CogniForge.",
                )
        with Gradio.Group():
            output = Gradio.components.Textbox(value="", label="Output", info="Corvus' output")
        # Example prompts target the prompt box; example outputs are not cached.
        Gradio.Examples(
            examples=examples,
            inputs=[usr_prompt],
            cache_examples=False,
            fn=process_example,
            outputs=[output],
        )
        submit = Gradio.Button("Generate", variant="primary")
        # `generate` is a generator, so the output box receives each yielded
        # value in turn; concurrency_limit=1 is set for this event.
        submit.click(generate, inputs=[usr_prompt], outputs=[output], concurrency_limit=1)

demo.launch(debug=True)