"""Load the GGUF chat model that the rest of this script serves."""

from llama_cpp import Llama
import gradio as gr

# Module-level model handle, created once at import time so that later code
# in this file can reuse the same loaded model.
# `Llama.from_pretrained` resolves `repo_id` / `filename` against the
# Hugging Face Hub (see the llama-cpp-python API reference); the first run
# therefore presumably needs network access and the `huggingface-hub`
# package installed -- TODO confirm for the deployment environment.
llm = Llama.from_pretrained(
    repo_id="QuantFactory/Qwen2.5-7B-Instruct-Uncensored-GGUF",
    # The file name selects the Q2_K quantization published in that repo.
    filename="Qwen2.5-7B-Instruct-Uncensored.Q2_K.gguf",
)