"""Launch a Gradio web UI for the FlagAlpha/Llama2-Chinese-13b-Chat-4bit model."""

import gradio as gr

# Identifier handed to Gradio's loader; the "models/" prefix is kept exactly
# as in the original call.
MODEL_ID = "models/FlagAlpha/Llama2-Chinese-13b-Chat-4bit"

# `gr.Interface.load` is the legacy spelling: newer Gradio releases expose the
# same loader as top-level `gr.load` and drop the classmethod. Prefer the new
# entry point when it exists and fall back to the old one otherwise, so the
# script runs on either side of that change.
_load = getattr(gr, "load", None)
if not callable(_load):
    _load = gr.Interface.load

# Bound to a module-level name so the loaded app can be referenced after
# construction instead of being discarded once launch() returns.
demo = _load(MODEL_ID)

# Start the web server, as the original one-liner did.
demo.launch()