Chat_FastAPI / app.py
Shrees0507's picture
Update app.py
d069c62 verified
raw
history blame
1.62 kB
from fastapi import FastAPI, HTTPException
from pydantic import BaseModel
from huggingface_hub import InferenceClient
import os
import gradio as gr
app = FastAPI()
client = InferenceClient(model="HuggingFaceH4/zephyr-7b-beta", token=os.getenv("huggingface_token"))
class Message(BaseModel):
input: str
history: list
@app.get("/")
async def home():
return {"message": "Welcome to the chatbot API!"}
@app.post("/chat")
async def chat(message: Message):
try:
input_message = message.input
# Call the chatbot function
response = chatbot(input_message)
return {"response": response}
except Exception as e:
raise HTTPException(status_code=500, detail=str(e))
def chatbot(input, history):
try:
# Call your chatbot function here
message = [{"role": "user", "content": input}]
history = [{"role": "system", "content": "You are a helpful assistant."}]
messages = history + message
output = client.chat_completion(
messages=messages,
max_tokens=4000,
temperature=0.7
)
return output.choices[0].message.content
except Exception as e:
raise Exception(str(e))
# Define the Gradio chat interface
def gradio_chat(input):
response = chatbot(input, [])
return response
# Define Gradio inputs and outputs
inputs = [gr.Textbox(lines=5, label="Input")]
output = gr.Textbox(label="Response")
# Create Gradio interface
gr.Interface(chatbot, inputs=inputs, outputs=output, title="Chatbot",fill_height=True).launch()