import time
import openai
import gradio as gr
import requests
from pydub import AudioSegment as am
from xml.etree import ElementTree
# Service settings filled in from the Settings tab. Only stts_key and
# stts_region are rebound by a handler in this file (get_stts_set).
aoai_url, aoai_key, stts_key, stts_region = "", "", "", ""
openai.api_type = "azure"

# --- GPT playground state (Completion API) ---
prompts = ""        # most recent prompt submitted in the GPT playground
model_gpt = ""      # deployment name used as the `engine` argument
messages_gpt = []   # flat list of prompts and replies, shown on request
gpt_x = None        # last raw Completion response (None until the first call)

# --- ChatGPT state (ChatCompletion API) ---
model_chat = ""
messages_chat = [
    {"role": "system", "content": "You are an AI assistant that helps people find information."},
]
chat_x = None       # last raw ChatCompletion response (None until the first call)

# --- DALL-E state ---
response_walle = []  # every JSON payload received from the image service

# --- VoiceChat state ---
model_vchat = ""
messages_vchat = [
    {"role": "system", "content": "You are an AI assistant that helps people find information and just respond with SSML."},
]
# Initialised here so handlers that read them before the first model call
# (the response radio buttons, text_to_speech) do not raise NameError.
vchat_x = None
vchat_reply = ""
def get_aoai_set(get_aoai_url, get_aoai_key, get_aoai_API):
    """Apply the Azure OpenAI settings submitted from the Settings tab.

    Each non-empty argument is copied onto the matching attribute of the
    ``openai`` module (``api_base``, ``api_key``, ``api_version``); empty
    values leave the current setting untouched.

    Returns:
        A 3-tuple of Gradio updates echoing the submitted values back to the
        endpoint, key and API-version textboxes, in that order.
    """
    submitted = (
        ("api_base", get_aoai_url),
        ("api_key", get_aoai_key),
        ("api_version", get_aoai_API),
    )
    for attr_name, attr_value in submitted:
        if attr_value:
            setattr(openai, attr_name, attr_value)
    return tuple(gr.update(value=attr_value) for _, attr_value in submitted)
def get_stts_set(get_stts_key, get_stts_region):
    """Store the Speech service key and region submitted from the Settings tab.

    A non-empty argument replaces the corresponding module-level value
    (``stts_key`` / ``stts_region``); an empty one keeps the previous value.

    Returns:
        A pair of Gradio updates echoing the submitted key and region back to
        their textboxes.
    """
    global stts_key, stts_region
    # `x or current` keeps the current value whenever the submitted one is empty.
    stts_key = get_stts_key or stts_key
    stts_region = get_stts_region or stts_region
    return gr.update(value=get_stts_key), gr.update(value=get_stts_region)
# Root Gradio container; `page` is what gets launched at the end of the file.
# NOTE(review): this copy of the file has lost its indentation. The `with`
# statements below are presumably nested (Blocks > Tabs > TabItem > Row >
# Column) -- confirm against the original before running.
with gr.Blocks() as page:
with gr.Tabs():
# ---- "Settings" tab: endpoint / key inputs for Azure OpenAI and Speech ----
with gr.TabItem("Settings"):
# Static HTML help text for the Settings tab.
gr.HTML("""
Please read and set parameters before switching to another tab.
Your Azure OpenAI Key and other Azure Cognitive Service Keys
will not be saved or viewed by anyone.
You can find these parameters in Azure Portal. Select Azure OpenAI resource or Cognitive Service resource like Speech, and then select
'Keys and Endpoint' from left panel.
For Azure OpenAI service, you need to provide the resource URL and key for REST API. You also
need to set the API version or just use the default value. The Azure OpenAI model which is deployed needs to be set in each tab. Because
you may need to run different models at the same time. Don't forget to hit 'Enter' with every input.
For Azure Cognitive services,
you need to provide a Key for REST API, and also need to provide a service region, for example, 'westus'. The app will create the endpoint
URL by itself.
Thank you.
Azure OpenAI Service parameters for ChatGPT/GPT. Please input these settings and hit the
'Enter' key.
""")
# Azure OpenAI inputs: endpoint URL, API key (password-type textbox) and
# API version (pre-filled with "2023-03-15-preview").
with gr.Row():
with gr.Column(scale=0.6):
ui_aoai_url = gr.Textbox(placeholder="Like https://your-url-base.openai.azure.com , etc.",
label="- Azure OpenAI service API endpoint:", lines=1).style(container=False)
with gr.Column(scale=0.2):
ui_aoai_key = gr.Textbox(placeholder="Please enter your Azure OpenAI API key here.",
label="- Azure OpenAI service API Key: ", lines=1, type='password').style(container=False)
with gr.Column(scale=0.2):
ui_aoai_api = gr.Textbox(value="2023-03-15-preview", label="· Azure OpenAI service API version: ",
lines=1, interactive=True).style(container=False)
gr.HTML("Azure Cognitive Speech Service parameters to use VoiceChat. ")
# Speech service inputs: subscription key (password-type textbox) and region.
with gr.Row():
with gr.Column(scale=0.6):
ui_stts_key = gr.Textbox(placeholder="Please enter your speech service API key if you want to try VoiceChat. " +
"Please input these settings and hit 'Enter' key.",
label="- Azure Cognitive Speech service API Key: ", interactive=True, type='password').style(container=False)
with gr.Column(scale=0.4):
ui_stts_loc = gr.Textbox(placeholder="Please enter your speech service region.",
label="- Azure Cognitive Speech service region: ", interactive=True).style(container=False)
# Submitting any one of the three Azure OpenAI textboxes sends all three
# values to get_aoai_set and writes its returned updates back to them.
ui_aoai_url.submit(get_aoai_set, [ui_aoai_url, ui_aoai_key, ui_aoai_api], [ui_aoai_url, ui_aoai_key, ui_aoai_api])
ui_aoai_key.submit(get_aoai_set, [ui_aoai_url, ui_aoai_key, ui_aoai_api], [ui_aoai_url, ui_aoai_key, ui_aoai_api])
ui_aoai_api.submit(get_aoai_set, [ui_aoai_url, ui_aoai_key, ui_aoai_api], [ui_aoai_url, ui_aoai_key, ui_aoai_api])
# Same pattern for the two Speech service textboxes and get_stts_set.
ui_stts_key.submit(get_stts_set, [ui_stts_key, ui_stts_loc], [ui_stts_key, ui_stts_loc])
ui_stts_loc.submit(get_stts_set, [ui_stts_key, ui_stts_loc], [ui_stts_key, ui_stts_loc])
# ---- "GPT-3.5 Playground" tab: chatbot view, prompt box and parameters ----
with gr.TabItem("GPT-3.5 Playground"):
ui_chatbot_gpt = gr.Chatbot(label="GPT Playground:")
with gr.Row():
with gr.Column(scale=0.9):
ui_prompt_gpt = gr.Textbox(placeholder="Please enter your prompt here.", show_label=False).style(container=False)
with gr.Column(scale=0.1, min_width=100):
ui_clear_gpt = gr.Button("Clear Input", )
with gr.Accordion("Expand to config parameters:", open=True):
ui_memo_gpt = gr.HTML("GPT-3.5 playground use Completion(). So you just need to provide model name as engine parameter.")
# Deployment name; stored in the module-level `model_gpt` by get_engine_gpt.
ui_model_gpt = gr.Textbox(placeholder="Azure OpenAI GPT model deployment name. ",
label="- Azure OpenAI deployment name:", lines=1).style(container=False)
# Sampling sliders; the positional arguments are presumably
# (minimum, maximum, initial value) -- confirm against the Gradio Slider API.
with gr.Row():
ui_temp_gpt = gr.Slider(0.1, 1.0, 0.9, step=0.1, label="Temperature", interactive=True)
ui_max_tokens_gpt = gr.Slider(100, 4000, 1000, step=100, label="Max Tokens", interactive=True)
ui_top_p_gpt = gr.Slider(0.1, 1.0, 0.5, step=0.1, label="Top P", interactive=True)
# Collapsed panel: the radio picks what select_response_gpt writes into the
# read-only text area below it.
with gr.Accordion("Select radio button to see detail:", open=False):
ui_res_radio_gpt = gr.Radio(["Response from OpenAI Model", "Prompt messages history"], label="Show OpenAI response:", interactive=True)
ui_response_gpt = gr.TextArea(show_label=False, interactive=False).style(container=False)
def get_parameters_gpt(slider_1, slider_2, slider_3):
    """Record the GPT playground slider values and log them.

    The values are stored on the slider component objects themselves
    (``.value``) in the order temperature, max tokens, top-p. Nothing is
    returned, so no component is updated in the browser.
    """
    sliders = (ui_temp_gpt, ui_max_tokens_gpt, ui_top_p_gpt)
    for component, new_value in zip(sliders, (slider_1, slider_2, slider_3)):
        component.value = new_value
    print(
        "Log - Updated GPT parameters: Temperature=", ui_temp_gpt.value,
        " Max Tokens=", ui_max_tokens_gpt.value,
        " Top_P=", ui_top_p_gpt.value,
    )
def get_engine_gpt(get_aoai_model):
    """Remember the deployment name submitted for the GPT playground.

    Stores ``get_aoai_model`` in the module-level ``model_gpt`` and returns a
    Gradio update that writes the same text back to the textbox.
    """
    global model_gpt
    model_gpt = get_aoai_model
    echo = gr.update(value=get_aoai_model)
    return echo
def select_response_gpt(radio):
    """Return the detail text selected by the GPT playground radio button.

    Args:
        radio: The selected radio label. "Response from OpenAI Model" shows
            the last raw completion response; any other value shows the
            accumulated prompt/reply history (``messages_gpt``).

    Returns:
        A Gradio update for the detail text area.
    """
    if radio != "Response from OpenAI Model":
        return gr.update(value=messages_gpt)
    try:
        latest = gpt_x
    except NameError:
        # `gpt_x` is only created by bot_gpt; before the first completion
        # there is nothing to show, so present an empty box instead of failing.
        latest = ""
    return gr.update(value=latest)
def user_gpt(user_message, history):
    """Register a newly submitted GPT playground prompt.

    Saves the prompt in the module-level ``prompts`` (read later by
    ``bot_gpt``), appends it to ``messages_gpt`` and adds a pending
    ``[prompt, None]`` turn to the chatbot history.

    Returns:
        ``("", new_history)`` - the empty string clears the prompt textbox.
    """
    global prompts
    prompts = user_message
    messages_gpt.append(user_message)
    pending_turn = [user_message, None]
    return "", history + [pending_turn]
def bot_gpt(history):
    """Complete the latest GPT playground prompt and fill in the pending turn.

    Sends the module-level ``prompts`` to the deployment named by
    ``model_gpt`` through ``openai.Completion.create``. The raw response is
    kept in the global ``gpt_x`` for the detail panel, and the reply text is
    appended to ``messages_gpt``.

    Args:
        history: Chatbot history whose last entry is the pending
            ``[prompt, None]`` turn added by ``user_gpt``.

    Returns:
        The same history list with the last turn's reply filled in.
    """
    global gpt_x
    gpt_x = openai.Completion.create(
        engine=model_gpt,
        prompt=prompts,
        # Use the values recorded by get_parameters_gpt (or the sliders'
        # initial values) instead of fixed constants, so the Temperature /
        # Max Tokens / Top P controls on this tab actually take effect.
        temperature=ui_temp_gpt.value,
        max_tokens=ui_max_tokens_gpt.value,
        top_p=ui_top_p_gpt.value,
        frequency_penalty=0,
        presence_penalty=0,
        best_of=1,
        stop=None,
    )
    gpt_reply = gpt_x.choices[0].text
    messages_gpt.append(gpt_reply)
    history[-1][1] = gpt_reply
    return history
# ---- Event wiring for the GPT playground tab ----
# Deployment name textbox -> get_engine_gpt (result is echoed back to the textbox).
ui_model_gpt.submit(get_engine_gpt, ui_model_gpt , ui_model_gpt)
# A change on any slider sends all three slider values to get_parameters_gpt.
ui_temp_gpt.change(get_parameters_gpt, [ui_temp_gpt, ui_max_tokens_gpt, ui_top_p_gpt])
ui_max_tokens_gpt.change(get_parameters_gpt, [ui_temp_gpt, ui_max_tokens_gpt, ui_top_p_gpt])
ui_top_p_gpt.change(get_parameters_gpt, [ui_temp_gpt, ui_max_tokens_gpt, ui_top_p_gpt])
# Two-step submit: user_gpt records the prompt and adds a pending turn,
# then bot_gpt fills in the reply.
ui_prompt_gpt.submit(user_gpt, [ui_prompt_gpt, ui_chatbot_gpt], [ui_prompt_gpt, ui_chatbot_gpt], queue=False).then(
bot_gpt, ui_chatbot_gpt, ui_chatbot_gpt
)
# NOTE(review): the button is labelled "Clear Input" but this handler writes
# None to the chatbot component, and messages_gpt is not reset -- confirm intent.
ui_clear_gpt.click(lambda: None, None, ui_chatbot_gpt, queue=False)
ui_res_radio_gpt.change(select_response_gpt, ui_res_radio_gpt, ui_response_gpt)
# ---- "ChatGPT on GPT-4" tab: chatbot view, prompt box and parameters ----
with gr.TabItem("ChatGPT on GPT-4"):
ui_chatbot_chat = gr.Chatbot(label="ChatGPT:")
with gr.Row():
with gr.Column(scale=0.9):
ui_prompt_chat = gr.Textbox(placeholder="Please enter your prompt here.", show_label=False).style(container=False)
with gr.Column(scale=0.1, min_width=100):
ui_clear_chat = gr.Button("Clear Chat")
with gr.Blocks():
with gr.Accordion("Expand to config parameters:", open=True):
gr.HTML("ChatGPT use ChatCompletion(). Here is the default system prompt, you can change it to your own prompt.")
# Editable system prompt; its default text matches the initial system
# message in the module-level messages_chat.
ui_prompt_sys = gr.Textbox(value="You are an AI assistant that helps people find information.",
label="- Here is the default system prompt, you can change it to your own prompt.",
interactive=True).style(container=False)
# Deployment name; stored in the module-level `model_chat` by get_engine_chat.
ui_model_chat = gr.Textbox(placeholder="Azure OpenAI model deployment name. ",
label="- Azure OpenAI GPT-3.5/4 deployment name:", lines=1).style(container=False)
# Sampling sliders whose `.value` attributes are read by bot_chat.
with gr.Row():
ui_temp_chat = gr.Slider(0.1, 1.0, 0.7, step=0.1, label="Temperature", interactive=True)
ui_max_tokens_chat = gr.Slider(100, 8000, 2000, step=100, label="Max Tokens", interactive=True)
ui_top_p_chat = gr.Slider(0.05, 1.0, 0.9, step=0.1, label="Top P", interactive=True)
# Collapsed panel: the radio picks what select_response_chat writes into the
# read-only text area below it.
with gr.Accordion("Select radio button to see detail:", open=False):
ui_res_radio_chat = gr.Radio(["Response from OpenAI Model", "Prompt messages history"], label="Show OpenAI response:", interactive=True)
ui_response_chat = gr.TextArea(show_label=False, interactive=False).style(container=False)
def get_parameters_chat(slider_1, slider_2, slider_3):
    """Record the ChatGPT tab slider values and log them.

    The values are stored on the slider component objects (``.value``) in the
    order temperature, max tokens, top-p; ``bot_chat`` reads them from there.
    Nothing is returned.
    """
    sliders = (ui_temp_chat, ui_max_tokens_chat, ui_top_p_chat)
    for component, new_value in zip(sliders, (slider_1, slider_2, slider_3)):
        component.value = new_value
    print(
        "Log - Updated chatGPT parameters: Temperature=", ui_temp_chat.value,
        " Max Tokens=", ui_max_tokens_chat.value,
        " Top_P=", ui_top_p_chat.value,
    )
def get_engine_chat(get_aoai_model):
    """Remember the deployment name submitted for the ChatGPT tab.

    Stores ``get_aoai_model`` in the module-level ``model_chat`` and returns a
    Gradio update that writes the same text back to the textbox.
    """
    global model_chat
    model_chat = get_aoai_model
    echo = gr.update(value=get_aoai_model)
    return echo
def select_response_chat(radio):
    """Return the detail text selected by the ChatGPT tab radio button.

    Args:
        radio: The selected radio label. "Response from OpenAI Model" shows
            the last raw chat-completion response; any other value shows the
            conversation messages (``messages_chat``).

    Returns:
        A Gradio update for the detail text area.
    """
    if radio != "Response from OpenAI Model":
        return gr.update(value=messages_chat)
    try:
        latest = chat_x
    except NameError:
        # `chat_x` is only created by bot_chat; before the first reply there
        # is nothing to show, so present an empty box instead of failing.
        latest = ""
    return gr.update(value=latest)
def user_chat(user_message, history):
    """Register a newly submitted ChatGPT prompt.

    Appends the prompt as a ``user`` message to ``messages_chat`` and adds a
    pending ``[prompt, None]`` turn to the chatbot history.

    Returns:
        ``("", new_history)`` - the empty string clears the prompt textbox.
    """
    user_turn = {"role": "user", "content": user_message}
    messages_chat.append(user_turn)
    pending_turn = [user_message, None]
    return "", history + [pending_turn]
def bot_chat(history):
    """Ask the chat model for a reply and fill in the pending chatbot turn.

    Sends ``messages_chat`` to the deployment named by ``model_chat`` using
    the sampling values stored on the ChatGPT tab's sliders. The raw response
    is kept in the global ``chat_x`` (and on ``ui_response_chat.value``) and
    printed; the reply text is appended to ``messages_chat`` as an
    ``assistant`` message.

    Args:
        history: Chatbot history whose last entry is the pending turn.

    Returns:
        The same history list with the last turn's reply filled in.
    """
    global chat_x
    request = {
        "engine": model_chat,
        "messages": messages_chat,
        "temperature": ui_temp_chat.value,
        "max_tokens": ui_max_tokens_chat.value,
        "top_p": ui_top_p_chat.value,
        "frequency_penalty": 0,
        "presence_penalty": 0,
        "stop": None,
    }
    chat_x = openai.ChatCompletion.create(**request)
    ui_response_chat.value = chat_x
    print(ui_response_chat.value)

    chat_reply = chat_x.choices[0].message.content
    assistant_turn = {"role": "assistant", "content": chat_reply}
    messages_chat.append(assistant_turn)
    history[-1][1] = chat_reply
    return history
def reset_sys(sysmsg):
    """Restart the ChatGPT conversation with ``sysmsg`` as the system prompt.

    Rebinds the module-level ``messages_chat`` to a new list containing only
    the system message, discarding all earlier turns. Returns nothing.
    """
    global messages_chat
    system_turn = {"role": "system", "content": sysmsg}
    messages_chat = [system_turn]
# ---- Event wiring for the ChatGPT tab ----
# Deployment name textbox -> get_engine_chat (result is echoed back to the textbox).
ui_model_chat.submit(get_engine_chat, ui_model_chat, ui_model_chat)
ui_res_radio_chat.change(select_response_chat, ui_res_radio_chat, ui_response_chat)
# A change on any slider sends all three slider values to get_parameters_chat.
ui_temp_chat.change(get_parameters_chat, [ui_temp_chat, ui_max_tokens_chat, ui_top_p_chat])
ui_max_tokens_chat.change(get_parameters_chat, [ui_temp_chat, ui_max_tokens_chat, ui_top_p_chat])
ui_top_p_chat.change(get_parameters_chat, [ui_temp_chat, ui_max_tokens_chat, ui_top_p_chat])
# Submitting a new system prompt resets the conversation (reset_sys has no outputs).
ui_prompt_sys.submit(reset_sys, ui_prompt_sys)
# Two-step submit: user_chat records the prompt and adds a pending turn,
# then bot_chat fills in the reply.
ui_prompt_chat.submit(user_chat, [ui_prompt_chat, ui_chatbot_chat], [ui_prompt_chat, ui_chatbot_chat], queue=False).then(
bot_chat, ui_chatbot_chat, ui_chatbot_chat
)
# "Clear Chat" writes None to the chatbot, then resets messages_chat to the
# current system prompt.
ui_clear_chat.click(lambda: None, None, ui_chatbot_chat, queue=False).then(reset_sys, ui_prompt_sys)
# ---- "DALL·E 2 Painting" tab: prompt box, image output, response log ----
with gr.TabItem("DALL·E 2 Painting"):
ui_prompt_walle = gr.Textbox(placeholder="Please enter your prompt here to generate image.",
show_label=False).style(container=False)
ui_image_walle = gr.Image()
# Collapsed panel holding the read-only text area filled by get_response_walle.
with gr.Accordion("Select radio button to see detail:", open=False):
ui_response_walle = gr.TextArea(show_label=False, interactive=False).style(container=False)
def get_image_walle(prompt_walle):
    """Generate an image for ``prompt_walle`` via the Azure DALL-E preview API.

    Submits a text-to-image job to the endpoint derived from
    ``openai.api_base``, then polls the returned ``Operation-Location`` URL
    until the job reports ``"Succeeded"``. Every JSON payload received is
    appended to the module-level ``response_walle`` list and printed.

    Args:
        prompt_walle: Caption text describing the image to generate.

    Returns:
        A Gradio update whose value is the URL of the generated image.

    Raises:
        requests.HTTPError: If the submission request is rejected.
        RuntimeError: If the service reports that the job failed.
        TimeoutError: If the job has not succeeded after ``max_polls`` polls.
    """
    walle_api_version = '2022-08-03-preview'
    request_timeout = 30  # seconds per HTTP call, so a stalled connection cannot hang the handler
    max_polls = 60        # upper bound on status checks, so the handler always terminates

    # Normalise the base URL: the Settings placeholder shows it without a
    # trailing slash, which previously produced "...azure.comdalle/...".
    url = "{}/dalle/text-to-image?api-version={}".format(
        openai.api_base.rstrip("/"), walle_api_version)
    headers = {"api-key": openai.api_key, "Content-Type": "application/json"}
    body = {
        "caption": prompt_walle,
        "resolution": "1024x1024"
    }

    submission = requests.post(url, headers=headers, json=body, timeout=request_timeout)
    if not submission.ok:
        # Surface the service's explanation before raising; without this the
        # failure showed up later as a KeyError on the missing headers.
        print("Log - WALL·E status: {} {}".format(submission.status_code, submission.text))
        submission.raise_for_status()
    submitted = submission.json()
    response_walle.append(submitted)
    print("Log - WALL·E status: {}".format(submitted))

    operation_location = submission.headers['Operation-Location']
    # Fall back to a short fixed delay when the service sends no Retry-After.
    retry_after = int(submission.headers.get('Retry-After', 3))

    for _ in range(max_polls):
        time.sleep(retry_after)
        response = requests.get(operation_location, headers=headers, timeout=request_timeout)
        payload = response.json()  # parse once per poll
        response_walle.append(payload)
        print("Log - WALL·E status: {}".format(payload))
        status = payload.get('status', "")
        if status == "Succeeded":
            return gr.update(value=payload['result']['contentUrl'])
        if str(status).lower() in ("failed", "canceled", "cancelled"):
            # A terminal failure never turns into "Succeeded"; stop polling.
            raise RuntimeError("Image generation did not succeed: {}".format(payload))
    raise TimeoutError(
        "Image generation did not finish after {} status checks.".format(max_polls))
def get_response_walle():
    """Return a Gradio update showing every payload collected in ``response_walle``."""
    collected = response_walle
    return gr.update(value=collected)
# Submitting the prompt generates the image, then copies the collected
# service responses into the detail text area.
ui_prompt_walle.submit(get_image_walle, ui_prompt_walle, ui_image_walle, queue=False).then(get_response_walle, None, ui_response_walle)
# ---- "VoiceChat on GPT" tab: microphone input, spoken reply, transcript ----
with gr.TabItem("VoiceChat on GPT"):
with gr.Row():
with gr.Column():
with gr.Accordion("Expand to config parameters:", open=True):
# System prompt textbox; its default text matches the initial system message
# in the module-level messages_vchat.
# NOTE(review): no handler for this textbox is visible in this file, so edits
# to it do not appear to reach messages_vchat -- confirm.
ui_prompt_sys_vchat = gr.Textbox(value="You are an AI assistant that helps people find information and just respond with SSML.",
label="- Here is the default system prompt, you can change it to your own prompt.",
interactive=True).style(container=False)
# Deployment name; stored in the module-level `model_vchat` by get_engine_vchat.
ui_model_vchat = gr.Textbox(placeholder="- Azure OpenAI model deployment name. ",
label="- Azure OpenAI GPT-3.5/4 deployment name:", lines=1).style(container=False)
# Microphone recording is handed to the handlers as a file path.
ui_voice_inc_vchat = gr.Audio(source="microphone", type="filepath")
# Output audio component, filled by text_to_speech.
ui_voice_out_vchat = gr.Audio(value=None, type="filepath", interactive=False).style(container=False)
with gr.Accordion("Expand to config parameters:", open=False):
# Sampling sliders for the VoiceChat tab.
with gr.Row():
ui_temp_vchat = gr.Slider(0.1, 1.0, 0.7, step=0.1, label="Temperature", interactive=True)
ui_max_tokens_vchat = gr.Slider(100, 8000, 800, step=100, label="Max Tokens", interactive=True)
ui_top_p_vchat = gr.Slider(0.05, 1.0, 0.9, step=0.1, label="Top P", interactive=True)
with gr.Column():
ui_chatbot_vchat = gr.Chatbot(label="Voice to ChatGPT:")
# Collapsed panel: the radio picks what select_response_vchat writes into the
# read-only text area below it.
with gr.Accordion("Select radio button to see detail:", open=False):
ui_res_radio_vchat = gr.Radio(["Response from OpenAI Model", "Prompt messages history"], label="Show OpenAI response:", interactive=True)
ui_response_vchat = gr.TextArea(show_label=False, interactive=False).style(container=False)
def get_parameters_vchat(slider_1, slider_2, slider_3):
    """Record the VoiceChat tab slider values and log them.

    The values are stored on the slider component objects (``.value``) in the
    order temperature, max tokens, top-p. Nothing is returned.
    """
    sliders = (ui_temp_vchat, ui_max_tokens_vchat, ui_top_p_vchat)
    for component, new_value in zip(sliders, (slider_1, slider_2, slider_3)):
        component.value = new_value
    print(
        "Log - Updated chatGPT parameters: Temperature=", ui_temp_vchat.value,
        " Max Tokens=", ui_max_tokens_vchat.value,
        " Top_P=", ui_top_p_vchat.value,
    )
def get_engine_vchat(get_aoai_model):
    """Remember the deployment name submitted for the VoiceChat tab.

    Stores ``get_aoai_model`` in the module-level ``model_vchat`` and returns
    a Gradio update that writes the same text back to the textbox.
    """
    global model_vchat
    model_vchat = get_aoai_model
    echo = gr.update(value=get_aoai_model)
    return echo
def select_response_vchat(radio):
    """Return the detail text selected by the VoiceChat tab radio button.

    Args:
        radio: The selected radio label. "Response from OpenAI Model" shows
            the last raw chat-completion response; any other value shows the
            conversation messages (``messages_vchat``).

    Returns:
        A Gradio update for the detail text area.
    """
    if radio != "Response from OpenAI Model":
        return gr.update(value=messages_vchat)
    try:
        latest = vchat_x
    except NameError:
        # `vchat_x` is only created by bot_vchat; before the first reply there
        # is nothing to show, so present an empty box instead of failing.
        latest = ""
    return gr.update(value=latest)
def speech_to_text(voice_message, language='zh-CN'):
    """Transcribe a recorded WAV file with the Azure Speech REST API.

    The file at ``voice_message`` is resampled to 16 kHz in place and posted
    to the speech-to-text endpoint of the region stored in ``stts_region``,
    authenticated with ``stts_key``.

    Args:
        voice_message: Path of the WAV recording; the file is overwritten
            with its 16 kHz version.
        language: Recognition language sent to the service. Defaults to
            ``'zh-CN'``, the value that used to be hard-coded.

    Returns:
        The ``DisplayText`` field of the recognition result.

    Raises:
        RuntimeError: If the service answers with a non-200 status or the
            result contains no ``DisplayText``.
    """
    # Downsample input voice to 16 kHz to match the Content-Type sent below.
    voice_wav = am.from_file(voice_message, format='wav')
    voice_wav = voice_wav.set_frame_rate(16000)
    # export() hands back the open output file; close it so the data is
    # flushed to disk before the file is read again below.
    voice_wav.export(voice_message, format='wav').close()

    # STT
    service_region = stts_region
    base_url = "https://" + service_region + ".stt.speech.microsoft.com/"
    path = 'speech/recognition/conversation/cognitiveservices/v1'
    constructed_url = base_url + path
    params = {
        'language': language,
        'format': 'detailed'
    }
    headers = {
        'Ocp-Apim-Subscription-Key': stts_key,
        'Content-Type': 'audio/wav; codecs=audio/pcm; samplerate=16000',
        'Accept': 'application/json;text/xml'
    }
    with open(voice_message, 'rb') as audio_file:
        body = audio_file.read()

    response = requests.post(constructed_url, params=params, headers=headers,
                             data=body, timeout=30)
    if response.status_code != 200:
        print("\nLog - Status code: " + str(response.status_code) + "\nSomething went wrong. Check your subscription key and headers.\n")
        print("Reason: " + str(response.reason) + "\n")
        # Previously execution continued and failed on an unassigned variable.
        raise RuntimeError(
            "Speech-to-text request failed with status {}: {}".format(
                response.status_code, response.reason))

    rs = response.json()
    print(rs)
    if 'DisplayText' not in rs:
        # Report the service's own status rather than a bare KeyError.
        raise RuntimeError(
            "Speech-to-text returned no text (RecognitionStatus: {}).".format(
                rs.get('RecognitionStatus')))
    return rs['DisplayText']
def text_to_speech():
    """Synthesize the latest VoiceChat reply with the Azure Speech REST API.

    Wraps the module-level ``vchat_reply`` in an SSML ``<speak>``/``<voice>``
    document (voice ``zh-CN-XiaoxiaoNeural``) and posts it to the
    text-to-speech endpoint of the region in ``stts_region``. On success the
    returned audio is written to ``chatgpt.wav`` in the working directory.

    Returns:
        A Gradio update for the output audio component: the path of the
        written file on success, or ``None`` (no audio) when the request
        fails.
    """
    service_region = stts_region
    # The subscription key is deliberately NOT printed: it is a secret and
    # must not end up in console output or logs.
    base_url = "https://" + service_region + ".tts.speech.microsoft.com/"
    path = 'cognitiveservices/v1'
    constructed_url = base_url + path
    headers = {
        'Ocp-Apim-Subscription-Key': stts_key,
        'Content-Type': 'application/ssml+xml',
        'X-Microsoft-OutputFormat': 'riff-24khz-16bit-mono-pcm',
        'User-Agent': 'Voice ChatGPT'
    }

    # Build the SSML request body.
    xml_body = ElementTree.Element('speak', version='1.0')
    xml_body.set('{http://www.w3.org/XML/1998/namespace}lang', 'zh-cn')
    voice = ElementTree.SubElement(xml_body, 'voice')
    voice.set('{http://www.w3.org/XML/1998/namespace}lang', 'zh-cn')
    voice.set('name', 'zh-CN-XiaoxiaoNeural')
    voice.text = vchat_reply
    body = ElementTree.tostring(xml_body)

    response = requests.post(constructed_url, headers=headers, data=body, timeout=30)
    if response.status_code != 200:
        print("\nStatus code: " + str(response.status_code) + "\nSomething went wrong. Check your subscription key and headers.\n")
        print("Reason: " + str(response.reason) + "\n")
        # Do not point the player at chatgpt.wav here: it would be either a
        # stale reply from an earlier turn or a file that does not exist.
        return gr.update(value=None, interactive=True)

    tts_file = "chatgpt.wav"
    with open(tts_file, 'wb') as audio:
        audio.write(response.content)
    print("\nStatus code: " + str(response.status_code) + "\nYour TTS is ready for playback.\n")
    return gr.update(value=tts_file, interactive=True)
def user_vchat(user_voice_message, history):
    """Transcribe a voice recording and register it as the next user turn.

    The recording is passed to ``speech_to_text``; the resulting text is
    appended to ``messages_vchat`` as a ``user`` message and added to the
    chatbot history as a pending ``[text, None]`` turn.

    Returns:
        The extended chatbot history.
    """
    transcript = speech_to_text(user_voice_message)
    user_turn = {"role": "user", "content": transcript}
    messages_vchat.append(user_turn)
    pending_turn = [transcript, None]
    return history + [pending_turn]
def bot_vchat(history):
    """Ask the chat model for a VoiceChat reply and fill in the pending turn.

    Sends ``messages_vchat`` to the deployment named by ``model_vchat``. The
    raw response is kept in the global ``vchat_x`` (and on
    ``ui_response_vchat.value``) and printed; the reply text is stored in the
    global ``vchat_reply`` for ``text_to_speech`` and appended to
    ``messages_vchat`` as an ``assistant`` message.

    Args:
        history: Chatbot history whose last entry is the pending turn.

    Returns:
        The same history list with the last turn's reply filled in.
    """
    global vchat_x, vchat_reply
    vchat_x = openai.ChatCompletion.create(
        engine=model_vchat, messages=messages_vchat,
        # Read this tab's own sliders; the ChatGPT tab's sliders were used
        # here by mistake, so the VoiceChat controls had no effect.
        temperature=ui_temp_vchat.value,
        max_tokens=ui_max_tokens_vchat.value,
        top_p=ui_top_p_vchat.value,
        frequency_penalty=0,
        presence_penalty=0,
        stop=None
    )
    ui_response_vchat.value = vchat_x
    print(ui_response_vchat.value)
    vchat_reply = vchat_x.choices[0].message.content
    messages_vchat.append({"role": "assistant", "content": vchat_reply})
    history[-1][1] = vchat_reply
    return history
# ---- Event wiring for the VoiceChat tab ----
# Deployment name textbox -> get_engine_vchat (result is echoed back to the textbox).
ui_model_vchat.submit(get_engine_vchat, ui_model_vchat, ui_model_vchat)
ui_res_radio_vchat.change(select_response_vchat, ui_res_radio_vchat, ui_response_vchat)
# Wire this tab's own sliders to get_parameters_vchat. These three lines used
# to re-register the ChatGPT tab's sliders a second time, which left the
# VoiceChat sliders without any handler.
ui_temp_vchat.change(get_parameters_vchat, [ui_temp_vchat, ui_max_tokens_vchat, ui_top_p_vchat])
ui_max_tokens_vchat.change(get_parameters_vchat, [ui_temp_vchat, ui_max_tokens_vchat, ui_top_p_vchat])
ui_top_p_vchat.change(get_parameters_vchat, [ui_temp_vchat, ui_max_tokens_vchat, ui_top_p_vchat])
# A new recording is transcribed (user_vchat), answered (bot_vchat) and then
# spoken (text_to_speech), in that order.
ui_voice_inc_vchat.change(user_vchat, [ui_voice_inc_vchat, ui_chatbot_vchat], ui_chatbot_vchat, queue=False).then(
    bot_vchat, ui_chatbot_vchat, ui_chatbot_vchat, queue=False).then(text_to_speech, None, ui_voice_out_vchat)
# Start the app without a public share link, with debug mode enabled.
page.launch(share=False, debug=True)