Spaces:

eastsheng
/

gpt_academic

Running

App Files Files Community

gpt_academic / crazy_functions /图片生成.py

eastsheng

Upload 266 files

506c93a verified 6 months ago

raw

history blame

12.7 kB

	from toolbox import CatchException, update_ui, get_conf, select_api_key, get_log_folder
	from crazy_functions.multi_stage.multi_stage_utils import GptAcademicState


	def gen_image(llm_kwargs, prompt, resolution="1024x1024", model="dall-e-2", quality=None, style=None):
	    """
	    Request one generated image from the images/generations endpoint and save a local copy.

	    The image endpoint is derived from the chat endpoint registered in
	    model_info for llm_kwargs['llm_model'], by replacing 'chat/completions'
	    with 'images/generations'.

	    Args:
	        llm_kwargs: mapping read for the keys 'api_key' and 'llm_model'.
	        prompt: image description, sent as the 'prompt' field.
	        resolution: sent as the 'size' field.
	        model: sent as the 'model' field.
	        quality: sent as 'quality' only when it is not None.
	        style: sent as 'style' only when it is not None.

	    Returns:
	        Tuple (image_url, local_path): the URL found in the response and the
	        path of the downloaded file under '<log folder>/image_gen/'.

	    Raises:
	        RuntimeError: the response is not JSON of the form
	            {'data': [{'url': ...}]}; the message is the raw response body.
	        requests.HTTPError: downloading the image returned an error status.
	    """
	    import requests, json, time, os
	    from request_llms.bridge_all import model_info

	    proxies = get_conf('proxies')
	    # Pick the API key and derive the image endpoint from the chat endpoint,
	    # e.g. 'https://api.openai.com/v1/chat/completions'
	    api_key = select_api_key(llm_kwargs['api_key'], llm_kwargs['llm_model'])
	    chat_endpoint = model_info[llm_kwargs['llm_model']]['endpoint']
	    url = chat_endpoint.replace('chat/completions', 'images/generations')
	    headers = {
	        'Authorization': f"Bearer {api_key}",
	        'Content-Type': 'application/json'
	    }
	    data = {
	        'prompt': prompt,
	        'n': 1,
	        'size': resolution,
	        'model': model,
	        'response_format': 'url'
	    }
	    if quality is not None:
	        data['quality'] = quality
	    if style is not None:
	        data['style'] = style

	    # Generate the image
	    response = requests.post(url, headers=headers, json=data, proxies=proxies)
	    print(response.content)
	    try:
	        image_url = json.loads(response.content.decode('utf8'))['data'][0]['url']
	    except (ValueError, KeyError, IndexError, TypeError) as err:
	        # ValueError covers both invalid JSON and invalid UTF-8; decode leniently
	        # here so that reporting the failure cannot itself fail.
	        raise RuntimeError(response.content.decode('utf8', errors='replace')) from err

	    # Save the image locally; refuse to store an HTTP error page as a .png
	    r = requests.get(image_url, proxies=proxies)
	    r.raise_for_status()
	    file_path = f'{get_log_folder()}/image_gen/'
	    os.makedirs(file_path, exist_ok=True)
	    file_name = 'Image' + time.strftime("%Y-%m-%d-%H-%M-%S", time.localtime()) + '.png'
	    with open(file_path+file_name, 'wb+') as f:
	        f.write(r.content)

	    return image_url, file_path+file_name


	def edit_image(llm_kwargs, prompt, image_path, resolution="1024x1024", model="dall-e-2"):
	    """
	    Send an image to the images/edits endpoint and save the edited result locally.

	    Before upload the image is preprocessed into sibling files next to
	    image_path: pure-white pixels are made transparent ('.tsp.png'), the
	    picture is padded to a square ('.tspsq.png'), and it is shrunk to at most
	    1024 pixels per side ('.ready.png'). The '.ready.png' file is uploaded.

	    Args:
	        llm_kwargs: mapping read for the keys 'api_key' and 'llm_model'.
	        prompt: edit instruction, sent as the 'prompt' form field.
	        image_path: path of the source image.
	        resolution: sent as the 'size' form field.
	        model: accepted for signature parity with gen_image; it is not
	            included in the request built here.

	    Returns:
	        Tuple (image_url, local_path): the URL found in the response and the
	        path of the downloaded file under '<log folder>/image_gen/'.

	    Raises:
	        RuntimeError: the response is not JSON of the form
	            {'data': [{'url': ...}]}; the message is the raw response body.
	        requests.HTTPError: downloading the image returned an error status.
	    """
	    import requests, json, time, os
	    from request_llms.bridge_all import model_info

	    proxies = get_conf('proxies')
	    api_key = select_api_key(llm_kwargs['api_key'], llm_kwargs['llm_model'])
	    chat_endpoint = model_info[llm_kwargs['llm_model']]['endpoint']
	    # e.g. 'https://api.openai.com/v1/chat/completions'
	    url = chat_endpoint.replace('chat/completions', 'images/edits')
	    n = 1
	    # No Content-Type header: requests sets the multipart boundary itself
	    headers = {
	        'Authorization': f"Bearer {api_key}",
	    }

	    # Preprocess: white -> transparent, pad to square, cap the size
	    make_transparent(image_path, image_path+'.tsp.png')
	    make_square_image(image_path+'.tsp.png', image_path+'.tspsq.png')
	    resize_image(image_path+'.tspsq.png', image_path+'.ready.png', max_size=1024)
	    image_path = image_path+'.ready.png'
	    with open(image_path, 'rb') as f:
	        file_content = f.read()
	    # No separate 'mask' part is sent; only the image and the text fields below
	    files = {
	        'image': (os.path.basename(image_path), file_content),
	        'prompt': (None, prompt),
	        "n": (None, str(n)),
	        'size': (None, resolution),
	    }

	    response = requests.post(url, headers=headers, files=files, proxies=proxies)
	    print(response.content)
	    try:
	        image_url = json.loads(response.content.decode('utf8'))['data'][0]['url']
	    except (ValueError, KeyError, IndexError, TypeError) as err:
	        # ValueError covers both invalid JSON and invalid UTF-8; decode leniently
	        # here so that reporting the failure cannot itself fail.
	        raise RuntimeError(response.content.decode('utf8', errors='replace')) from err

	    # Save the image locally; refuse to store an HTTP error page as a .png
	    r = requests.get(image_url, proxies=proxies)
	    r.raise_for_status()
	    file_path = f'{get_log_folder()}/image_gen/'
	    os.makedirs(file_path, exist_ok=True)
	    file_name = 'Image' + time.strftime("%Y-%m-%d-%H-%M-%S", time.localtime()) + '.png'
	    with open(file_path+file_name, 'wb+') as f:
	        f.write(r.content)

	    return image_url, file_path+file_name


	@CatchException
	def 图片生成_DALLE2(prompt, llm_kwargs, plugin_kwargs, chatbot, history, system_prompt, user_request):
	    """
	    Plugin entry point: generate an image from the text in the input area.

	    prompt          text typed by the user; used as the image description
	    llm_kwargs      model parameters; passed on to gen_image unchanged
	    plugin_kwargs   plugin parameters; a non-empty "advanced_arg" is used as the resolution
	    chatbot         handle of the chat display; messages for the user are appended to it
	    history         chat history; replaced by an empty list here
	    system_prompt   not used by this plugin
	    user_request    not used by this plugin
	    """
	    # Drop the history so that the input cannot overflow
	    history = []

	    if not prompt.strip():
	        chatbot.append((prompt, "[Local Message] 图像生成提示为空白，请在“输入区”输入图像生成提示。"))
	        yield from update_ui(chatbot=chatbot, history=history)
	        return

	    # The request takes a while, so refresh the UI once before starting it
	    chatbot.append(("您正在调用“图像生成”插件。", "[Local Message] 生成图像, 请先把模型切换至gpt-*。如果中文Prompt效果不理想, 请尝试英文Prompt。正在处理中 ....."))
	    yield from update_ui(chatbot=chatbot, history=history)

	    # An empty advanced argument counts as "not given"
	    if plugin_kwargs.get("advanced_arg") == "":
	        del plugin_kwargs["advanced_arg"]
	    resolution = plugin_kwargs.get("advanced_arg", '1024x1024')

	    image_url, image_path = gen_image(llm_kwargs, prompt, resolution)
	    report = "".join((
	        f'图像中转网址: <br/>`{image_url}`<br/>',
	        f'中转网址预览: <br/><div align="center"><img src="{image_url}"></div>',
	        f'本地文件地址: <br/>`{image_path}`<br/>',
	        f'本地文件预览: <br/><div align="center"><img src="file={image_path}"></div>',
	    ))
	    chatbot.append([prompt, report])
	    yield from update_ui(chatbot=chatbot, history=history)


	def _parse_dalle3_advanced_arg(advanced_arg):
	    """Split '<resolution>[-<quality>][-<style>]' into (resolution, quality, style)."""
	    # Strip each token so that input such as '1024x1024 - hd' is still understood
	    parts = [part.strip() for part in advanced_arg.lower().split('-')]
	    resolution = parts[0] or '1024x1024'
	    quality, style = 'standard', 'vivid'    # defaults for quality and style
	    for part in parts[1:]:
	        if part in ('hd', 'standard'):
	            quality = part
	        elif part in ('vivid', 'natural'):
	            style = part
	    return resolution, quality, style


	@CatchException
	def 图片生成_DALLE3(prompt, llm_kwargs, plugin_kwargs, chatbot, history, system_prompt, user_request):
	    """
	    Plugin entry point: generate an image with the "dall-e-3" model.

	    prompt          text typed by the user; used as the image description
	    llm_kwargs      model parameters; passed on to gen_image unchanged
	    plugin_kwargs   plugin parameters; a non-empty "advanced_arg" has the form
	                    '<resolution>[-<quality>][-<style>]', e.g. '1024x1024-hd-natural'.
	                    Quality is 'hd' or 'standard', style is 'vivid' or 'natural';
	                    unrecognized tokens are ignored and the default is
	                    '1024x1024-standard-vivid'.
	    chatbot         handle of the chat display; messages for the user are appended to it
	    history         chat history; replaced by an empty list here
	    system_prompt   not used by this plugin
	    user_request    not used by this plugin
	    """
	    history = []    # clear the history so that the input cannot overflow
	    if prompt.strip() == "":
	        chatbot.append((prompt, "[Local Message] 图像生成提示为空白，请在“输入区”输入图像生成提示。"))
	        yield from update_ui(chatbot=chatbot, history=history)
	        return
	    chatbot.append(("您正在调用“图像生成”插件。", "[Local Message] 生成图像, 请先把模型切换至gpt-*。如果中文Prompt效果不理想, 请尝试英文Prompt。正在处理中 ....."))
	    # The request takes a while, so refresh the UI once before starting it
	    yield from update_ui(chatbot=chatbot, history=history)
	    # An empty advanced argument counts as "not given"
	    if ("advanced_arg" in plugin_kwargs) and (plugin_kwargs["advanced_arg"] == ""):
	        plugin_kwargs.pop("advanced_arg")
	    resolution, quality, style = _parse_dalle3_advanced_arg(
	        plugin_kwargs.get("advanced_arg", '1024x1024-standard-vivid')
	    )
	    image_url, image_path = gen_image(llm_kwargs, prompt, resolution, model="dall-e-3", quality=quality, style=style)
	    chatbot.append([prompt,
	        f'图像中转网址: <br/>`{image_url}`<br/>'+
	        f'中转网址预览: <br/><div align="center"><img src="{image_url}"></div>'
	        f'本地文件地址: <br/>`{image_path}`<br/>'+
	        f'本地文件预览: <br/><div align="center"><img src="file={image_path}"></div>'
	    ])
	    yield from update_ui(chatbot=chatbot, history=history)


	class ImageEditState(GptAcademicState):
	    """
	    Multi-step input state for the image-editing plugin.

	    self.req holds three requirements, in order: a .png image, a resolution
	    and an edit prompt. Each entry stores its collected 'value', a
	    user-facing 'description' and the 'verify_fn' that accepts or rejects
	    a piece of user input for it.
	    """
	    # NOTE: work in progress

	    def get_image_file(self, x):
	        """
	        Check whether x points to a usable .png image.

	        x may be the path of a .png file, or of a directory that is searched
	        recursively for .png files. Returns (True, path) on success and
	        (False, None) otherwise.
	        """
	        import os, glob
	        if len(x) == 0: return False, None
	        if not os.path.exists(x): return False, None
	        if x.endswith('.png'): return True, x
	        # '**' is what makes recursive=True descend into sub-directories
	        file_manifest = [f for f in glob.glob(f'{x}/**/*.png', recursive=True) if os.path.exists(f)]
	        if not file_manifest:
	            return False, None
	        return True, file_manifest[0]

	    def lock_plugin(self, chatbot):
	        """Record this plugin under the 'lock_plugin' cookie and dump the state."""
	        chatbot._cookies['lock_plugin'] = 'crazy_functions.图片生成->图片修改_DALLE2'
	        self.dump_state(chatbot)

	    def unlock_plugin(self, chatbot):
	        """Reset the collected inputs, clear the 'lock_plugin' cookie and dump the state."""
	        self.reset()
	        chatbot._cookies['lock_plugin'] = None
	        self.dump_state(chatbot)

	    def get_resolution(self, x):
	        """Return (is_valid, x); valid values are '256x256', '512x512' and '1024x1024'."""
	        return (x in ['256x256', '512x512', '1024x1024']), x

	    def get_prompt(self, x):
	        """
	        Return (is_valid, x) for an edit prompt.

	        A prompt has at least 5 characters and is neither a valid resolution
	        nor a valid image path.
	        """
	        confirm = (len(x)>=5) and (not self.get_resolution(x)[0]) and (not self.get_image_file(x)[0])
	        return confirm, x

	    def reset(self):
	        """(Re)initialize the three requirements with no value collected."""
	        self.req = [
	            {'value':None, 'description': '请先上传图像（必须是.png格式）, 然后再次点击本插件', 'verify_fn': self.get_image_file},
	            {'value':None, 'description': '请输入分辨率,可选：256x256, 512x512 或 1024x1024, 然后再次点击本插件', 'verify_fn': self.get_resolution},
	            {'value':None, 'description': '请输入修改需求,建议您使用英文提示词, 然后再次点击本插件', 'verify_fn': self.get_prompt},
	        ]
	        self.info = ""

	    def feed(self, prompt, chatbot):
	        """
	        Offer the user input to the still-unfilled requirements, in order.

	        The first requirement whose verifier accepts the input stores it, the
	        state is dumped, and the search stops. Returns self.
	        """
	        for r in self.req:
	            if r['value'] is None:
	                confirm, res = r['verify_fn'](prompt)
	                if confirm:
	                    r['value'] = res
	                    self.dump_state(chatbot)
	                    break
	        return self

	    def next_req(self):
	        """Return the description of the first unfilled requirement, or a message that everything was collected."""
	        for r in self.req:
	            if r['value'] is None:
	                return r['description']
	        return "已经收集到所有信息"

	    def already_obtained_all_materials(self):
	        """Return True once every requirement has a value."""
	        return all(x['value'] is not None for x in self.req)

	@CatchException
	def 图片修改_DALLE2(prompt, llm_kwargs, plugin_kwargs, chatbot, history, system_prompt, user_request):
	    """
	    Plugin entry point: edit an uploaded image (work in progress).

	    The plugin is invoked repeatedly. Each call feeds the current input into
	    an ImageEditState, which collects an image, a resolution and an edit
	    prompt. While something is missing, the next request is shown to the
	    user. Once everything is available, edit_image is called and the result
	    is displayed.

	    prompt          current user input; may be an image path, a resolution or the edit prompt
	    llm_kwargs      model parameters; passed on to edit_image unchanged
	    plugin_kwargs   not used by this plugin
	    chatbot         handle of the chat display; also carries the plugin state
	    history         chat history; replaced by an empty list here
	    system_prompt   not used by this plugin
	    user_request    not used by this plugin
	    """
	    # NOTE: work in progress
	    history = []    # clear the history
	    state = ImageEditState.get_state(chatbot, ImageEditState)
	    state = state.feed(prompt, chatbot)
	    state.lock_plugin(chatbot)
	    if not state.already_obtained_all_materials():
	        chatbot.append(["图片修改\n\n1. 上传图片（图片中需要修改的位置用橡皮擦擦除为纯白色，即RGB=255,255,255）\n2. 输入分辨率 \n3. 输入修改需求", state.next_req()])
	        yield from update_ui(chatbot=chatbot, history=history)
	        return

	    image_path = state.req[0]['value']
	    resolution = state.req[1]['value']
	    prompt = state.req[2]['value']
	    chatbot.append(["图片修改, 执行中", f"图片:`{image_path}`<br/>分辨率:`{resolution}`<br/>修改需求:`{prompt}`"])
	    yield from update_ui(chatbot=chatbot, history=history)
	    try:
	        image_url, image_path = edit_image(llm_kwargs, prompt, image_path, resolution)
	    except Exception:
	        # Release the lock on failure; otherwise the plugin stays locked with
	        # the same complete (and failing) set of inputs.
	        state.unlock_plugin(chatbot)
	        raise
	    chatbot.append([prompt,
	        f'图像中转网址: <br/>`{image_url}`<br/>'+
	        f'中转网址预览: <br/><div align="center"><img src="{image_url}"></div>'
	        f'本地文件地址: <br/>`{image_path}`<br/>'+
	        f'本地文件预览: <br/><div align="center"><img src="file={image_path}"></div>'
	    ])
	    yield from update_ui(chatbot=chatbot, history=history)
	    state.unlock_plugin(chatbot)

	def make_transparent(input_image_path, output_image_path):
	    """
	    Save a copy of an image in which every pure-white pixel is fully transparent.

	    The image is converted to RGBA. Each pixel whose RGB value is
	    (255, 255, 255) becomes (255, 255, 255, 0); all other pixels are kept.
	    The result is written to output_image_path as PNG.
	    """
	    from PIL import Image
	    # The context manager closes the source file handle once we are done
	    with Image.open(input_image_path) as source:
	        image = source.convert("RGBA")
	        new_data = [
	            (255, 255, 255, 0) if item[:3] == (255, 255, 255) else item
	            for item in image.getdata()
	        ]
	        image.putdata(new_data)
	        image.save(output_image_path, "PNG")

	def resize_image(input_path, output_path, max_size=1024):
	    """
	    Save a copy of an image whose longer side is at most max_size pixels.

	    An image that exceeds max_size in width or height is scaled down with
	    its aspect ratio preserved. A smaller image is saved unchanged.
	    """
	    from PIL import Image
	    with Image.open(input_path) as img:
	        width, height = img.size
	        if width > max_size or height > max_size:
	            # Clamp the shorter side to 1: int() truncates to 0 for extreme
	            # aspect ratios, and a zero-sized target cannot be resized to.
	            if width >= height:
	                new_width = max_size
	                new_height = max(1, int((max_size / width) * height))
	            else:
	                new_height = max_size
	                new_width = max(1, int((max_size / height) * width))

	            resized_img = img.resize(size=(new_width, new_height))
	            resized_img.save(output_path)
	        else:
	            img.save(output_path)

	def make_square_image(input_path, output_path):
	    """
	    Pad an image to a square and save it.

	    A black RGBA canvas is created whose side equals the longer side of the
	    input. The input is pasted centered onto it and the canvas is written to
	    output_path.
	    """
	    from PIL import Image
	    with Image.open(input_path) as source:
	        src_w, src_h = source.size
	        side = src_w if src_w >= src_h else src_h
	        # Top-left corner that centers the source on the canvas
	        offset = ((side - src_w) // 2, (side - src_h) // 2)
	        canvas = Image.new("RGBA", (side, side), color="black")
	        canvas.paste(source, offset)
	        canvas.save(output_path)