Stable-Diffusion-3.5-Serverless

Runtime error

App Files Files Community

Stable-Diffusion-3.5-Serverless / app.py

K00B404

Update app.py

52bd1b1 verified 26 days ago

raw

history blame contribute delete

7.62 kB

	import gradio as gr
	import requests
	import io
	import random
	import os
	import time
	from PIL import Image
	from deep_translator import GoogleTranslator
	import json
	from gradio_client import Client

	# Project by Nymbo

	# Hugging Face Inference API endpoint for the Stable Diffusion 3.5 Large model.
	API_URL = "https://api-inference.huggingface.co/models/stabilityai/stable-diffusion-3.5-large"
	# Access token read from the HF_READ_TOKEN environment variable (None when unset).
	API_TOKEN = os.getenv("HF_READ_TOKEN")
	# Default bearer-auth header; query() rebuilds its own headers on every call.
	headers = {"Authorization": f"Bearer {API_TOKEN}"}
	# Passed as the `timeout` argument of requests.post() in query() (seconds).
	timeout = 100

	# Initialize the prompt enhancer client.
	# Constructing the client connects to the enhancer Space, so a failure here
	# (Space down, network error) must not take the whole app down: fall back to
	# None and let enhance_prompt() hand prompts back unchanged.
	try:
	    prompt_enhancer = Client("K00B404/mistral-nemo-prompt-enhancer")
	except Exception as e:
	    print(f"Error initializing prompt enhancer: {e}")
	    prompt_enhancer = None


	def enhance_prompt(prompt, enable_enhancement=True):
	    """Enhance the given prompt using the Mistral Nemo prompt enhancer.

	    Args:
	        prompt: Text prompt to enhance.
	        enable_enhancement: When False, the prompt is returned untouched.

	    Returns:
	        The enhanced prompt, or the original ``prompt`` when enhancement is
	        disabled, the enhancer client is unavailable, the remote call fails,
	        or the enhancer returns nothing usable (None / blank text).
	    """
	    if not enable_enhancement:
	        print(f'\033[1mPrompt enhancement disabled, using original prompt:\033[0m {prompt}')
	        return prompt

	    if prompt_enhancer is None:
	        print("Prompt enhancer unavailable, using original prompt")
	        return prompt

	    system_message = (
	        "You are an expert at writing detailed, high-quality image generation prompts. "
	        "Enhance the given prompt by adding relevant artistic details, style elements, and quality descriptors. "
	        "Keep the original intent but make it more elaborate and specific."
	    )

	    # Keep the try body down to the remote call: that is the only step that is
	    # expected to fail, and enhancement is strictly best-effort.
	    try:
	        enhanced = prompt_enhancer.predict(
	            message=prompt,
	            system_message=system_message,
	            max_tokens=512,
	            temperature=0.7,
	            top_p=0.95,
	            api_name="/chat",
	        )
	    except Exception as e:
	        print(f"Error enhancing prompt: {e}")
	        return prompt  # Fall back to original prompt if enhancement fails

	    # An empty answer would otherwise replace the user's prompt with nothing.
	    if enhanced is None or not str(enhanced).strip():
	        print("Prompt enhancer returned an empty result, using original prompt")
	        return prompt

	    print(f'\033[1mOriginal prompt:\033[0m {prompt}')
	    print(f'\033[1mEnhanced prompt:\033[0m {enhanced}')
	    return enhanced

	# Function to query the API and return the generated image
	def query(prompt, is_negative=False, steps=35, cfg_scale=7, sampler="DPM++ 2M Karras", seed=-1, strength=0.7, width=1024, height=1024, enable_enhancement=True):
	    """Generate an image for ``prompt`` through the inference endpoint at API_URL.

	    The prompt is translated (Russian -> English), optionally enhanced with
	    enhance_prompt(), suffixed with quality keywords and posted to the API.

	    Args:
	        prompt: User prompt; None, empty or whitespace-only yields no output.
	        is_negative: Sent as the ``is_negative`` payload field (the UI passes
	            the negative prompt text here).
	        steps: Sent as the ``steps`` payload field.
	        cfg_scale: Sent as the ``cfg_scale`` payload field.
	        sampler: Accepted for interface compatibility; not used in the payload.
	        seed: Seed to send; -1 picks a random seed in [1, 1000000000].
	        strength: Sent as the ``strength`` payload field.
	        width: Sent as ``parameters.width``.
	        height: Sent as ``parameters.height``.
	        enable_enhancement: Forwarded to enhance_prompt().

	    Returns:
	        ``(image, enhanced_prompt)`` on success, or ``(None, None)`` when the
	        prompt is blank or the response body cannot be opened as an image.

	    Raises:
	        gr.Error: If the request cannot be completed or the API answers with
	            a status code other than 200.
	    """
	    if prompt is None or not str(prompt).strip():
	        return None, None

	    # Short random id used only to correlate the log lines of one generation.
	    key = random.randint(0, 999)

	    # Read the token per request; omit the header when no token is configured
	    # instead of sending the bogus credential "Bearer None".
	    api_token = os.getenv("HF_READ_TOKEN")
	    headers = {"Authorization": f"Bearer {api_token}"} if api_token else {}

	    # Translate the prompt from Russian to English if necessary.
	    # Translation is a convenience: if the service fails, keep the prompt as
	    # typed rather than aborting the whole generation.
	    try:
	        translated = GoogleTranslator(source='ru', target='en').translate(prompt)
	    except Exception as e:
	        print(f"Error translating prompt: {e}")
	        translated = None
	    if translated:
	        prompt = translated
	    print(f'\033[1mGeneration {key} translation:\033[0m {prompt}')

	    # Enhance the prompt using the Mistral Nemo model if enabled
	    enhanced_prompt = enhance_prompt(prompt, enable_enhancement)

	    # Add some extra flair to the prompt (plain "|" separator; "\|" is an
	    # invalid escape sequence and would leak a backslash into the prompt).
	    final_prompt = f"{enhanced_prompt} | ultra detail, ultra elaboration, ultra quality, perfect."
	    print(f'\033[1mGeneration {key} final prompt:\033[0m {final_prompt}')

	    # Prepare the payload for the API call, including width and height.
	    # NOTE(review): confirm the endpoint honors the top-level keys below; the
	    # documented text-to-image options (negative_prompt, num_inference_steps,
	    # guidance_scale, seed) live under "parameters".
	    payload = {
	        "inputs": final_prompt,
	        "is_negative": is_negative,
	        "steps": steps,
	        "cfg_scale": cfg_scale,
	        "seed": seed if seed != -1 else random.randint(1, 1000000000),
	        "strength": strength,
	        "parameters": {
	            "width": width,
	            "height": height,
	        },
	    }

	    # Send the request to the API and handle the response
	    try:
	        response = requests.post(API_URL, headers=headers, json=payload, timeout=timeout)
	    except requests.exceptions.RequestException as e:
	        # Timeouts / connection failures: surface a readable error in the UI.
	        print(f"Error: Request to the inference API failed: {e}")
	        raise gr.Error(f"Request failed: {e}") from e

	    if response.status_code != 200:
	        print(f"Error: Failed to get image. Response status: {response.status_code}")
	        print(f"Response content: {response.text}")
	        if response.status_code == 503:
	            raise gr.Error(f"{response.status_code} : The model is being loaded")
	        raise gr.Error(f"{response.status_code}")

	    # Convert the response content into an image
	    try:
	        image = Image.open(io.BytesIO(response.content))
	    except Exception as e:
	        print(f"Error when trying to open the image: {e}")
	        return None, None

	    print(f'\033[1mGeneration {key} completed!\033[0m ({final_prompt})')
	    return image, enhanced_prompt

	# CSS to style the app: horizontally centers the element with id
	# "app-container" (the id given to the main gr.Column of the UI) and caps
	# its width at 800px.
	css = """
	#app-container {
	max-width: 800px;
	margin-left: auto;
	margin-right: auto;
	}
	"""

	# Build the Gradio UI with Blocks.
	# NOTE(review): the nesting of rows/columns below was reconstructed from the
	# comments and component order — confirm it matches the intended layout.
	with gr.Blocks(theme='Nymbo/Nymbo_Theme', css=css) as app:
	    # Add a title to the app
	    gr.HTML("<center><h1>Stable Diffusion 3.5 Large with Prompt Enhancement</h1></center>")

	    # Container for all the UI elements (styled through the #app-container CSS rule)
	    with gr.Column(elem_id="app-container"):
	        # Add a text input for the main prompt
	        with gr.Row():
	            with gr.Column(elem_id="prompt-container"):
	                with gr.Row():
	                    text_prompt = gr.Textbox(
	                        label="Prompt",
	                        placeholder="Enter a prompt here - it will be automatically enhanced for better results",
	                        lines=2,
	                        elem_id="prompt-text-input"
	                    )

	                # Accordion for advanced settings
	                with gr.Row():
	                    with gr.Accordion("Advanced Settings", open=False):
	                        enable_enhancement = gr.Checkbox(
	                            label="Enable Prompt Enhancement",
	                            value=True
	                        )
	                        negative_prompt = gr.Textbox(
	                            label="Negative Prompt",
	                            placeholder="What should not be in the image",
	                            value="(deformed, distorted, disfigured), poorly drawn, bad anatomy, wrong anatomy, extra limb, missing limb, floating limbs, (mutated hands and fingers), disconnected limbs, mutation, mutated, ugly, disgusting, blurry, amputation, misspellings, typos",
	                            lines=3,
	                            elem_id="negative-prompt-text-input"
	                        )
	                        # Width and height share one row
	                        with gr.Row():
	                            width = gr.Slider(label="Width", value=1024, minimum=64, maximum=1216, step=32)
	                            height = gr.Slider(label="Height", value=1024, minimum=64, maximum=1216, step=32)
	                        steps = gr.Slider(label="Sampling steps", value=35, minimum=1, maximum=100, step=1)
	                        cfg = gr.Slider(label="CFG Scale", value=7, minimum=1, maximum=20, step=1)
	                        strength = gr.Slider(label="Strength", value=0.7, minimum=0, maximum=1, step=0.001)
	                        # -1 asks query() to pick a random seed
	                        seed = gr.Slider(label="Seed", value=-1, minimum=-1, maximum=1000000000, step=1)
	                        method = gr.Radio(
	                            label="Sampling method",
	                            value="DPM++ 2M Karras",
	                            choices=["DPM++ 2M Karras", "DPM++ SDE Karras", "Euler", "Euler a", "Heun", "DDIM"]
	                        )

	        # Add a button to trigger the image generation
	        with gr.Row():
	            text_button = gr.Button("Generate Enhanced Image", variant='primary', elem_id="gen-button")

	        # Image output area to display the generated image
	        with gr.Row():
	            image_output = gr.Image(type="pil", label="Image Output", elem_id="gallery")

	        # Text output area to display the enhanced prompt
	        with gr.Row():
	            prompt_output = gr.Textbox(label="Enhanced Prompt", elem_id="prompt-output")

	        # Bind the button to the query function with all inputs.
	        # Inputs are passed positionally, so their order must follow query()'s
	        # signature: prompt, is_negative, steps, cfg_scale, sampler, seed,
	        # strength, width, height, enable_enhancement.
	        text_button.click(
	            query,
	            inputs=[text_prompt, negative_prompt, steps, cfg, method, seed, strength, width, height, enable_enhancement],
	            outputs=[image_output, prompt_output]
	        )

	# Launch the Gradio app
	app.launch(show_api=True, share=False)