Spaces:

nqdior
/

stable-image-webui

Running

App Files Files Community

stable-image-webui / app.py

nqdior

update theme

ec6d589 4 months ago

raw

history blame

24 kB

	import gradio as gr
	import numpy as np
	import requests
	from PIL import Image
	from io import BytesIO
	import time

	# Upper bound of the seed slider: the largest signed 32-bit integer.
	MAX_SEED = np.iinfo(np.int32).max
	# NOTE(review): not referenced anywhere in the visible code - confirm whether
	# it is still needed before relying on it.
	MAX_IMAGE_SIZE = 1344

	# English page header (Markdown). Exposed to the UI as translations["en"]["title"].
	title = """
	# Stability AI - Developer Platform WebUI
	### UI for using the stable image api

	API Key is required to use this service.
	https://platform.stability.ai/account/keys

	Contact: D̷ELL@Stability AI - Advocate (https://x.com/xqdior) / Author: umise (https://x.com/UiE029)
	"""

	# Japanese page header (Markdown). Exposed to the UI as translations["ja"]["title"].
	title_jp = """
	# Stability AI - Developer Platform WebUI
	### このSpaceは、Stable Image APIを使用するためのWEB-UIです。

	このサービスを利用するにはAPIキーが必要です。以下のリンクから取得してください。
	https://platform.stability.ai/account/keys

	お問い合わせ先: D̷ELL@Stability AI - Advocate (https://x.com/xqdior) / Author: umise (https://x.com/UiE029)
	"""

	# English "How to use" text (Markdown), shown inside the collapsible overview
	# accordion via translations["en"]["overview"].
	overview = """

	Overview
	Stability AI’s Stable Image services offer a growing set of APIs for developers to build the best in class image applications.

	- Disrupting Content Creation: Stability’s Image APIs are the foundation for applications disrupting publishing, media, gaming, marketing, advertising, design, and more.
	- For Developers: Application developers can build advanced features for designers, photographers, content creators, and a variety of B2C customers.
	- Simple APIs: Stability AI is focused on delivering simple APIs for easy integration into applications with a high bar for quality, alignment, speed, and safety.

	Get Started Now: https://platform.stability.ai/docs/getting-started/stable-image
	"""

	# Japanese "How to use" text (Markdown), shown via translations["ja"]["overview"].
	# Unlike the English text it describes each mode and submode of the UI.
	overview_jp = """
	各種モードについて
	- テキストから生成:
	プロンプトを基に画像を生成します。
	- アップスケール:
	- 通常のアップスケール:
	できるだけ絵を変更せずにアップスケールします
	- クリエィティブなアップスケール:
	絵全体をいい感じになるようにアップスケールします
	- 画像の編集:
	- 消去:
	マスクした要素を削除します
	- インペイント:
	マスクされた部分とプロンプトを基に再生成します
	- アウトペイント:
	指定した範囲分、画像を拡張します
	- 検索と置き換え:
	検索プロンプトに入力されたオブジェクトを探し、プロンプトをもとにオブジェクトを再生成します
	- コントロール:
	- 構図:
	入力画像の構図を基に新しい画像を生成します
	- スケッチ:
	ラフなスケッチとプロンプトを基に生成します
	"""

	# Common root of every Stable Image endpoint used by this app.
	_STABLE_IMAGE_API = "https://api.stability.ai/v2beta/stable-image"

	# Text-to-image endpoints, keyed by model family.
	model_url = {
	    key: f"{_STABLE_IMAGE_API}/generate/{slug}"
	    for key, slug in (
	        ("ImageUltra", "ultra"),
	        ("ImageCore", "core"),
	        ("StableDiffusion3", "sd3"),
	    )
	}

	# Upscale / edit / control endpoints, keyed by the service name used in generate().
	service_url = {
	    key: f"{_STABLE_IMAGE_API}/{path}"
	    for key, path in (
	        ("Conservative_Upscale", "upscale/conservative"),
	        ("Creative_Upscale", "upscale/creative"),
	        ("Erase", "edit/erase"),
	        ("Inpaint", "edit/inpaint"),
	        ("Outpaint", "edit/outpaint"),
	        ("SR", "edit/search-and-replace"),
	        ("RMBG", "edit/remove-background"),
	        ("Sketch", "control/sketch"),
	        ("Structure", "control/structure"),
	    )
	}


	# UI strings per language code. Both languages define the same set of keys and
	# every lookup in this file has the form translations[lang][key].
	#
	# The mode and submode labels ("Generate", "Upscale", "Erase", ...) are used as
	# dropdown choices AND compared against the selected dropdown value in
	# generate(), update_mode() and update_submode(), so within one language these
	# labels must stay distinct from each other.
	translations = {
	"en": {
	"api_key": "API Key",
	"api_key_placeholder": "Enter your API key",
	"model_label": "Model",
	"mode_label": "Mode",
	"prompt_placeholder": "Enter your prompt",
	"negative_prompt_placeholder": "Enter a negative prompt",
	"seed_label": "Seed",
	"randomize_seed_label": "Randomize seed",
	"aspect_label": "Aspect ratio",
	"run_button": "Run",
	"result_label": "Result",
	"copy_field_placeholder": "Copy the field",
	"Negative_prompt": "Negative prompt",
	"Advanced_Settings": "Advanced Settings",
	"Example": "Example",
	# Top-level modes.
	"Generate": "Generate",
	"Upscale": "Upscale",
	"Edit": "Edit",
	"Control": "Control",
	"Submode": "Submode",
	# Submodes.
	"Conservative": "Conservative",
	"Creative": "Creative",
	"Erase": "Erase",
	"Inpaint": "Inpaint",
	"Outpaint": "Outpaint",
	"Structure": "Structure",
	"Sketch": "Sketch",
	"Search_and_Replace": "Search and Replace",
	"Remove_Background": "Remove Background",
	"input_image": "Input Image",
	"style_preset": "Style preset",
	"preset_description": "This parameter is only available for ImageCore model.",
	"Search_prompt_placeholder": "Enter a search prompt",
	"Control_Strength": "Control Strength",
	"overview": overview,
	"overview_label": "How to use",
	"title": title,
	},
	"ja": {
	"api_key": "APIキー",
	"api_key_placeholder": "APIキーを入力してください",
	"model_label": "モデル",
	"mode_label": "モード",
	"prompt_placeholder": "プロンプトを入力してください",
	"negative_prompt_placeholder": "ネガティブプロンプトを入力してください",
	"seed_label": "シード",
	"randomize_seed_label": "シードをランダム化",
	"aspect_label": "アスペクト比",
	"run_button": "実行",
	"result_label": "結果",
	"copy_field_placeholder": "ここに貼り付け用の情報が出てきます",
	"Negative_prompt": "ネガティブプロンプト",
	"Advanced_Settings": "追加設定",
	"Example": "例",
	# Top-level modes.
	"Generate": "テキストから生成",
	"Upscale": "アップスケール",
	"Edit": "画像の編集",
	"Control": "コントロールモード",
	"Submode": "サブモード",
	# Submodes.
	"Conservative": "通常のアップスケール",
	"Creative": "クリエィティブなアップスケール",
	"Erase": "消去",
	"Inpaint": "インペイント",
	"Outpaint": "アウトペイント(拡張)",
	"Structure": "構図",
	"Sketch": "スケッチ",
	"Search_and_Replace": "検索と置き換え",
	"Remove_Background": "背景削除",
	"input_image": "入力画像",
	"style_preset": "スタイルのプリセット",
	"preset_description": "このパラメータはimage coreのときにだけ有効になります",
	"Search_prompt_placeholder": "探したい要素を入力してください",
	"Control_Strength": "コントロールネットの適用強度",
	"overview": overview_jp,
	"overview_label": "使い方",
	"title": title_jp,
	},
	}

	# Active UI language; must be one of the keys of `translations`.
	lang = "ja"


	def bytes_to_image(image):
	    """Decode encoded image bytes into an RGB PIL image.

	    Args:
	        image: Bytes of an encoded image, e.g. the body of an API response.

	    Returns:
	        The decoded ``PIL.Image.Image`` converted to ``"RGB"`` mode (an alpha
	        channel, if present, does not survive the conversion).
	    """
	    return Image.open(BytesIO(image)).convert("RGB")


	def image_to_bytes(image):
	    """Encode an image as PNG and return the encoded bytes.

	    Args:
	        image: Object exposing ``save(fp, format=...)``; the UI passes PIL images.

	    Returns:
	        The PNG file contents as ``bytes``.
	    """
	    with BytesIO() as png_buffer:
	        image.save(png_buffer, format="PNG")
	        return png_buffer.getvalue()


	def send_request(url, api_key, file, data, timeout=300):
	    """POST a request to a Stability AI endpoint and return the raw response.

	    Args:
	        url: Endpoint URL to post to.
	        api_key: Stability AI API key, sent as a bearer token.
	        file: Mapping handed to ``requests`` as ``files=`` (multipart parts).
	        data: Mapping handed to ``requests`` as ``data=`` (form fields).
	        timeout: Seconds ``requests`` waits for the server before raising a
	            timeout error. Without a timeout a stalled connection would block
	            the worker forever; the default is generous because generation
	            can be slow. Pass ``None`` to wait indefinitely.

	    Returns:
	        The ``requests.Response``. The status code is NOT checked here; callers
	        must inspect it themselves.
	    """
	    request_headers = {"Authorization": f"Bearer {api_key}", "Accept": "image/*"}
	    return requests.post(
	        url,
	        headers=request_headers,
	        files=file,
	        data=data,
	        timeout=timeout,
	    )


	def _api_error_text(response):
	    """Return a readable description of a failed API response."""
	    try:
	        return str(response.json())
	    except ValueError:
	        # The body is not JSON (e.g. an HTML page from a proxy); report the raw
	        # body instead of letting the decode error hide the real failure.
	        return f"HTTP {response.status_code}: {response.text}"


	def _fetch_creative_upscale(generation_id, api_key, poll_interval=10, max_wait=600):
	    """Poll the creative-upscale result endpoint and return the image bytes."""
	    result_url = f"https://api.stability.ai/v2beta/stable-image/upscale/creative/result/{generation_id}"
	    headers = {"accept": "image/*", "authorization": f"Bearer {api_key}"}
	    # Bound the wait so a job that never completes cannot block the worker forever.
	    deadline = time.monotonic() + max_wait
	    while True:
	        result_response = requests.get(result_url, headers=headers, timeout=60)
	        if result_response.status_code == 200:
	            print("Generation complete!")
	            return result_response.content
	        if result_response.status_code != 202:
	            raise Exception(_api_error_text(result_response))
	        # 202 means the job is still running.
	        if time.monotonic() >= deadline:
	            raise TimeoutError(
	                f"Creative upscale did not finish within {max_wait} seconds"
	            )
	        print(f"Generation in-progress, try again in {poll_interval} seconds.")
	        time.sleep(poll_interval)


	def generate(
	    prompt,
	    negative_prompt,
	    seed,
	    mode,
	    submode,
	    input_image,
	    mask,
	    CNstrength,
	    search_prompt,
	    op_left,
	    op_right,
	    op_up,
	    op_down,
	    randomize_seed,
	    aspect,
	    model,
	    preset,
	    api_key,
	):
	    """Call the Stability AI endpoint selected by the UI and return the result.

	    Args:
	        prompt: Text prompt.
	        negative_prompt: Negative text prompt.
	        seed: Seed value from the slider; replaced by 0 when ``randomize_seed``.
	        mode: Selected mode label (a value of ``translations[lang]``).
	        submode: Selected submode label (a value of ``translations[lang]``).
	        input_image: Image to upload, or ``None``. Only sent outside Generate mode.
	        mask: Mask image, or ``None``. Only sent for Erase and Inpaint.
	        CNstrength: Control strength, sent in Control mode.
	        search_prompt: What to look for, sent for Search and Replace.
	        op_left, op_right, op_up, op_down: Outpaint extents, sent for Outpaint.
	        randomize_seed: When true, seed 0 is sent instead of ``seed``.
	        aspect: Aspect ratio string.
	        model: Model label chosen in the UI; selects the Generate endpoint.
	        preset: Style preset, sent only for the Stable Image Core model.
	        api_key: Stability AI API key.

	    Returns:
	        A tuple ``(image, seed, copy_text)``: the decoded PIL image, the seed
	        that was sent, and a one-line summary of the request.

	    Raises:
	        ValueError: Unknown model, or a mode/submode pair with no endpoint.
	        TimeoutError: A creative upscale did not complete in time.
	        Exception: The API answered with a non-success status.
	    """
	    labels = translations[lang]

	    if randomize_seed:
	        # Per the Stability API reference, seed 0 asks the service to pick a
	        # random seed. The same 0 is returned to the UI below.
	        seed = 0

	    data = {
	        "prompt": prompt,
	        "negative_prompt": negative_prompt,
	        "output_format": "png",
	        "seed": seed,
	        "aspect_ratio": aspect,
	    }
	    files = {}
	    url = None
	    is_creative_upscale = False
	    keep_alpha = False

	    if mode == labels["Generate"]:
	        # Empty placeholder part, as in the Stability API examples, so that
	        # requests still encodes the body as multipart/form-data.
	        files["none"] = ""
	        generation_models = {
	            "Stable Image Ultra (8B + workflow)": ("ImageUltra", {}),
	            "Stable Image Core (2B + workflow)": (
	                "ImageCore",
	                {"style_preset": preset},
	            ),
	            "Stable Diffusion 3 Medium (2B)": (
	                "StableDiffusion3",
	                {"model": "sd3-medium"},
	            ),
	            "Stable Diffusion 3 Large (8B)": (
	                "StableDiffusion3",
	                {"model": "sd3-large"},
	            ),
	            "Stable Diffusion 3 Large Turbo (8B Turbo)": (
	                "StableDiffusion3",
	                {"model": "sd3-large-turbo"},
	            ),
	        }
	        if model not in generation_models:
	            raise ValueError("Invalid model type")
	        url_key, extra_fields = generation_models[model]
	        url = model_url[url_key]
	        data.update(extra_fields)
	    else:
	        # The image widget is only hidden, not cleared, when the user switches
	        # back to Generate, so the upload is restricted to image-based modes.
	        if input_image is not None:
	            files["image"] = image_to_bytes(input_image)

	        if mode == labels["Upscale"]:
	            if submode == labels["Conservative"]:
	                url = service_url["Conservative_Upscale"]
	            elif submode == labels["Creative"]:
	                url = service_url["Creative_Upscale"]
	                is_creative_upscale = True

	        elif mode == labels["Edit"]:
	            if submode in (labels["Erase"], labels["Inpaint"]):
	                # The mask widget is only shown for these two submodes; a mask
	                # left over from an earlier run is not sent elsewhere.
	                if mask is not None:
	                    files["mask"] = image_to_bytes(mask)
	                url = service_url[
	                    "Erase" if submode == labels["Erase"] else "Inpaint"
	                ]
	            elif submode == labels["Outpaint"]:
	                url = service_url["Outpaint"]
	                data["left"] = op_left
	                data["right"] = op_right
	                data["up"] = op_up
	                data["down"] = op_down
	            elif submode == labels["Search_and_Replace"]:
	                url = service_url["SR"]
	                data["search_prompt"] = search_prompt
	            elif submode == labels["Remove_Background"]:
	                # Background removal only sends the output format.
	                data = {"output_format": "png"}
	                url = service_url["RMBG"]
	                keep_alpha = True

	        elif mode == labels["Control"]:
	            data["control_strength"] = CNstrength
	            if submode == labels["Sketch"]:
	                url = service_url["Sketch"]
	            elif submode == labels["Structure"]:
	                url = service_url["Structure"]

	    if url is None:
	        raise ValueError(
	            f"Invalid mode/submode combination: {mode!r} / {submode!r}"
	        )

	    response = send_request(url, api_key, files, data)
	    if response.status_code != 200:
	        raise Exception(_api_error_text(response))

	    if is_creative_upscale:
	        # Creative upscale is asynchronous: the first call only returns a job id.
	        generation_id = response.json().get("id")
	        if not generation_id:
	            raise Exception("No generation ID returned for creative upscale")
	        content = _fetch_creative_upscale(generation_id, api_key)
	    else:
	        content = response.content

	    if keep_alpha:
	        # bytes_to_image() converts to RGB, which would discard the transparent
	        # background that is the whole point of background removal.
	        image = Image.open(BytesIO(content)).convert("RGBA")
	    else:
	        image = bytes_to_image(content)

	    copy_filed_value = f"prompt:{prompt}, negative:{negative_prompt}, mode:{mode}, submode:{submode}"
	    return image, seed, copy_filed_value


	# Sample prompts offered by the gr.Examples widget; selecting one fills the
	# prompt textbox.
	examples = [
	"Astronaut in a jungle, cold color palette, muted colors, detailed, 8k",
	"An astronaut riding a green horse",
	"A delicious ceviche cheesecake slice",
	]

	# Custom CSS passed to gr.Blocks: centers the column with elem_id
	# "col-container" and limits it to half the viewport width.
	css = """
	#col-container {
	margin: 0 auto;
	max-width: 50vw;
	}
	"""


	def update_style_visibility(model):
	    """Show the style-preset row only for the Stable Image Core model.

	    Args:
	        model: Model label currently selected in the model dropdown.

	    Returns:
	        A ``gr.update`` setting the row's ``visible`` flag.
	    """
	    is_core_model = model == "Stable Image Core (2B + workflow)"
	    return gr.update(visible=True) if is_core_model else gr.update(visible=False)


	def update_mode(mode):
	    """Adapt the submode dropdown and image widgets to the selected mode.

	    Args:
	        mode: Mode label currently selected (a value of ``translations[lang]``).

	    Returns:
	        Four ``gr.update`` objects, in order: submode dropdown, input image,
	        mask container, input-image label. The mask container is always
	        hidden here; update_submode() is what reveals it.
	    """
	    labels = translations[lang]

	    if mode == labels["Generate"]:
	        # Text-to-image has no submode and no image input; the dropdown is
	        # only hidden, its choices are left untouched.
	        return (
	            gr.update(visible=False),
	            gr.update(visible=False),
	            gr.update(visible=False),
	            gr.update(visible=False),
	        )

	    # Submodes offered by each image-based mode; the first entry is preselected.
	    submodes_by_mode = (
	        (labels["Upscale"], ("Conservative", "Creative")),
	        (
	            labels["Edit"],
	            (
	                "Erase",
	                "Inpaint",
	                "Outpaint",
	                "Search_and_Replace",
	                "Remove_Background",
	            ),
	        ),
	        (labels["Control"], ("Structure", "Sketch")),
	    )
	    for mode_label, submode_keys in submodes_by_mode:
	        if mode == mode_label:
	            options = [labels[key] for key in submode_keys]
	            return (
	                gr.update(choices=options, value=options[0], visible=True),
	                gr.update(visible=True),
	                gr.update(visible=False),
	                gr.update(visible=True),
	            )

	    # Unrecognized mode: reset the dropdown to its placeholder and hide the rest.
	    return (
	        gr.update(choices=["None"], visible=False),
	        gr.update(visible=False),
	        gr.update(visible=False),
	        gr.update(visible=False),
	    )


	def update_submode(submode):
	    """Reveal the extra controls that belong to the selected submode.

	    Args:
	        submode: Submode label currently selected (a value of
	            ``translations[lang]``).

	    Returns:
	        Four ``gr.update`` objects, in order: mask container, outpaint row,
	        control-strength slider, search-prompt textbox. At most one of them is
	        made visible; all others are hidden.
	    """
	    labels = translations[lang]
	    show_mask = show_outpaint = show_strength = show_search = False

	    if submode in (labels["Erase"], labels["Inpaint"]):
	        show_mask = True
	    elif submode == labels["Outpaint"]:
	        show_outpaint = True
	    elif submode in (labels["Structure"], labels["Sketch"]):
	        show_strength = True
	    elif submode == labels["Search_and_Replace"]:
	        show_search = True

	    return (
	        gr.update(visible=show_mask),
	        gr.update(visible=show_outpaint),
	        gr.update(visible=show_strength),
	        gr.update(visible=show_search),
	    )


	# Build the Gradio UI. All visible labels come from translations[lang]; the
	# widgets created here are wired to generate() and the update_* callbacks at
	# the end of this block.
	with gr.Blocks(css=css) as demo: #, theme="NoCrypt/miku") as demo:
	with gr.Column(elem_id="col-container"):
	# Page header.
	gr.Markdown(
	translations[lang]["title"],
	)
	# Collapsed "how to use" section.
	with gr.Accordion(translations[lang]["overview_label"], open=False):
	gr.Markdown(
	translations[lang]["overview"],
	)

	# API key textbox; its value is passed to generate() on every run.
	with gr.Row():
	api_key = gr.Text(
	label=translations[lang]["api_key"],
	type="password",
	placeholder=translations[lang]["api_key_placeholder"],
	max_lines=1,
	container=False,
	)

	with gr.Row():
	# These choice strings are compared literally in generate() and
	# update_style_visibility(); keep them in sync when editing.
	model = gr.Dropdown(
	label=translations[lang]["model_label"],
	choices=[
	"Stable Image Ultra (8B + workflow)",
	"Stable Image Core (2B + workflow)",
	"Stable Diffusion 3 Large Turbo (8B Turbo)",
	"Stable Diffusion 3 Large (8B)",
	"Stable Diffusion 3 Medium (2B)",
	],
	value="Stable Image Ultra (8B + workflow)",
	)
	# Mode choices are the translated labels that generate() and update_mode()
	# compare against.
	mode = gr.Dropdown(
	label=translations[lang]["mode_label"],
	choices=[
	translations[lang]["Generate"],
	translations[lang]["Upscale"],
	translations[lang]["Edit"],
	translations[lang]["Control"],
	],
	value=translations[lang]["Generate"],
	)

	# Hidden placeholder; update_mode() fills in the choices and shows it.
	submode = gr.Dropdown(
	label=translations[lang]["Submode"],
	choices=["None"],
	visible=False,
	value="None",
	)

	with gr.Row():
	with gr.Column():
	prompt = gr.Text(
	label="Prompt",
	show_label=False,
	max_lines=1,
	placeholder=translations[lang]["prompt_placeholder"],
	container=False,
	)
	# Shown by update_submode() for the Search and Replace submode.
	search_prompt = gr.Text(
	label="search prompt",
	visible=False,
	show_label=False,
	max_lines=1,
	placeholder=translations[lang]["Search_prompt_placeholder"],
	)
	run_button = gr.Button(translations[lang]["run_button"], scale=0)
	with gr.Row():
	gr.Examples(
	label=translations[lang]["Example"], examples=examples, inputs=[prompt]
	)
	with gr.Row():
	with gr.Column():
	# Input image and its label start hidden; update_mode() shows them for
	# the image-based modes.
	image_label = gr.Markdown(
	value=translations[lang]["input_image"], visible=False
	)
	image = gr.Image(
	type="pil",
	label="img input",
	width="20vw",
	height="20vw",
	show_label=True,
	visible=False,
	interactive=True,
	container=False,
	)
	# Mask container; update_submode() shows it for Erase and Inpaint.
	with gr.Column(visible=False) as mask:
	mask_label = gr.Markdown(value="input mask")
	mask_input = gr.Image(
	type="pil",
	label="mask",
	width="20vw",
	height="20vw",
	show_label=True,
	interactive=True,
	container=False,
	)

	# Output image returned by generate().
	with gr.Row():
	result = gr.Image(
	label=translations[lang]["result_label"], width="20vw", height="20%"
	)

	with gr.Accordion(translations[lang]["Advanced_Settings"], open=False):
	negative_prompt = gr.Text(
	label=translations[lang]["Negative_prompt"],
	max_lines=1,
	placeholder=translations[lang]["negative_prompt_placeholder"],
	)
	# The seed slider is also an output of generate(), so each run overwrites
	# it with the seed value generate() returns.
	seed = gr.Slider(
	label=translations[lang]["seed_label"],
	minimum=0,
	maximum=MAX_SEED,
	step=1,
	value=0,
	)
	# Shown by update_submode() for the Structure and Sketch submodes.
	CN_strength = gr.Slider(
	label=translations[lang]["Control_Strength"],
	minimum=0,
	maximum=1,
	step=0.01,
	value=0.5,
	visible=False,
	)
	randomize_seed = gr.Checkbox(
	label=translations[lang]["randomize_seed_label"], value=True
	)
	aspect = gr.Radio(
	choices=[
	"1:1",
	"16:9",
	"21:9",
	"2:3",
	"3:2",
	"4:5",
	"5:4",
	"9:16",
	"9:21",
	],
	label=translations[lang]["aspect_label"],
	value="1:1",
	)
	# Style presets; update_style_visibility() shows this row only while the
	# Stable Image Core model is selected.
	with gr.Row(visible=False) as style:
	style_preset = gr.Radio(
	choices=[
	"3d-model",
	"analog-film",
	"anime",
	"cinematic",
	"comic-book",
	"digital-art",
	"enhance",
	"fantasy-art",
	"isometric",
	"line-art",
	"low-poly",
	"modeling-compound",
	"neon-punk",
	"origami",
	"photographic",
	"pixel-art",
	"tile-texture",
	],
	label=translations[lang]["style_preset"],
	value="anime",
	info=translations[lang]["preset_description"],
	)
	# Outpaint extents; update_submode() shows this row for the Outpaint submode.
	# NOTE(review): the heading reads "Outpain Scale" - probably a typo for
	# "Outpaint Scale"; confirm before changing the user-facing text.
	with gr.Row(visible=False) as outpaint_scale:
	paint = gr.Markdown(value="Outpain Scale")
	op_left = gr.Slider(
	label="left", minimum=0, maximum=2000, step=4, value=200
	)
	op_right = gr.Slider(
	label="right", minimum=0, maximum=2000, step=4, value=200
	)
	op_up = gr.Slider(
	label="up", minimum=0, maximum=2000, step=4, value=200
	)
	op_down = gr.Slider(
	label="down", minimum=0, maximum=2000, step=4, value=200
	)

	# Receives the one-line request summary returned by generate().
	copy_filed = gr.TextArea(
	value="",
	label="Copy Field",
	max_lines=1,
	placeholder=translations[lang]["copy_field_placeholder"],
	show_copy_button=True,
	container=False,
	)
	# License notice.
	# NOTE(review): the f-string below has no placeholders, and the
	# [cc-by-nc-shield] link reference is defined but never used in the text.
	gr.Markdown(
	f"""
	## License
	This work is licensed under a
	[Creative Commons Attribution-NonCommercial 4.0 International License][cc-by-nc].

	[![CC BY-NC 4.0][cc-by-nc-image]][cc-by-nc]

	[cc-by-nc]: https://creativecommons.org/licenses/by-nc/4.0/
	[cc-by-nc-image]: https://licensebuttons.net/l/by-nc/4.0/88x31.png
	[cc-by-nc-shield]: https://img.shields.io/badge/License-CC%20BY--NC%204.0-lightgrey.svg

	MIT Licensed Source Code
	Portions of this work are licensed under the MIT License. For more details, please refer to the original source at: [stabilityai/stable-diffusion-3-medium](https://huggingface.co/spaces/stabilityai/stable-diffusion-3-medium)
	"""
	)
	# Run generate() on button click or when Enter is pressed in either prompt
	# box. The order of `inputs` must match generate()'s positional parameters.
	gr.on(
	triggers=[run_button.click, prompt.submit, negative_prompt.submit],
	fn=generate,
	inputs=[
	prompt,
	negative_prompt,
	seed,
	mode,
	submode,
	image,
	mask_input,
	CN_strength,
	search_prompt,
	op_left,
	op_right,
	op_up,
	op_down,
	randomize_seed,
	aspect,
	model,
	style_preset,
	api_key,
	],
	outputs=[result, seed, copy_filed],
	)

	# Visibility wiring: each callback returns one gr.update per listed output,
	# in the same order.
	mode.change(
	fn=update_mode, inputs=mode, outputs=[submode, image, mask, image_label]
	)
	submode.change(
	fn=update_submode,
	inputs=submode,
	outputs=[mask, outpaint_scale, CN_strength, search_prompt],
	)
	model.change(fn=update_style_visibility, inputs=model, outputs=style)
	# Start the Gradio app.
	demo.launch()