Merge branch 'AUTOMATIC1111:master' into draft (263b323d) · Commits · github_fork / Stable Diffusion Webui

README.md

+1 −1

Original line number	Diff line number	Diff line
		@@ -70,7 +70,7 @@ Check the [custom scripts](https://github.com/AUTOMATIC1111/stable-diffusion-web
		- separate prompts using uppercase `AND`
		- also supports weights for prompts: `a cat :1.2 AND a dog AND a penguin :2.2`
		- No token limit for prompts (original stable diffusion lets you use up to 75 tokens)
		- DeepDanbooru integration, creates danbooru style tags for anime prompts (add --deepdanbooru to commandline args)
		- DeepDanbooru integration, creates danbooru style tags for anime prompts
		- [xformers](https://github.com/AUTOMATIC1111/stable-diffusion-webui/wiki/Xformers), major speed increase for select cards: (add --xformers to commandline args)
		- via extension: [History tab](https://github.com/yfszzx/stable-diffusion-webui-images-browser): view, direct and delete images conveniently within the UI
		- Generate forever option

launch.py

+2 −7

Original line number	Diff line number	Diff line
		@@ -134,14 +134,13 @@ def prepare_enviroment():

		gfpgan_package = os.environ.get('GFPGAN_PACKAGE', "git+https://github.com/TencentARC/GFPGAN.git@8d2447a2d918f8eba5a4a01463fd48e45126a379")
		clip_package = os.environ.get('CLIP_PACKAGE', "git+https://github.com/openai/CLIP.git@d50d76daa670286dd6cacf3bcd80b5e4823fc8e1")
		deepdanbooru_package = os.environ.get('DEEPDANBOORU_PACKAGE', "git+https://github.com/KichangKim/DeepDanbooru.git@d91a2963bf87c6a770d74894667e9ffa9f6de7ff")

		xformers_windows_package = os.environ.get('XFORMERS_WINDOWS_PACKAGE', 'https://github.com/C43H66N12O12S2/stable-diffusion-webui/releases/download/f/xformers-0.0.14.dev0-cp310-cp310-win_amd64.whl')

		stable_diffusion_repo = os.environ.get('STABLE_DIFFUSION_REPO', "https://github.com/CompVis/stable-diffusion.git")
		taming_transformers_repo = os.environ.get('TAMING_REANSFORMERS_REPO', "https://github.com/CompVis/taming-transformers.git")
		taming_transformers_repo = os.environ.get('TAMING_TRANSFORMERS_REPO', "https://github.com/CompVis/taming-transformers.git")
		k_diffusion_repo = os.environ.get('K_DIFFUSION_REPO', 'https://github.com/crowsonkb/k-diffusion.git')
		codeformer_repo = os.environ.get('CODEFORMET_REPO', 'https://github.com/sczhou/CodeFormer.git')
		codeformer_repo = os.environ.get('CODEFORMER_REPO', 'https://github.com/sczhou/CodeFormer.git')
		blip_repo = os.environ.get('BLIP_REPO', 'https://github.com/salesforce/BLIP.git')

		stable_diffusion_commit_hash = os.environ.get('STABLE_DIFFUSION_COMMIT_HASH', "69ae4b35e0a0f6ee1af8bb9a5d0016ccb27e36dc")
		@@ -158,7 +157,6 @@ def prepare_enviroment():
		sys.argv, update_check = extract_arg(sys.argv, '--update-check')
		sys.argv, run_tests = extract_arg(sys.argv, '--tests')
		xformers = '--xformers' in sys.argv
		deepdanbooru = '--deepdanbooru' in sys.argv
		ngrok = '--ngrok' in sys.argv

		try:
		@@ -193,9 +191,6 @@ def prepare_enviroment():
		elif platform.system() == "Linux":
		run_pip("install xformers", "xformers")

		if not is_installed("deepdanbooru") and deepdanbooru:
		run_pip(f"install {deepdanbooru_package}#egg=deepdanbooru[tensorflow] tensorflow==2.10.0 tensorflow-io==0.27.0", "deepdanbooru")

		if not is_installed("pyngrok") and ngrok:
		run_pip("install pyngrok", "ngrok")

modules/api/api.py

+58 −52

Original line number	Diff line number	Diff line
		@@ -5,19 +5,19 @@ import uvicorn
		from threading import Lock
		from gradio.processing_utils import encode_pil_to_base64, decode_base64_to_file, decode_base64_to_image
		from fastapi import APIRouter, Depends, FastAPI, HTTPException
		from fastapi.security import HTTPBasic, HTTPBasicCredentials
		from secrets import compare_digest

		import modules.shared as shared
		from modules import sd_samplers, deepbooru
		from modules.api.models import *
		from modules.processing import StableDiffusionProcessingTxt2Img, StableDiffusionProcessingImg2Img, process_images
		from modules.sd_samplers import all_samplers
		from modules.extras import run_extras, run_pnginfo
		from PIL import PngImagePlugin
		from modules.sd_models import checkpoints_list
		from modules.realesrgan_model import get_realesrgan_models
		from typing import List

		if shared.cmd_opts.deepdanbooru:
		from modules.deepbooru import get_deepbooru_tags

		def upscaler_to_index(name: str):
		try:
		return [x.name.lower() for x in shared.sd_upscalers].index(name.lower())
		@@ -25,8 +25,12 @@ def upscaler_to_index(name: str):
		raise HTTPException(status_code=400, detail=f"Invalid upscaler, needs to be on of these: {' , '.join([x.name for x in sd_upscalers])}")


		sampler_to_index = lambda name: next(filter(lambda row: name.lower() == row[1].name.lower(), enumerate(all_samplers)), None)
		def validate_sampler_name(name):
		config = sd_samplers.all_samplers_map.get(name, None)
		if config is None:
		raise HTTPException(status_code=404, detail="Sampler not found")

		return name

		def setUpscalers(req: dict):
		reqDict = vars(req)
		@@ -57,39 +61,53 @@ def encode_pil_to_base64(image):

		class Api:
		def __init__(self, app: FastAPI, queue_lock: Lock):
		if shared.cmd_opts.api_auth:
		self.credenticals = dict()
		for auth in shared.cmd_opts.api_auth.split(","):
		user, password = auth.split(":")
		self.credenticals[user] = password

		self.router = APIRouter()
		self.app = app
		self.queue_lock = queue_lock
		self.app.add_api_route("/sdapi/v1/txt2img", self.text2imgapi, methods=["POST"], response_model=TextToImageResponse)
		self.app.add_api_route("/sdapi/v1/img2img", self.img2imgapi, methods=["POST"], response_model=ImageToImageResponse)
		self.app.add_api_route("/sdapi/v1/extra-single-image", self.extras_single_image_api, methods=["POST"], response_model=ExtrasSingleImageResponse)
		self.app.add_api_route("/sdapi/v1/extra-batch-images", self.extras_batch_images_api, methods=["POST"], response_model=ExtrasBatchImagesResponse)
		self.app.add_api_route("/sdapi/v1/png-info", self.pnginfoapi, methods=["POST"], response_model=PNGInfoResponse)
		self.app.add_api_route("/sdapi/v1/progress", self.progressapi, methods=["GET"], response_model=ProgressResponse)
		self.app.add_api_route("/sdapi/v1/interrogate", self.interrogateapi, methods=["POST"])
		self.app.add_api_route("/sdapi/v1/interrupt", self.interruptapi, methods=["POST"])
		self.app.add_api_route("/sdapi/v1/options", self.get_config, methods=["GET"], response_model=OptionsModel)
		self.app.add_api_route("/sdapi/v1/options", self.set_config, methods=["POST"])
		self.app.add_api_route("/sdapi/v1/cmd-flags", self.get_cmd_flags, methods=["GET"], response_model=FlagsModel)
		self.app.add_api_route("/sdapi/v1/samplers", self.get_samplers, methods=["GET"], response_model=List[SamplerItem])
		self.app.add_api_route("/sdapi/v1/upscalers", self.get_upscalers, methods=["GET"], response_model=List[UpscalerItem])
		self.app.add_api_route("/sdapi/v1/sd-models", self.get_sd_models, methods=["GET"], response_model=List[SDModelItem])
		self.app.add_api_route("/sdapi/v1/hypernetworks", self.get_hypernetworks, methods=["GET"], response_model=List[HypernetworkItem])
		self.app.add_api_route("/sdapi/v1/face-restorers", self.get_face_restorers, methods=["GET"], response_model=List[FaceRestorerItem])
		self.app.add_api_route("/sdapi/v1/realesrgan-models", self.get_realesrgan_models, methods=["GET"], response_model=List[RealesrganItem])
		self.app.add_api_route("/sdapi/v1/prompt-styles", self.get_promp_styles, methods=["GET"], response_model=List[PromptStyleItem])
		self.app.add_api_route("/sdapi/v1/artist-categories", self.get_artists_categories, methods=["GET"], response_model=List[str])
		self.app.add_api_route("/sdapi/v1/artists", self.get_artists, methods=["GET"], response_model=List[ArtistItem])
		self.add_api_route("/sdapi/v1/txt2img", self.text2imgapi, methods=["POST"], response_model=TextToImageResponse)
		self.add_api_route("/sdapi/v1/img2img", self.img2imgapi, methods=["POST"], response_model=ImageToImageResponse)
		self.add_api_route("/sdapi/v1/extra-single-image", self.extras_single_image_api, methods=["POST"], response_model=ExtrasSingleImageResponse)
		self.add_api_route("/sdapi/v1/extra-batch-images", self.extras_batch_images_api, methods=["POST"], response_model=ExtrasBatchImagesResponse)
		self.add_api_route("/sdapi/v1/png-info", self.pnginfoapi, methods=["POST"], response_model=PNGInfoResponse)
		self.add_api_route("/sdapi/v1/progress", self.progressapi, methods=["GET"], response_model=ProgressResponse)
		self.add_api_route("/sdapi/v1/interrogate", self.interrogateapi, methods=["POST"])
		self.add_api_route("/sdapi/v1/interrupt", self.interruptapi, methods=["POST"])
		self.add_api_route("/sdapi/v1/skip", self.skip, methods=["POST"])
		self.add_api_route("/sdapi/v1/options", self.get_config, methods=["GET"], response_model=OptionsModel)
		self.add_api_route("/sdapi/v1/options", self.set_config, methods=["POST"])
		self.add_api_route("/sdapi/v1/cmd-flags", self.get_cmd_flags, methods=["GET"], response_model=FlagsModel)
		self.add_api_route("/sdapi/v1/samplers", self.get_samplers, methods=["GET"], response_model=List[SamplerItem])
		self.add_api_route("/sdapi/v1/upscalers", self.get_upscalers, methods=["GET"], response_model=List[UpscalerItem])
		self.add_api_route("/sdapi/v1/sd-models", self.get_sd_models, methods=["GET"], response_model=List[SDModelItem])
		self.add_api_route("/sdapi/v1/hypernetworks", self.get_hypernetworks, methods=["GET"], response_model=List[HypernetworkItem])
		self.add_api_route("/sdapi/v1/face-restorers", self.get_face_restorers, methods=["GET"], response_model=List[FaceRestorerItem])
		self.add_api_route("/sdapi/v1/realesrgan-models", self.get_realesrgan_models, methods=["GET"], response_model=List[RealesrganItem])
		self.add_api_route("/sdapi/v1/prompt-styles", self.get_promp_styles, methods=["GET"], response_model=List[PromptStyleItem])
		self.add_api_route("/sdapi/v1/artist-categories", self.get_artists_categories, methods=["GET"], response_model=List[str])
		self.add_api_route("/sdapi/v1/artists", self.get_artists, methods=["GET"], response_model=List[ArtistItem])

		def add_api_route(self, path: str, endpoint, **kwargs):
		if shared.cmd_opts.api_auth:
		return self.app.add_api_route(path, endpoint, dependencies=[Depends(self.auth)], **kwargs)
		return self.app.add_api_route(path, endpoint, **kwargs)

		def auth(self, credenticals: HTTPBasicCredentials = Depends(HTTPBasic())):
		if credenticals.username in self.credenticals:
		if compare_digest(credenticals.password, self.credenticals[credenticals.username]):
		return True

		raise HTTPException(status_code=401, detail="Incorrect username or password", headers={"WWW-Authenticate": "Basic"})

		def text2imgapi(self, txt2imgreq: StableDiffusionTxt2ImgProcessingAPI):
		sampler_index = sampler_to_index(txt2imgreq.sampler_index)

		if sampler_index is None:
		raise HTTPException(status_code=404, detail="Sampler not found")

		populate = txt2imgreq.copy(update={ # Override __init__ params
		"sd_model": shared.sd_model,
		"sampler_index": sampler_index[0],
		"sampler_name": validate_sampler_name(txt2imgreq.sampler_index),
		"do_not_save_samples": True,
		"do_not_save_grid": True
		}
		@@ -109,12 +127,6 @@ class Api:
		return TextToImageResponse(images=b64images, parameters=vars(txt2imgreq), info=processed.js())

		def img2imgapi(self, img2imgreq: StableDiffusionImg2ImgProcessingAPI):
		sampler_index = sampler_to_index(img2imgreq.sampler_index)

		if sampler_index is None:
		raise HTTPException(status_code=404, detail="Sampler not found")


		init_images = img2imgreq.init_images
		if init_images is None:
		raise HTTPException(status_code=404, detail="Init image not found")
		@@ -123,10 +135,9 @@ class Api:
		if mask:
		mask = decode_base64_to_image(mask)


		populate = img2imgreq.copy(update={ # Override __init__ params
		"sd_model": shared.sd_model,
		"sampler_index": sampler_index[0],
		"sampler_name": validate_sampler_name(img2imgreq.sampler_index),
		"do_not_save_samples": True,
		"do_not_save_grid": True,
		"mask": mask
		@@ -231,10 +242,7 @@ class Api:
		if interrogatereq.model == "clip":
		processed = shared.interrogator.interrogate(img)
		elif interrogatereq.model == "deepdanbooru":
		if shared.cmd_opts.deepdanbooru:
		processed = get_deepbooru_tags(img)
		else:
		raise HTTPException(status_code=404, detail="Model not found. Add --deepdanbooru when launching for using the model.")
		processed = deepbooru.model.tag(img)
		else:
		raise HTTPException(status_code=404, detail="Model not found")

		@@ -245,6 +253,9 @@ class Api:

		return {}

		def skip(self):
		shared.state.skip()

		def get_config(self):
		options = {}
		for key in shared.opts.data.keys():
		@@ -256,14 +267,9 @@ class Api:

		return options

		def set_config(self, req: OptionsModel):
		# currently req has all options fields even if you send a dict like { "send_seed": false }, which means it will
		# overwrite all options with default values.
		raise RuntimeError('Setting options via API is not supported')

		reqDict = vars(req)
		for o in reqDict:
		setattr(shared.opts, o, reqDict[o])
		def set_config(self, req: Dict[str, Any]):
		for k, v in req.items():
		shared.opts.set(k, v)

		shared.opts.save(shared.config_filename)
		return
		@@ -272,7 +278,7 @@ class Api:
		return vars(shared.cmd_opts)

		def get_samplers(self):
		return [{"name":sampler[0], "aliases":sampler[2], "options":sampler[3]} for sampler in all_samplers]
		return [{"name": sampler[0], "aliases":sampler[2], "options":sampler[3]} for sampler in sd_samplers.all_samplers]

		def get_upscalers(self):
		upscalers = []

modules/api/models.py

+3 −3

Original line number	Diff line number	Diff line
		@@ -176,9 +176,9 @@ class InterrogateResponse(BaseModel):
		caption: str = Field(default=None, title="Caption", description="The generated caption for the image.")

		fields = {}
		for key, value in opts.data.items():
		metadata = opts.data_labels.get(key)
		optType = opts.typemap.get(type(value), type(value))
		for key, metadata in opts.data_labels.items():
		value = opts.data.get(key)
		optType = opts.typemap.get(type(metadata.default), type(value))

		if (metadata is not None):
		fields.update({key: (Optional[optType], Field(

modules/deepbooru.py

+91 −167

Original line number	Diff line number	Diff line
		import os.path
		from concurrent.futures import ProcessPoolExecutor
		import multiprocessing
		import time
		import os
		import re

		import torch
		from PIL import Image
		import numpy as np

		from modules import modelloader, paths, deepbooru_model, devices, images, shared

		re_special = re.compile(r'([\\()])')

		def get_deepbooru_tags(pil_image):
		"""
		This method is for running only one image at a time for simple use. Used to the img2img interrogate.
		"""
		from modules import shared # prevents circular reference

		try:
		create_deepbooru_process(shared.opts.interrogate_deepbooru_score_threshold, create_deepbooru_opts())
		return get_tags_from_process(pil_image)
		finally:
		release_process()


		OPT_INCLUDE_RANKS = "include_ranks"
		def create_deepbooru_opts():
		from modules import shared

		return {
		"use_spaces": shared.opts.deepbooru_use_spaces,
		"use_escape": shared.opts.deepbooru_escape,
		"alpha_sort": shared.opts.deepbooru_sort_alpha,
		OPT_INCLUDE_RANKS: shared.opts.interrogate_return_ranks,
		}


		def deepbooru_process(queue, deepbooru_process_return, threshold, deepbooru_opts):
		model, tags = get_deepbooru_tags_model()
		while True: # while process is running, keep monitoring queue for new image
		pil_image = queue.get()
		if pil_image == "QUIT":
		break
		else:
		deepbooru_process_return["value"] = get_deepbooru_tags_from_model(model, tags, pil_image, threshold, deepbooru_opts)


		def create_deepbooru_process(threshold, deepbooru_opts):
		"""
		Creates deepbooru process. A queue is created to send images into the process. This enables multiple images
		to be processed in a row without reloading the model or creating a new process. To return the data, a shared
		dictionary is created to hold the tags created. To wait for tags to be returned, a value of -1 is assigned
		to the dictionary and the method adding the image to the queue should wait for this value to be updated with
		the tags.
		"""
		from modules import shared # prevents circular reference
		context = multiprocessing.get_context("spawn")
		shared.deepbooru_process_manager = context.Manager()
		shared.deepbooru_process_queue = shared.deepbooru_process_manager.Queue()
		shared.deepbooru_process_return = shared.deepbooru_process_manager.dict()
		shared.deepbooru_process_return["value"] = -1
		shared.deepbooru_process = context.Process(target=deepbooru_process, args=(shared.deepbooru_process_queue, shared.deepbooru_process_return, threshold, deepbooru_opts))
		shared.deepbooru_process.start()


		def get_tags_from_process(image):
		from modules import shared

		shared.deepbooru_process_return["value"] = -1
		shared.deepbooru_process_queue.put(image)
		while shared.deepbooru_process_return["value"] == -1:
		time.sleep(0.2)
		caption = shared.deepbooru_process_return["value"]
		shared.deepbooru_process_return["value"] = -1

		return caption


		def release_process():
		"""
		Stops the deepbooru process to return used memory
		"""
		from modules import shared # prevents circular reference
		shared.deepbooru_process_queue.put("QUIT")
		shared.deepbooru_process.join()
		shared.deepbooru_process_queue = None
		shared.deepbooru_process = None
		shared.deepbooru_process_return = None
		shared.deepbooru_process_manager = None

		def get_deepbooru_tags_model():
		import deepdanbooru as dd
		import tensorflow as tf
		import numpy as np
		this_folder = os.path.dirname(__file__)
		model_path = os.path.abspath(os.path.join(this_folder, '..', 'models', 'deepbooru'))
		if not os.path.exists(os.path.join(model_path, 'project.json')):
		# there is no point importing these every time
		import zipfile
		from basicsr.utils.download_util import load_file_from_url
		load_file_from_url(
		r"https://github.com/KichangKim/DeepDanbooru/releases/download/v3-20211112-sgd-e28/deepdanbooru-v3-20211112-sgd-e28.zip",
		model_path)
		with zipfile.ZipFile(os.path.join(model_path, "deepdanbooru-v3-20211112-sgd-e28.zip"), "r") as zip_ref:
		zip_ref.extractall(model_path)
		os.remove(os.path.join(model_path, "deepdanbooru-v3-20211112-sgd-e28.zip"))

		tags = dd.project.load_tags_from_project(model_path)
		model = dd.project.load_model_from_project(
		model_path, compile_model=False
		)
		return model, tags

		class DeepDanbooru:
		def __init__(self):
		self.model = None

		def get_deepbooru_tags_from_model(model, tags, pil_image, threshold, deepbooru_opts):
		import deepdanbooru as dd
		import tensorflow as tf
		import numpy as np
		def load(self):
		if self.model is not None:
		return

		alpha_sort = deepbooru_opts['alpha_sort']
		use_spaces = deepbooru_opts['use_spaces']
		use_escape = deepbooru_opts['use_escape']
		include_ranks = deepbooru_opts['include_ranks']

		width = model.input_shape[2]
		height = model.input_shape[1]
		image = np.array(pil_image)
		image = tf.image.resize(
		image,
		size=(height, width),
		method=tf.image.ResizeMethod.AREA,
		preserve_aspect_ratio=True,
		files = modelloader.load_models(
		model_path=os.path.join(paths.models_path, "torch_deepdanbooru"),
		model_url='https://github.com/AUTOMATIC1111/TorchDeepDanbooru/releases/download/v1/model-resnet_custom_v3.pt',
		ext_filter=".pt",
		download_name='model-resnet_custom_v3.pt',
		)
		image = image.numpy() # EagerTensor to np.array
		image = dd.image.transform_and_pad_image(image, width, height)
		image = image / 255.0
		image_shape = image.shape
		image = image.reshape((1, image_shape[0], image_shape[1], image_shape[2]))

		y = model.predict(image)[0]
		self.model = deepbooru_model.DeepDanbooruModel()
		self.model.load_state_dict(torch.load(files[0], map_location="cpu"))

		result_dict = {}
		self.model.eval()
		self.model.to(devices.cpu, devices.dtype)

		for i, tag in enumerate(tags):
		result_dict[tag] = y[i]
		def start(self):
		self.load()
		self.model.to(devices.device)

		def stop(self):
		if not shared.opts.interrogate_keep_models_in_memory:
		self.model.to(devices.cpu)
		devices.torch_gc()

		def tag(self, pil_image):
		self.start()
		res = self.tag_multi(pil_image)
		self.stop()

		return res

		def tag_multi(self, pil_image, force_disable_ranks=False):
		threshold = shared.opts.interrogate_deepbooru_score_threshold
		use_spaces = shared.opts.deepbooru_use_spaces
		use_escape = shared.opts.deepbooru_escape
		alpha_sort = shared.opts.deepbooru_sort_alpha
		include_ranks = shared.opts.interrogate_return_ranks and not force_disable_ranks

		pic = images.resize_image(2, pil_image.convert("RGB"), 512, 512)
		a = np.expand_dims(np.array(pic, dtype=np.float32), 0) / 255

		with torch.no_grad(), devices.autocast():
		x = torch.from_numpy(a).cuda()
		y = self.model(x)[0].detach().cpu().numpy()

		probability_dict = {}

		for tag, probability in zip(self.model.tags, y):
		if probability < threshold:
		continue

		unsorted_tags_in_theshold = []
		result_tags_print = []
		for tag in tags:
		if result_dict[tag] >= threshold:
		if tag.startswith("rating:"):
		continue
		unsorted_tags_in_theshold.append((result_dict[tag], tag))
		result_tags_print.append(f'{result_dict[tag]} {tag}')

		# sort tags
		result_tags_out = []
		sort_ndx = 0
		probability_dict[tag] = probability

		if alpha_sort:
		sort_ndx = 1
		tags = sorted(probability_dict)
		else:
		tags = [tag for tag, _ in sorted(probability_dict.items(), key=lambda x: -x[1])]

		res = []

		# sort by reverse by likelihood and normal for alpha, and format tag text as requested
		unsorted_tags_in_theshold.sort(key=lambda y: y[sort_ndx], reverse=(not alpha_sort))
		for weight, tag in unsorted_tags_in_theshold:
		for tag in tags:
		probability = probability_dict[tag]
		tag_outformat = tag
		if use_spaces:
		tag_outformat = tag_outformat.replace('_', ' ')
		if use_escape:
		tag_outformat = re.sub(re_special, r'\\\1', tag_outformat)
		if include_ranks:
		tag_outformat = f"({tag_outformat}:{weight:.3f})"
		tag_outformat = f"({tag_outformat}:{probability:.3f})"

		res.append(tag_outformat)

		result_tags_out.append(tag_outformat)
		return ", ".join(res)

		print('\n'.join(sorted(result_tags_print, reverse=True)))

		return ', '.join(result_tags_out)
		model = DeepDanbooru()

Admin message