# coding=utf-8
# Copyright 2022 The HuggingFace Inc. team.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
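"""Convert Stable Diffusion checkpoints to Diffusers format and back.

Two small convenience classes wrap the load/save helpers in ``model_util``:
``Convert_SD_to_Diffusers`` turns a single-file checkpoint into a Diffusers
model directory, and ``Convert_Diffusers_to_SD`` does the reverse. Each class
runs its conversion from ``__init__``, so instantiating it does the work.
"""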
import os

import torch

try:
    from omegaconf import OmegaConf  # noqa: F401
except ImportError:
    raise ImportError(
        "OmegaConf is required to convert the LDM checkpoints. Please install it with `pip install omegaconf`."
    )
from diffusers import DiffusionPipeline, UNet2DConditionModel
import model_util  # local helper providing the actual SD <-> Diffusers load/save routines

class Convert_SD_to_Diffusers:
    """Convert a single-file Stable Diffusion checkpoint into a Diffusers model directory.

    Several constructor arguments (img_size, original_config_file, extract_ema,
    num_in_channels, pipeline_type, scheduler_type, sd_version, half) are accepted
    for interface compatibility but are not used by this conversion path.
    """

    def __init__(self, checkpoint_path, output_path, prediction_type=None, img_size=None,
                 original_config_file=None, extract_ema=False, num_in_channels=None,
                 pipeline_type=None, scheduler_type=None, sd_version=None, half=None,
                 version=None):
        self.checkpoint_path = checkpoint_path
        self.output_path = output_path
        self.prediction_type = prediction_type
        self.img_size = img_size
        self.original_config_file = original_config_file
        self.extract_ema = extract_ema
        self.num_in_channels = num_in_channels
        self.pipeline_type = pipeline_type
        self.scheduler_type = scheduler_type
        self.sd_version = sd_version
        self.half = half
        self.version = version
        self.main()

    def main(self):
        # The original code raised a NameError when version was neither 'v1' nor 'v2';
        # default to v1 behavior unless 'v2' is requested explicitly.
        is_v2 = self.version == 'v2'
        prediction_type = self.prediction_type

        # Pick the Diffusers repo whose scheduler/tokenizer configs match the checkpoint.
        reference_diffusers_model = None
        if is_v2 and prediction_type == 'vprediction':
            reference_diffusers_model = 'stabilityai/stable-diffusion-2'
        elif is_v2 and prediction_type == 'epsilon':
            reference_diffusers_model = 'stabilityai/stable-diffusion-2-base'
        elif not is_v2 and prediction_type == 'epsilon':
            reference_diffusers_model = 'runwayml/stable-diffusion-v1-5'

        print(f"loading model from: {self.checkpoint_path}")
        text_encoder, vae, unet = model_util.load_models_from_stable_diffusion_checkpoint(
            is_v2, self.checkpoint_path
        )
        print(f"copy scheduler/tokenizer config from: {reference_diffusers_model}")
        model_util.save_diffusers_checkpoint(
            is_v2, self.output_path, text_encoder, unet, reference_diffusers_model, vae
        )
        print("Diffusers model saved.")

class Convert_Diffusers_to_SD:
    """Convert a Diffusers model directory back into a single-file Stable Diffusion checkpoint."""

    def __init__(self, model_path=None, output_path=None):
        self.model_path = model_path
        self.output_path = output_path
        self.main()

    def main(self):
        global_step = None
        epoch = None
        dtype = torch.float32

        pipe = DiffusionPipeline.from_pretrained(
            self.model_path, torch_dtype=dtype, tokenizer=None, safety_checker=None
        )
        text_encoder = pipe.text_encoder
        vae = pipe.vae

        # Prefer the EMA weights if the training run saved a separate "ema_unet" subfolder.
        if os.path.exists(os.path.join(self.model_path, "ema_unet")):
            pipe.unet = UNet2DConditionModel.from_pretrained(
                self.model_path, subfolder="ema_unet", torch_dtype=dtype
            )
        unet = pipe.unet

        # SD v2 UNets condition on 1024-dim text embeddings; v1 models use 768.
        v2_model = unet.config.cross_attention_dim == 1024

        original_model = None
        key_count = model_util.save_stable_diffusion_checkpoint(
            v2_model, self.output_path, text_encoder, unet, original_model,
            epoch, global_step, dtype, vae
        )
        print(f"Saved model. Converted {key_count} keys.")
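
# A minimal usage sketch. The file/directory paths below are hypothetical
# placeholders; adjust them to your checkpoint and output locations.
if __name__ == "__main__":
    # Single-file checkpoint -> Diffusers model directory.
    Convert_SD_to_Diffusers(
        checkpoint_path="model.ckpt",        # hypothetical input checkpoint
        output_path="diffusers_model",       # hypothetical output directory
        prediction_type="epsilon",
        version="v1",
    )
    # Diffusers model directory -> single-file checkpoint.
    Convert_Diffusers_to_SD(
        model_path="diffusers_model",        # hypothetical Diffusers directory
        output_path="converted_model.ckpt",  # hypothetical output checkpoint
    )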