import os import random import numpy as np import gradio as gr import base64 from io import BytesIO import PIL.Image from typing import Tuple from novita_client import NovitaClient, InstantIDControlnetUnit, InstantIDLora from time import time import datetime from style_template import styles # global variable MAX_SEED = np.iinfo(np.int32).max STYLE_NAMES = list(styles.keys()) DEFAULT_STYLE_NAME = '(No style)' DEFAULT_MODEL_NAME = 'sdxlUnstableDiffusers_v8HEAVENSWRATH_133813' enable_lcm_arg = False # Path to InstantID models face_adapter = f'./checkpoints/ip-adapter.bin' controlnet_path = f'./checkpoints/ControlNetModel' # controlnet-pose/canny/depth controlnet_pose_model = 'thibaud/controlnet-openpose-sdxl-1.0' controlnet_canny_model = 'diffusers/controlnet-canny-sdxl-1.0' controlnet_depth_model = 'diffusers/controlnet-depth-sdxl-1.0-small' SDXL_MODELS = [ "albedobaseXL_v04_130099", "altxl_v60_146691", "animagineXLV3_v30_231047", "animeArtDiffusionXL_alpha2_91872", "animeArtDiffusionXL_alpha3_93120", "animeIllustDiffusion_v04_117809", "breakdomainxl_V05g_124265", "brixlAMustInYour_v40Dagobah_145992", "cinemaxAlphaSDXLCinema_alpha1_107473", "cineroXLPhotomatic_v12aPHENO_137703", "clearhungAnimeXL_v10_117716", "copaxTimelessxlSDXL1_colorfulV2_100729", "counterfeitxl_v10_108721", "counterfeitxl__98184", "crystalClearXL_ccxl_97637", "dreamshaperXL09Alpha_alpha2Xl10_91562", "dynavisionXLAllInOneStylized_alpha036FP16Bakedvae_99980", "dynavisionXLAllInOneStylized_beta0411Bakedvae_109970", "dynavisionXLAllInOneStylized_release0534bakedvae_129001", "fenrisxl_145_134980", "foddaxlPhotorealism_v45_122788", "formulaxl_v10_104889", "juggernautXL_v8Rundiffusion_227002", "juggernautXL_version2_113240", "juggernautXL_version5_126522", "kohakuXL_alpha7_111843", "LahMysteriousSDXL_v40_122478", "leosamsHelloworldSDXLModel_helloworldSDXL10_112178", "leosamsHelloworldSDXL_helloworldSDXL50_268813", "mbbxlUltimate_v10RC_94686", "moefusionSDXL_v10_114018", "nightvisionXLPhotorealisticPortrait_beta0681Bakedvae_108833", "nightvisionXLPhotorealisticPortrait_beta0702Bakedvae_113098", "nightvisionXLPhotorealisticPortrait_release0770Bakedvae_154525", "novaPrimeXL_v10_107899", "pixelwave_v10_117722", "protovisionXLHighFidelity3D_beta0520Bakedvae_106612", "protovisionXLHighFidelity3D_release0620Bakedvae_131308", "protovisionXLHighFidelity3D_release0630Bakedvae_154359", "protovisionXLHighFidelity3D_releaseV660Bakedvae_207131", "realismEngineSDXL_v05b_131513", "realismEngineSDXL_v10_136287", "realisticStockPhoto_v10_115618", "RealitiesEdgeXL_4_122673", "realvisxlV20_v20Bakedvae_129156", "riotDiffusionXL_v20_139293", "roxl_v10_109354", "sdxlNijiSpecial_sdxlNijiSE_115638", "sdxlNijiV3_sdxlNijiV3_104571", "sdxlNijiV51_sdxlNijiV51_112807", "sdxlUnstableDiffusers_v8HEAVENSWRATH_133813", "sdxlYamersAnimeUltra_yamersAnimeV3_121537", "sd_xl_base_0.9", "sd_xl_base_1.0", "shikianimexl_v10_93788", "theTalosProject_v10_117893", "thinkdiffusionxl_v10_145931", "voidnoisecorexl_r1486_150780", "wlopArienwlopstylexl_v10_101973", "wlopSTYLEXL_v2_126171", "xl13AsmodeusSFWNSFW_v22BakedVAE_111954", "xxmix9realisticsdxl_v10_123235", "zavychromaxl_b2_103298", "toonSphere3D_v10_252626", "pixelArtDiffusionXL_spriteShaper_291175", "SDXLPixelArtBase_v10_246513", "animeRealisticXL_animeXLReal_211225", "animeChangefulXL_v10ReleasedCandidate_96351", "realisticMixXL_v10_288901", ] LORA_MODELS = [ "DI_belle_delphine_sdxl_v1_93586", #"NsfwPovAllInOneLoraSdxl-000009MINI_120545", "NsfwPovAllInOneLoraSdxl-000009_120561", "acidzlime-sdxl_154149", "add-detail-xl_99264", "bwporcelaincd_xl-000007_124344", "concept_pov_dt_xl2-000020_119643", "epoxy_skull-sdxl_153213", "landscape-painting-sdxl_v2_111037", "polyhedron_all_sdxl-000004_110557", "ral-beer-sdxl_235173", "ral-wtchz-sdxl_233487", "sdxl_cute_social_comic-000002_107980", "sdxl_glass_136034", "sdxl_lightning_2step_lora", "sdxl_lightning_4step_lora", "sdxl_lightning_8step_lora", "sdxl_offset_example_v10_113006", "sdxl_wrong_lora", "xl_more_art-full_v1_113467", "xl_yoshiaki_kawajiri_v1r64_126468", "AmiguramiRedmond-Crochet-Amigurumi_312819", "zwuul-sdxl_162249", "羊毛毡_119309", "Clay Animation_114757", "CLAYMATE_V2.03__182497", "ClayAnimationRedm_119998", "mosaic_110562", "hjsocrealmosaic_v10xl_158107", "jadecarvingcd_xl-000007_185347", "jade_125785", "SDXL1.0_Essenz-series-by-AI_Characters_Style_YourNameWeatheringWithYouSuzumeMakotoShinkai-v1.4-'Skynet'_195187", "pixel-art-xl-v1.1_99321", "OWStyleYeiyeiArt-8_210248", "yen_w3_sdxl_3000_95299", "EnvyEleganceXL01_170674", "Van_gogh_by_DevDope-000014_272552", "vincent_van_gogh_xl_98658", "tbh123-sdxl_422666", "AutumnStyleXL_152042", "shadows_281564", "cybepunk_261064", "Neon_Cyberpunk_SDXL_Dwarves_248422", "Neon_Cyberpunk_Headoverlay_SDXL_435708", "cyberpunk_xl-000004_410262", "Halcyon Cyberpunk Style_357239", "HLMCoreyAnimagine_242097", "GTA_VI_Style_203190", "oil-painting-style_A3.1_XL-9_418884", "oil painting_92815", "youhua_97640", "Realistic_Insta_InfluencerV1.0_340126", "Origami_World-000005_129203", "ORIGAMI_115169", "ral-orgmi-sdxl_179458", "MJMangaSDXL_280228", "Original video animation style_365023", "Nier_Automata_2B_White_Wedding_Dress_Bride_Cosplay_Realistic_LoRA_349884", "sl_sila_94476", "Ariel_the_Mermaid_XL_157225", "mermaidXL_143722", "EnvyFairyQueenXL01_114606", "童话绘本-Arien奇幻风格_v1.0_134091", "high_elf_archer_v0.0.1_102856", "DreamARTSDXL_100272", "harry_potter_v1_269226", "arwen_prodigy_sdxl_3300_235876", "2ellie-000003_184345", "bella_ramsey_sdxl_190746", "sketch_for_art_examination_166045", "traditional_watercolor_painting_137593", "watercolor_204560", "EnvyAnimeWatercolorXL01_199536", "vampire teeth v3_255457", "SDXL_Superhero_287891", "CyborgsXL_227686", "Astro_Life_132655", "ral-czmcrnbw-sdxl_252438", "EnvyScifiStreamlineXL01_204968", "PixarXL_162719", "chibistylexl-v1-2_99955", "gldnglry_203448", "NeonifyV2-4Extreme_99051", "fflix-npt_294031", "Dhevv-FantasyEgyptClothesXL_397565", "xl0918ice-water_124998", ] CONTROLNET_DICT = dict( pose=InstantIDControlnetUnit( model_name='controlnet-openpose-sdxl-1.0', strength=1, preprocessor='openpose', ), canny=InstantIDControlnetUnit( model_name='controlnet-canny-sdxl-1.0', strength=1, preprocessor='canny', ), depth=InstantIDControlnetUnit( model_name='controlnet-depth-sdxl-1.0', strength=1, preprocessor='depth', ), lineart=InstantIDControlnetUnit( model_name='controlnet-softedge-sdxl-1.0', strength=1, preprocessor='lineart', ), ) last_check = 0 def get_novita_client (novita_key): client = NovitaClient(novita_key, os.getenv('NOVITA_API_URI', None)) return client get_local_storage = ''' function () { globalThis.setStorage = (key, value)=>{ localStorage.setItem(key, JSON.stringify(value)) } globalThis.getStorage = (key, value)=>{ return JSON.parse(localStorage.getItem(key)) } const novita_key = getStorage("novita_key") return [novita_key]; } ''' def toggle_lcm_ui (value): if value: return ( gr.update(minimum=0, maximum=100, step=1, value=5), gr.update(minimum=0.1, maximum=20.0, step=0.1, value=1.5), ) else: return ( gr.update(minimum=5, maximum=100, step=1, value=30), gr.update(minimum=0.1, maximum=20.0, step=0.1, value=5), ) def randomize_seed_fn (seed: int, randomize_seed: bool) -> int: if randomize_seed: seed = random.randint(0, MAX_SEED) return seed def remove_tips (): return gr.update(visible=False) def apply_style (style_name: str, positive: str, negative: str = "") -> Tuple[str, str]: p, n = styles.get(style_name, styles[DEFAULT_STYLE_NAME]) return p.replace("{prompt}", positive), n + " " + negative def get_example (): case = [ [ './examples/yann-lecun_resize.jpg', None, 'a man', 'Spring Festival', '(lowres, low quality, worst quality:1.2), (text:1.2), watermark, (frame:1.2), deformed, ugly, deformed eyes, blur, out of focus, blurry, deformed cat, deformed, photo, anthropomorphic cat, monochrome, photo, pet collar, gun, weapon, blue, 3d, drones, drone, buildings in background, green', ], [ './examples/musk_resize.jpeg', './examples/poses/pose2.jpg', 'a man flying in the sky in Mars', 'Mars', '(lowres, low quality, worst quality:1.2), (text:1.2), watermark, (frame:1.2), deformed, ugly, deformed eyes, blur, out of focus, blurry, deformed cat, deformed, photo, anthropomorphic cat, monochrome, photo, pet collar, gun, weapon, blue, 3d, drones, drone, buildings in background, green', ], [ './examples/sam_resize.png', './examples/poses/pose4.jpg', 'a man doing a silly pose wearing a suite', 'Jungle', '(lowres, low quality, worst quality:1.2), (text:1.2), watermark, (frame:1.2), deformed, ugly, deformed eyes, blur, out of focus, blurry, deformed cat, deformed, photo, anthropomorphic cat, monochrome, photo, pet collar, gun, weapon, blue, 3d, drones, drone, buildings in background, gree', ], [ './examples/schmidhuber_resize.png', './examples/poses/pose3.jpg', 'a man sit on a chair', 'Neon', '(lowres, low quality, worst quality:1.2), (text:1.2), watermark, (frame:1.2), deformed, ugly, deformed eyes, blur, out of focus, blurry, deformed cat, deformed, photo, anthropomorphic cat, monochrome, photo, pet collar, gun, weapon, blue, 3d, drones, drone, buildings in background, green', ], [ './examples/kaifu_resize.png', './examples/poses/pose.jpg', 'a man', 'Vibrant Color', '(lowres, low quality, worst quality:1.2), (text:1.2), watermark, (frame:1.2), deformed, ugly, deformed eyes, blur, out of focus, blurry, deformed cat, deformed, photo, anthropomorphic cat, monochrome, photo, pet collar, gun, weapon, blue, 3d, drones, drone, buildings in background, green', ], ] return case def load_example (face_file, pose_file, prompt, style, negative_prompt): name = os.path.basename(face_file).split('_')[0] image = PIL.Image.open(open(f'./examples/generated/{name}.jpg', 'rb')) return image, gr.update(visible=True) upload_depot = {} def upload_assets_with_cache (client, paths): global upload_depot pending_paths = [path for path in paths if not path in upload_depot] if pending_paths: print('uploading images:', pending_paths) for key, value in zip(pending_paths, client.upload_assets(pending_paths)): upload_depot[key] = value return [upload_depot[path] for path in paths] def generate_image ( novita_key1, model_name, lora_selection, face_image_path, pose_image_path, prompt, negative_prompt, style_name, num_steps, identitynet_strength_ratio, adapter_strength_ratio, controlnet_strength_1, controlnet_strength_2, controlnet_strength_3, controlnet_strength_4, controlnet_selection, guidance_scale, seed, scheduler, #enable_LCM, #enhance_face_region, progress=gr.Progress(track_tqdm=True), ): if face_image_path is None: raise gr.Error(f'Cannot find any input face image! Please refer to step 1️⃣') #print('novita_key:', novita_key1) #print('face_image_path:', face_image_path) if not novita_key1: raise gr.Error(f'Please input your Novita Key!') try: client = get_novita_client(novita_key1) prompt, negative_prompt = apply_style(style_name, prompt, negative_prompt) prompt = prompt[:1024] or ' ' #print('prompt:', prompt) #print('negative_prompt:', negative_prompt) #print('seed:', seed) #print('identitynet_strength_ratio:', identitynet_strength_ratio) #print('adapter_strength_ratio:', adapter_strength_ratio) #print('scheduler:', scheduler) #print('guidance_scale:', guidance_scale) #print('num_steps:', num_steps) ref_image_path = pose_image_path if pose_image_path else face_image_path ref_image = PIL.Image.open(ref_image_path) width, height = ref_image.size large_edge = max(width, height) if large_edge < 1024: scaling = 1024 / large_edge width = int(width * scaling) height = int(height * scaling) ( CONTROLNET_DICT['pose'].strength, CONTROLNET_DICT['canny'].strength, CONTROLNET_DICT['depth'].strength, CONTROLNET_DICT['lineart'].strength, ) = [controlnet_strength_1, controlnet_strength_2, controlnet_strength_3, controlnet_strength_4] def progress_ (x): global last_check t = time() if t > last_check + 5: last_check = t print('progress:', t, x.task.status) res = client.instant_id( model_name=f'{model_name}.safetensors', face_images=[face_image_path], ref_images=[ref_image_path], prompt=prompt, negative_prompt=negative_prompt, controlnets=[CONTROLNET_DICT[name] for name in controlnet_selection if name in CONTROLNET_DICT], loras=[InstantIDLora( model_name=f'{name}.safetensors', strength=1, ) for name in lora_selection], steps=num_steps, seed=seed, guidance_scale=guidance_scale, sampler_name=scheduler, id_strength=identitynet_strength_ratio, adapter_strength=adapter_strength_ratio, width=width, height=height, response_image_type='jpeg', callback=progress_, ) print('task_id:', datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S"), res.task.task_id) if not hasattr(res, 'images_encoded'): raise gr.Error(f'Error: {res.task}') except Exception as e: raise gr.Error(f'Error: {e}') image = PIL.Image.open(BytesIO(base64.b64decode(res.images_encoded[0]))) return image, gr.update(visible=True) def get_payload ( model_name, lora_selection, face_image_path, pose_image_path, prompt, negative_prompt, style_name, num_steps, identitynet_strength_ratio, adapter_strength_ratio, controlnet_strength_1, controlnet_strength_2, controlnet_strength_3, controlnet_strength_4, controlnet_selection, guidance_scale, seed, scheduler, ): prompt, negative_prompt = apply_style(style_name, prompt, negative_prompt) ref_image_path = pose_image_path if pose_image_path else face_image_path ref_image = PIL.Image.open(ref_image_path) width, height = ref_image.size large_edge = max(width, height) if large_edge < 1024: scaling = 1024 / large_edge width = int(width * scaling) height = int(height * scaling) ( CONTROLNET_DICT['pose'].strength, CONTROLNET_DICT['canny'].strength, CONTROLNET_DICT['depth'].strength, CONTROLNET_DICT['lineart'].strength, ) = [controlnet_strength_1, controlnet_strength_2, controlnet_strength_3, controlnet_strength_4] return { 'extra': { 'response_image_type': 'jpeg', }, 'model_name': f'{model_name}.safetensors', 'face_image_assets_ids': "[assets_ids of id image, please manually upload to novita.ai]", 'ref_image_assets_ids': "[assets_ids of reference image, please manually upload to novita.ai]", 'prompt': prompt, 'negative_prompt': negative_prompt, 'controlnet': { 'units': [CONTROLNET_DICT[name] for name in controlnet_selection if name in CONTROLNET_DICT], }, 'loras': [dict( model_name=f'{name}.safetensors', strength=1, ) for name in lora_selection], 'image_num': 1, 'steps': num_steps, 'seed': seed, 'guidance_scale': guidance_scale, 'sampler_name': scheduler, 'id_strength': identitynet_strength_ratio, 'adapter_strength': adapter_strength_ratio, 'width': width, 'height': height, } # Description title = r'''