RealVis_v5.0_BF16_C

Running on Zero

App Files Community

ford442 committed on Jan 11

Commit

5858e45

verified ·

1 Parent(s): 3c1f632

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -10

app.py CHANGED Viewed

@@ -6,6 +6,9 @@
 # copies of the Software, and to permit persons to whom the Software is
 import spaces
 import os
 import random
 import uuid
 import gradio as gr
@@ -127,21 +130,22 @@ def scheduler_swap_callback(pipeline, step_index, timestep, callback_kwargs):
     return {"latents": callback_kwargs["latents"]}
 def load_and_prepare_model():
     vaeXL = AutoencoderKL.from_pretrained("stabilityai/sdxl-vae", safety_checker=None, use_safetensors=False).to(torch.bfloat16) #.to(device=device, dtype=torch.bfloat16)
     #vaeRV = AutoencoderKL.from_pretrained("SG161222/RealVisXL_V5.0", subfolder='vae', safety_checker=None, use_safetensors=False).to(device).to(torch.bfloat16) #.to(device=device, dtype=torch.bfloat16)
     #sched = EulerAncestralDiscreteScheduler.from_pretrained('ford442/RealVisXL_V5.0_BF16', subfolder='scheduler',beta_schedule="scaled_linear")
-    sched = EulerAncestralDiscreteScheduler.from_pretrained('ford442/RealVisXL_V5.0_BF16', subfolder='scheduler')
     pipe = StableDiffusionXLPipeline.from_pretrained(
         'ford442/RealVisXL_V5.0_BF16',
         #torch_dtype=torch.bfloat16,
         add_watermarker=False,
       #  low_cpu_mem_usage = False,
         token = HF_TOKEN,
-        scheduler = sched,
     )
     #sched = EulerAncestralDiscreteScheduler.from_pretrained('ford442/RealVisXL_V5.0_BF16', subfolder='scheduler',beta_schedule="scaled_linear", beta_start=0.00085, beta_end=0.012, steps_offset=1) #,use_karras_sigmas=True)
     pipe.vae = vaeXL #.to(torch.bfloat16)
-    #pipe.scheduler = sched
     #pipe.vae.do_resize=False
     #pipe.vae.vae_scale_factor=8
     pipe.vae.set_default_attn_processor()
@@ -164,23 +168,20 @@ def load_and_prepare_model():
     #pipe.unet.to(memory_format=torch.channels_last)
     #pipe.enable_vae_tiling()
-    #pipe.unet = torch.compile(pipe.unet, backend="hidet")
     pipe.to(device=device, dtype=torch.bfloat16)
     return pipe
 hidet.option.parallel_build(True)
-hidet.option.parallel_tune(-1,4.0)
 torch._dynamo.config.suppress_errors = True
 torch._dynamo.disallow_in_graph(diffusers.models.attention.BasicTransformerBlock)
-# Preload and compile both models
-pipe = load_and_prepare_model()
 # more search
-hidet.torch.dynamo_config.search_space(0)
 #hidet.torch.dynamo_config.dump_graph_ir("./local_graph")
 hidet.option.cache_dir("local_cache")
 # automatically transform the model to use float16 data type
@@ -191,7 +192,10 @@ hidet.option.cache_dir("local_cache")
 hidet.torch.dynamo_config.use_tensor_core()
 #hidet.torch.dynamo_config.steal_weights(False)
-pipe.unet = torch.compile(pipe.unet, backend="hidet")
 MAX_SEED = np.iinfo(np.int32).max
 neg_prompt_2 = " 'non-photorealistic':1.5, 'unrealistic skin','unattractive face':1.3, 'low quality':1.1, ('dull color scheme', 'dull colors', 'digital noise':1.2),'amateurish', 'poorly drawn face':1.3, 'poorly drawn', 'distorted face', 'low resolution', 'simplistic' "

 # copies of the Software, and to permit persons to whom the Software is
 import spaces
 import os
+import subprocess
+subprocess.run(['ulimit', '-s', '512M'])
 import random
 import uuid
 import gradio as gr
     return {"latents": callback_kwargs["latents"]}
 def load_and_prepare_model():
+    sched = EulerAncestralDiscreteScheduler.from_pretrained('ford442/RealVisXL_V5.0_BF16', subfolder='scheduler',beta_schedule="scaled_linear", beta_start=0.00085, beta_end=0.012, steps_offset=1) #,use_karras_sigmas=True)
     vaeXL = AutoencoderKL.from_pretrained("stabilityai/sdxl-vae", safety_checker=None, use_safetensors=False).to(torch.bfloat16) #.to(device=device, dtype=torch.bfloat16)
     #vaeRV = AutoencoderKL.from_pretrained("SG161222/RealVisXL_V5.0", subfolder='vae', safety_checker=None, use_safetensors=False).to(device).to(torch.bfloat16) #.to(device=device, dtype=torch.bfloat16)
     #sched = EulerAncestralDiscreteScheduler.from_pretrained('ford442/RealVisXL_V5.0_BF16', subfolder='scheduler',beta_schedule="scaled_linear")
+    #sched = EulerAncestralDiscreteScheduler.from_pretrained('ford442/RealVisXL_V5.0_BF16', subfolder='scheduler')
     pipe = StableDiffusionXLPipeline.from_pretrained(
         'ford442/RealVisXL_V5.0_BF16',
         #torch_dtype=torch.bfloat16,
         add_watermarker=False,
       #  low_cpu_mem_usage = False,
         token = HF_TOKEN,
+      #  scheduler = sched,
     )
     #sched = EulerAncestralDiscreteScheduler.from_pretrained('ford442/RealVisXL_V5.0_BF16', subfolder='scheduler',beta_schedule="scaled_linear", beta_start=0.00085, beta_end=0.012, steps_offset=1) #,use_karras_sigmas=True)
     pipe.vae = vaeXL #.to(torch.bfloat16)
+    pipe.scheduler = sched
     #pipe.vae.do_resize=False
     #pipe.vae.vae_scale_factor=8
     pipe.vae.set_default_attn_processor()
     #pipe.unet.to(memory_format=torch.channels_last)
     #pipe.enable_vae_tiling()
+    pipe.unet = torch.compile(pipe.unet, backend="hidet")
     pipe.to(device=device, dtype=torch.bfloat16)
     return pipe
 hidet.option.parallel_build(True)
+hidet.option.parallel_tune(-1,8.0)
 torch._dynamo.config.suppress_errors = True
 torch._dynamo.disallow_in_graph(diffusers.models.attention.BasicTransformerBlock)
 # more search
+hidet.torch.dynamo_config.search_space(1)
 #hidet.torch.dynamo_config.dump_graph_ir("./local_graph")
 hidet.option.cache_dir("local_cache")
 # automatically transform the model to use float16 data type
 hidet.torch.dynamo_config.use_tensor_core()
 #hidet.torch.dynamo_config.steal_weights(False)
+# Preload and compile both models
+pipe = load_and_prepare_model()
 MAX_SEED = np.iinfo(np.int32).max
 neg_prompt_2 = " 'non-photorealistic':1.5, 'unrealistic skin','unattractive face':1.3, 'low quality':1.1, ('dull color scheme', 'dull colors', 'digital noise':1.2),'amateurish', 'poorly drawn face':1.3, 'poorly drawn', 'distorted face', 'low resolution', 'simplistic' "