# ControlLogoNet — app.py
# Author: salahIguiliz (Hugging Face Space)
# Last update commit: 4fc2fae
from controlnet_aux import OpenposeDetector
from diffusers import StableDiffusionControlNetPipeline, ControlNetModel
from diffusers import UniPCMultistepScheduler
import gradio as gr
import torch
from PIL import Image, ImageDraw, ImageFont
import os
import cv2
import glob
from PIL import Image
import numpy as np
from diffusers.utils import load_image
import random
# Constants
# Canny edge-detection thresholds (note: to_Canny() re-defines these locally,
# so these module-level values are effectively unused).
low_threshold = 100
high_threshold = 200
# Models
# OpenPose detector — loaded eagerly but only used by get_pose(); the Gradio
# flow below conditions on Canny edge maps instead.
pose_model = OpenposeDetector.from_pretrained("lllyasviel/ControlNet")
# NOTE(review): the UI feeds Canny edge maps into the pipeline, yet this loads
# the *openpose* ControlNet — confirm whether "lllyasviel/sd-controlnet-canny"
# was intended.
controlnet = ControlNetModel.from_pretrained(
    "lllyasviel/sd-controlnet-openpose"
)
# Stable Diffusion v1.5 with the ControlNet attached; the safety checker is
# explicitly disabled. Everything runs on CPU.
pipe = StableDiffusionControlNetPipeline.from_pretrained(
    "runwayml/stable-diffusion-v1-5", controlnet=controlnet, safety_checker=None
)
pipe = pipe.to("cpu")
def get_pose(image):
    """Extract an OpenPose skeleton map from *image* using the shared detector."""
    pose_map = pose_model(image)
    return pose_map
def generate_an_image_from_text(text, text_size_, width, lenght):
    """Render *text* centered on a blank white canvas.

    A random ``.ttf`` font found in the working directory is used when one is
    available; otherwise Pillow's built-in default font is used as a fallback.

    Args:
        text: The string to draw.
        text_size_: Font size in points (ignored by the bitmap fallback font).
        width: Canvas width in pixels.
        lenght: Canvas height in pixels (name kept for caller compatibility).

    Returns:
        A ``PIL.Image.Image`` in RGB mode of size (width, lenght).
    """
    # Create a blank white image and a drawing handle for it.
    image = Image.new('RGB', (width, lenght), color=(255, 255, 255))
    draw = ImageDraw.Draw(image)
    print("start generation")
    # Pick a random TrueType font shipped alongside the app, if any.
    font_files = glob.glob(os.path.join('', '*.ttf'))
    if font_files:
        font = ImageFont.truetype(random.choice(font_files), text_size_)
    else:
        # Fix: random.choice([]) raised IndexError when no .ttf was present.
        font = ImageFont.load_default()
    # Fix: ImageDraw.textsize() was deprecated in Pillow 9.2 and removed in
    # Pillow 10 — textbbox() is the supported replacement.
    left, top, right, bottom = draw.textbbox((0, 0), text, font=font)
    text_w = right - left
    text_h = bottom - top
    # Center the text on the canvas.
    x = (image.width - text_w) / 2
    y = (image.height - text_h) / 2
    draw.text((x, y), text, fill=(0, 0, 0), font=font)
    print("end generation")
    return image
def to_Canny(image):
    """Run OpenCV Canny edge detection on *image*.

    Returns a 3-channel PIL image whose R, G and B planes all hold the same
    edge map — the conditioning format the ControlNet pipeline expects.
    """
    print("start canny")
    lo, hi = 100, 200
    edges = cv2.Canny(np.array(image), lo, hi)
    # Replicate the single edge channel into three identical RGB planes.
    rgb_edges = np.stack((edges, edges, edges), axis=-1)
    canny_image = Image.fromarray(rgb_edges)
    print("end canny")
    return canny_image
def inference(prompt, canny_image, number, seed, steps):
    """Run the ControlNet Stable Diffusion pipeline.

    Args:
        prompt: Text prompt for generation.
        canny_image: Conditioning image (Canny edge map).
        number: Images to generate per prompt.
        seed: Integer seed for the torch RNG.
        steps: Number of denoising steps.

    Returns:
        The diffusers pipeline output object (has an ``.images`` list).
    """
    print("start inference")
    # Re-create the scheduler from its own config on every call, preserving
    # the original behavior.
    pipe.scheduler = UniPCMultistepScheduler.from_config(pipe.scheduler.config)
    generator = torch.manual_seed(seed)
    result = pipe(
        prompt,
        num_inference_steps=steps,
        generator=generator,
        image=canny_image,
        num_images_per_prompt=number,
    )
    print('end inference')
    return result
def generation(prompt, text, seed, police_size, lenght, width, number, num_inference_steps):
    """End-to-end pipeline: render text → Canny edges → ControlNet images.

    Args:
        prompt: Diffusion text prompt.
        text: Logo text to render.
        seed: RNG seed for reproducibility.
        police_size: Font size for the rendered text.
        lenght: Canvas height in pixels.
        width: Canvas width in pixels.
        number: Number of images to generate.
        num_inference_steps: Denoising steps for the pipeline.

    Returns:
        A list of generated PIL images for the Gradio gallery.
    """
    # Fix: the original passed (text, police_size, lenght, width) positionally
    # into generate_an_image_from_text(text, text_size_, width, lenght),
    # silently swapping width and height (masked because both sliders default
    # to 512). Keyword arguments pin each value to the right parameter.
    img = generate_an_image_from_text(text, police_size, width=width, lenght=lenght)
    canny = to_Canny(img)
    output = inference(prompt, canny, number, seed, num_inference_steps)
    return list(output.images)
# Wire up the UI. Input order must match generation()'s signature:
# prompt textbox, logo-text textbox, then sliders for seed, font size,
# canvas height (lenght), canvas width, image count and inference steps.
# NOTE(review): gr.Gallery().style(...) and launch(enable_queue=...) are
# deprecated/removed in Gradio 4.x — confirm the pinned Gradio version
# before upgrading.
gr.Interface(fn=generation,
inputs=[gr.Textbox(value="A steampunk Alphabetic Logo, steampunk style, with glowing mecha parts, mecha alphabets, high quality, high res, ultra HD"), gr.Textbox(), gr.Slider(0, 200,value=60), gr.Slider(0, 200, value=90), gr.Slider(0, 1024, value=512), gr.Slider(0, 1024, value=512),
gr.Slider(0, 7,value=2, step=1),gr.Slider(0, 20,value=5, step=1)], outputs=gr.Gallery().style(grid=[2], height="auto"), title="Generate a logo using Text ",cache_examples=True, examples=[["A steampunk Alphabetic Logo, steampunk style, with glowing mecha parts, mecha alphabets, high quality, high res, ultra HD", "Logo",60,90,512,512,2,5]]).launch(enable_queue=True)