meme_world / app.py
Xhaheen's picture
Update app.py
38a0b0b
raw
history blame
7.07 kB
# # %%bash
# # # git lfs install
# # # git clone https://huggingface.co/spaces/Xhaheen/meme_world
# # # pip install -r /content/meme_world/requirements.txt
# # # pip install gradio
# # cd /meme_world
# import torch
# import re
# import gradio as gr
# from transformers import AutoTokenizer, ViTFeatureExtractor, VisionEncoderDecoderModel
# import cohere
# import os
# #
# # os.environ['key_srkian'] = ''
# key_srkian = os.environ["key_srkian"]
# co = cohere.Client(key_srkian)#srkian
# device='cpu'
# encoder_checkpoint = "nlpconnect/vit-gpt2-image-captioning"
# decoder_checkpoint = "nlpconnect/vit-gpt2-image-captioning"
# model_checkpoint = "nlpconnect/vit-gpt2-image-captioning"
# feature_extractor = ViTFeatureExtractor.from_pretrained(encoder_checkpoint)
# tokenizer = AutoTokenizer.from_pretrained(decoder_checkpoint)
# model = VisionEncoderDecoderModel.from_pretrained(model_checkpoint).to(device)
# def predict(department,image,max_length=64, num_beams=4):
# image = image.convert('RGB')
# image = feature_extractor(image, return_tensors="pt").pixel_values.to(device)
# clean_text = lambda x: x.replace('<|endoftext|>','').split('\n')[0]
# caption_ids = model.generate(image, max_length = max_length)[0]
# caption_text = clean_text(tokenizer.decode(caption_ids))
# dept=department
# context= caption_text
# response = co.generate(
# model='large',
# prompt=f'create non offensive one line meme for given department and context\n\ndepartment- data science\ncontext-a man sitting on a bench with a laptop\nmeme- \"I\'m not a data scientist, but I play one on my laptop.\"\n\ndepartment-startup\ncontext-a young boy is smiling while using a laptop\nmeme-\"When your startup gets funded and you can finally afford a new laptop\"\n\ndepartment- {dept}\ncontext-{context}\nmeme-',
# max_tokens=20,
# temperature=0.8,
# k=0,
# p=0.75,
# frequency_penalty=0,
# presence_penalty=0,
# stop_sequences=["department"],
# return_likelihoods='NONE')
# reponse=response.generations[0].text
# reponse = reponse.replace("department", "")
# Feedback_SQL="DEPT"+dept+"CAPT"+caption_text+"MAMAY"+reponse
# return reponse
# # input = gr.inputs.Image(label="Upload your Image", type = 'pil', optional=True)
# output = gr.outputs.Textbox(type="text",label="Meme")
# #examples = [f"example{i}.jpg" for i in range(1,7)]
# #examples = os.listdir()
# examples = [f"example{i}.png" for i in range(1,7)]
# #examples=os.listdir()
# #for fichier in examples:
# # if not(fichier.endswith(".png")):
# # examples.remove(fichier)
# description= " Looking for a fun and easy way to generate memes? Look no further than Meme world! Leveraging large language models like GPT-3PT-3 / Ai21 / Cohere, you can create memes that are sure to be a hit with your friends or network. Created with ♥️ by Arsalan @[Xaheen](https://www.linkedin.com/in/sallu-mandya/). kindly share your thoughts in discussion session and use the app responsibly #NO_Offense \n \n built with ❤️ @[Xhaheen](https://www.linkedin.com/in/sallu-mandya/)"
# title = "Meme world 🖼️"
# dropdown=["data science", "product management","marketing","startup" ,"agile","crypto" , "SEO" ]
# article = "Created By : Xaheen "
# interface = gr.Interface(
# fn=predict,
# inputs = [gr.inputs.Dropdown(dropdown),gr.inputs.Image(label="Upload your Image", type = 'pil', optional=True)],
# theme="grass",
# outputs=output,
# examples =[['data science', 'example5.png'],
# ['product management', 'example2.png'],
# ['startup', 'example3.png'],
# ['marketing', 'example4.png'],
# ['agile', 'example1.png'],
# ['crypto', 'example6.png']],
# title=title,
# description=description,
# article = article,
# )
# interface.launch(debug=True)
# Step 2: Set up the Gradio interface and import necessary packages
import gradio as gr
import openai
from transformers import VisionEncoderDecoderModel, ViTImageProcessor, AutoTokenizer
import torch
from PIL import Image
# Step 3: Load the provided image captioning model
# The model weights, the image preprocessor, and the tokenizer are all loaded
# from the same checkpoint identifier, so it is named once here.
_CAPTION_CHECKPOINT = "nlpconnect/vit-gpt2-image-captioning"

model = VisionEncoderDecoderModel.from_pretrained(_CAPTION_CHECKPOINT)
feature_extractor = ViTImageProcessor.from_pretrained(_CAPTION_CHECKPOINT)
tokenizer = AutoTokenizer.from_pretrained(_CAPTION_CHECKPOINT)

# Use CUDA when torch reports it as available; otherwise stay on the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")
model.to(device)
# Step 4: Create a function to generate captions from images
# Generation settings; gen_kwargs is unpacked as keyword arguments into
# model.generate() by generate_caption().
max_length, num_beams = 16, 4
gen_kwargs = dict(max_length=max_length, num_beams=num_beams)
def generate_caption(image):
    """Return a text caption for *image* produced by the captioning model.

    Args:
        image: Array-like object exposing ``astype`` (presumably the NumPy
            array that the Gradio image input supplies -- confirm against
            the Gradio version in use).

    Returns:
        The decoded caption with special tokens removed and surrounding
        whitespace stripped.

    Raises:
        ValueError: If *image* is ``None`` (for example, nothing was
            uploaded before submitting).
    """
    if image is None:
        raise ValueError("No image was provided; please upload an image first.")

    # Let Pillow infer the mode from the array instead of forcing "RGB".
    # Forcing it made the conversion below unreachable and misread arrays
    # that are not H x W x 3 (e.g. grayscale or RGBA).
    pil_image = Image.fromarray(image.astype("uint8"))
    if pil_image.mode != "RGB":
        pil_image = pil_image.convert(mode="RGB")

    # Preprocess into a batch of one and move it to the model's device.
    pixel_values = feature_extractor(images=[pil_image], return_tensors="pt").pixel_values
    pixel_values = pixel_values.to(device)

    output_ids = model.generate(pixel_values, **gen_kwargs)
    return tokenizer.decode(output_ids[0], skip_special_tokens=True).strip()
# Step 5: Create a function to generate memes using the GPT-3 API
def generate_meme(caption, department):
    """Request a meme caption from the OpenAI completion API.

    Args:
        caption: Image description to base the meme on.
        department: Department name interpolated into the prompt.

    Returns:
        The text of the first completion choice, stripped of surrounding
        whitespace.

    Raises:
        KeyError: If the ``key`` environment variable (the OpenAI API key)
            is not set.
    """
    # The live module never imports ``os`` at file level, so the original
    # lookup failed with NameError on every call; import it here.
    import os

    # Read the key first so a missing variable fails before any API setup.
    api_key = os.environ["key"]
    openai.api_key = api_key

    prompt = f"Create a non-offensive meme caption for the following image description in the context of {department} department: {caption}"
    # NOTE(review): ``openai.Completion`` and the ``text-davinci-002`` engine
    # look like the legacy (pre-1.0) OpenAI SDK interface -- confirm the
    # pinned ``openai`` version still supports them.
    response = openai.Completion.create(
        engine="text-davinci-002",
        prompt=prompt,
        max_tokens=50,
        n=1,
        stop=None,
        temperature=0.7,
    )
    return response.choices[0].text.strip()
# Step 6: Define the main meme generation function
def meme_generator(image, department):
    """Caption *image*, then turn that caption into a meme line for *department*.

    Args:
        image: Forwarded unchanged to ``generate_caption``.
        department: Forwarded unchanged to ``generate_meme``.

    Returns:
        Whatever ``generate_meme`` returns for the generated caption.
    """
    return generate_meme(generate_caption(image), department)
# File names example1.png through example6.png. The gr.Interface call in this
# file passes its own literal examples list rather than this variable.
examples = [f"example{number}.png" for number in range(1, 7)]
# Step 7: Launch the Gradio application
# Widgets: an image upload, a department picker, and a text box for the result.
# NOTE(review): gr.inputs / gr.outputs and theme="grass" look like legacy
# Gradio APIs -- confirm they exist in the pinned Gradio version.
image_input = gr.inputs.Image()
department_input = gr.inputs.Dropdown(
    choices=[
        "data science",
        "product management",
        "marketing",
        "startup",
        "agile",
        "crypto",
        "SEO",
    ]
)
output_text = gr.outputs.Textbox()

# Build the interface and start it. Each example row is ordered
# [image file, department] to match the order of `inputs`.
gr.Interface(
    fn=meme_generator,
    inputs=[image_input, department_input],
    outputs=output_text,
    title="Meme world!",
    description=" Looking for a fun and easy way to generate memes? Look no further than Meme world! Leveraging large language models like GPT-3PT-3 / Ai21 / Cohere, you can create memes that are sure to be a hit with your friends or network. Created with ♥️ by Arsalan @[Xaheen](https://www.linkedin.com/in/sallu-mandya/). kindly share your thoughts in discussion session and use the app responsibly #NO_Offense \n \n built with ❤️ @[Xhaheen](https://www.linkedin.com/in/sallu-mandya/)",
    theme="grass",
    examples=[
        ["example5.png", "data science"],
        ["example2.png", "product management"],
        ["example3.png", "startup"],
        ["example4.png", "marketing"],
        ["example1.png", "agile"],
        ["example6.png", "crypto"],
    ],
).launch(debug=True)