|
import os |
|
import gradio as gr |
|
import random |
|
from openai import AzureOpenAI |
|
|
|
|
|
AZURE_API_VERSION = "2023-03-15-preview" |
|
|
|
client = AzureOpenAI(api_key=os.getenv("AZURE_OPENAI_API_KEY"), api_version=AZURE_API_VERSION, azure_endpoint=os.getenv("AZURE_OPENAI_ENDPOINT")) |
|
|
|
|
|
new_year_levels = [os.getenv("First_Word"), os.getenv("Second_Word"), os.getenv("Third_Word"), os.getenv("Fourth_Word"), os.getenv("Fifth_Word")] |
|
|
|
|
|
def ask_openai(prompt, secret_word): |
|
""" |
|
Sends the user prompt and safeguards to the OpenAI API to generate a response. |
|
""" |
|
system_message = os.getenv("SYSTM_MSG") |
|
|
|
try: |
|
response = client.chat.completions.create( |
|
model="gpt-4o", |
|
messages=[ |
|
{"role": "system", "content": system_message}, |
|
{"role": "user", "content": prompt} |
|
], |
|
temperature=0.7, |
|
max_tokens=100, |
|
) |
|
return response.choices[0].message.content |
|
except Exception as e: |
|
return f"Error: {str(e)}" |
|
|
|
|
|
|
|
def jailbreak_game(user_prompt, current_level, attempts): |
|
|
|
if current_level >= len(new_year_levels): |
|
return ( |
|
"Congratulations! π You have completed all levels. ", |
|
current_level, |
|
attempts) |
|
|
|
secret_word = new_year_levels[current_level] |
|
ai_response = ask_openai(user_prompt, secret_word) |
|
|
|
|
|
if secret_word in ai_response.lower(): |
|
if current_level + 1 < len(new_year_levels): |
|
return ( |
|
f"π You got it! The secret word for Level {current_level + 1} was '{secret_word}'. " |
|
f"Get ready for Level {current_level + 2}! π₯³", |
|
current_level + 1, |
|
attempts + 1) |
|
else: |
|
NY_msg = "β¨ May 2025 bring you endless joy, success, and fireworks of happiness! Happy New Year! β¨" |
|
try: |
|
response = client.chat.completions.create( |
|
model="gpt-4o", |
|
messages=[{"role": "user", "content": "Generate a unique Happy New year wish. Your response should be only the New Year wish."}], |
|
temperature=0.1, |
|
max_tokens=100, |
|
) |
|
NY_msg = response.choices[0].message.content |
|
except Exception as e: |
|
NY_msg = f"β¨ May 2025 bring you endless joy, success, and fireworks of happiness! Happy New Year! β¨" |
|
|
|
return ( |
|
f"π You got it! The secret word for Level {current_level + 1} was '{secret_word}'. " |
|
"You have completed all levels!π₯³ Here is a unique New Year message for you: " |
|
f"{NY_msg}", |
|
current_level + 1, |
|
attempts + 1) |
|
|
|
else: |
|
return ai_response, current_level, attempts + 1 |
|
|
|
def start_new_game(): |
|
welcome_message = ( |
|
"Welcome to the New Year 2025 Jailbreak Game! π\n" |
|
"Try to make me say the secret words related to New Year's Eve.\n" |
|
"You will go through 5 levels, each with a unique word, related to 'New Year'. Good luck!" |
|
) |
|
return welcome_message, 0, 0 |
|
|
|
|
|
with gr.Blocks() as app: |
|
with gr.Row(): |
|
gr.Markdown("## π New Year 2025 Jailbreak Game π") |
|
descripion, _0, _1 = start_new_game() |
|
gr.Markdown(descripion) |
|
|
|
user_prompt = gr.Textbox(label="Your Prompt", placeholder="Enter your prompt here...") |
|
game_output = gr.Textbox(label="AI Response", interactive=False) |
|
attempts = gr.Number(value=0, interactive=False, label="Attempts") |
|
current_level = gr.State(value=0) |
|
|
|
with gr.Row(): |
|
submit_button = gr.Button("Submit") |
|
new_game_button = gr.Button("Start New Game") |
|
|
|
submit_button.click(jailbreak_game, [user_prompt, current_level, attempts], [game_output, current_level, attempts]) |
|
new_game_button.click(start_new_game, [], [game_output, current_level, attempts]) |
|
|
|
|
|
app.launch() |