Spaces:

notmanoj
/

chronos

Paused

App Files Files Community

Manoj Kumar committed on Jan 10

Commit

9c8236d

1 Parent(s): 39179ce

updated question structure

Browse files

Files changed (1) hide show

app.py +42 -11

app.py CHANGED Viewed

@@ -9,21 +9,52 @@ db_schema = {
     "customers": ["customer_id", "name", "email", "phone_number"]
 }
-def dummy_function(schema_description, user_question):
-    print(user_question)
 # Schema as a context for the model
 schema_description = json.dumps(db_schema, indent=4)
 # Example interactive questions
-print("Ask a question about the database schema.")
-while True:
-    user_question = input("Question: ")
-    if user_question.lower() in ["exit", "quit"]:
-        print("Exiting...")
-        break
-    # Generate SQL query
-    sql_query = dummy_function(schema_description, user_question)
-    print(f"Generated SQL Query:\n{sql_query}\n")

     "customers": ["customer_id", "name", "email", "phone_number"]
 }
+# Load the tokenizer and the causal language model once, at module level; generate_sql_query reads both as globals
+model_name = "EleutherAI/gpt-neox-20b"  # You can also use "Llama-2-7b" or another model (NOTE(review): confirm the exact Hub id before swapping)
+tokenizer = AutoTokenizer.from_pretrained(model_name)  # tokenizer is loaded from the same checkpoint name as the model
+model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto", torch_dtype=torch.float16)  # float16 weights; device placement is delegated to device_map="auto"
+def generate_sql_query(context, question):
+    """
+    Generate an SQL query based on the question and context.
+    Args:
+        context (str): Description of the database schema or table relationships.
+        question (str): User's natural language query.
+    Returns:
+        str: Generated SQL query.
+    """
+    # Prepare the prompt
+    prompt = f"""
+    Context: {context}
+    Question: {question}
+    Write an SQL query to address the question based on the context.
+    Query:
+    """
+    # Tokenize input
+    inputs = tokenizer(prompt, return_tensors="pt", truncation=True, max_length=1024).to("cuda" if torch.cuda.is_available() else "cpu")
+    # Generate SQL query
+    output = model.generate(inputs.input_ids, max_length=512, num_beams=5, early_stopping=True)
+    query = tokenizer.decode(output[0], skip_special_tokens=True)
+    # Extract query from the output
+    sql_query = query.split("Query:")[-1].strip()
+    return sql_query
 # Schema serialized to indented JSON text, used as the context for the model
 schema_description = json.dumps(db_schema, indent=4)
 # Example questions, processed in order (no longer read interactively)
+questions = [  # fixed sample prompts that take the place of the earlier input() loop
+    "Show all products that cost more than $50.",
+    "List all customers who ordered a specific product.",
+]
+for user_question in questions:
+    print(f"Question: {user_question}")
+    sql_query = generate_sql_query(schema_description, user_question)  # the schema JSON is passed as the prompt context
+    print(f"Generated SQL Query:\n{sql_query}\n")