|
import threading

from ctransformers import AutoModelForCausalLM, AutoTokenizer
from fastapi import FastAPI
from fastapi.concurrency import run_in_threadpool
from pydantic import BaseModel
|
|
|
|
|
# Load the quantized SQLCoder weights once at import time so every request
# reuses the same model instance. `hf=True` wraps the model in ctransformers'
# Hugging Face-compatible interface, which the /generate_sql endpoint relies on
# (tensor inputs to `generate`, tokenizer `encode`/`decode`). This mode needs
# the `transformers` package to be installed.
# NOTE(review): a bare local GGUF file may also need `model_type=...` — confirm.
llm = AutoModelForCausalLM.from_pretrained("sqlcoder-7b.Q4_K_S.gguf", hf=True)

# ctransformers builds its tokenizer from the loaded model object, not from a
# path; passing the file name here raises TypeError.
tokenizer = AutoTokenizer.from_pretrained(llm)
|
|
|
|
|
class Validation(BaseModel):
    """Request body accepted by the /generate_sql endpoint."""

    # Text handed to the tokenizer as the generation prompt.
    prompt: str
|
|
|
|
|
# ASGI application object; the route decorator below registers on it.
app = FastAPI()
|
|
|
|
|
# Upper bound on tokens generated per request. Without an explicit limit the
# library's default length cap applies (20 tokens total in Hugging Face
# transformers), which is too short for a prompt plus a SQL statement.
# Tune this to the longest query you expect.
_MAX_NEW_TOKENS = 256

# Inference runs on worker threads, but `llm` and `tokenizer` are shared
# module-level objects. Assume they are not safe for concurrent use and let
# only one request drive them at a time.
_INFERENCE_LOCK = threading.Lock()


def _generate_sql_sync(prompt: str) -> str:
    """Run one blocking tokenize -> generate -> decode pass for *prompt*.

    Args:
        prompt: Text to feed to the model.

    Returns:
        The decoded first sequence returned by the model, with special
        tokens removed.
    """
    with _INFERENCE_LOCK:
        input_ids = tokenizer.encode(prompt, return_tensors="pt")
        completion = llm.generate(input_ids, max_new_tokens=_MAX_NEW_TOKENS)
        # NOTE(review): with a Hugging Face-style `generate`, the returned
        # sequence presumably starts with the prompt tokens, so the decoded
        # text would echo the prompt — confirm that clients expect this.
        return tokenizer.decode(completion[0], skip_special_tokens=True)


@app.post("/generate_sql")
async def generate_sql(item: Validation):
    """Generate text from the model for the prompt in the request body.

    Args:
        item: Validated request body carrying the prompt.

    Returns:
        A dict with a single key, ``"generated_sql"``, holding the decoded
        model output.
    """
    # Model inference is CPU-bound and blocking. Running it directly in this
    # coroutine would stall the event loop (and every other request) until
    # generation finishes, so hand it to the threadpool instead.
    generated_sql = await run_in_threadpool(_generate_sql_sync, item.prompt)
    return {"generated_sql": generated_sql}
|
|