| from fastapi import FastAPI |
| from pydantic import BaseModel |
| from ctransformers import AutoModelForCausalLM, AutoTokenizer |
|
|
| |
# Quantized SQLCoder weights (GGUF file) used by this service.
MODEL_PATH = "sqlcoder-7b.Q4_K_S.gguf"

# hf=True asks ctransformers to wrap the native model in its (experimental)
# Hugging Face Transformers-compatible interface.  That is the interface the
# rest of this module relies on: tensor inputs (`return_tensors="pt"`) and a
# `generate()` whose result is indexed as a batch.
# NOTE(review): this mode needs `transformers` and `torch` installed - confirm
# they are part of the deployment environment.
llm = AutoModelForCausalLM.from_pretrained(MODEL_PATH, hf=True)

# ctransformers' AutoTokenizer is built from the loaded model object, not from
# a path: passing the file name here (as the code previously did) is rejected
# by the library.
tokenizer = AutoTokenizer.from_pretrained(llm)
|
|
| |
# Request body schema for the /generate_sql endpoint.
# (Documented with comments rather than a docstring so the generated API
# schema stays exactly as it was.)
class Validation(BaseModel):
    # Prompt text that is tokenized and handed to the model.
    prompt: str
|
|
| |
# ASGI application object; route handlers below register themselves on it.
app = FastAPI()
|
|
| |
# Cap on newly generated tokens per request.  Without an explicit budget,
# `generate()` falls back to the library's small default `max_length`, which
# also counts the prompt tokens, so long prompts leave little or no room for
# the answer.  Tune this value to the longest query you expect.
_MAX_NEW_TOKENS = 256


@app.post("/generate_sql")
async def generate_sql(item: Validation):
    """Generate SQL for the given prompt.

    Args:
        item: Request body; only ``item.prompt`` is read.

    Returns:
        A dict with the single key ``"generated_sql"`` holding the decoded
        model continuation (the prompt itself is not echoed back).

    Raises:
        HTTPException: With status 422 when the prompt is empty or consists
            only of whitespace.
    """
    # Local import keeps this handler self-contained with respect to the
    # module's import block.
    from fastapi import HTTPException

    if not item.prompt.strip():
        raise HTTPException(status_code=422, detail="prompt must not be empty")

    # Assumes `tokenizer` / `llm` expose the Hugging Face-style interface
    # (tensor of shape (1, prompt_len) in, tensor of prompt + continuation
    # out), as the `return_tensors="pt"` and `completion[0]` usage implies.
    input_ids = tokenizer.encode(item.prompt, return_tensors="pt")
    prompt_length = input_ids.shape[-1]

    # NOTE(review): this call is synchronous inside an `async def` handler, so
    # the event loop is blocked while it runs.  Consider offloading it to a
    # worker thread (with access to the model serialized) if the service must
    # handle concurrent requests.
    completion = llm.generate(input_ids, max_new_tokens=_MAX_NEW_TOKENS)

    # The returned sequence starts with the prompt tokens; drop them so the
    # response contains only the newly generated text.
    new_tokens = completion[0][prompt_length:]
    generated_sql = tokenizer.decode(new_tokens, skip_special_tokens=True)

    return {"generated_sql": generated_sql}
|
|