| from fastapi import FastAPI, Request |
| from fastapi.responses import StreamingResponse |
| from fastapi.middleware.cors import CORSMiddleware |
|
|
| from inference import generate_response |
| import time |
|
|
| app = FastAPI() |
|
|
| app.add_middleware( |
| CORSMiddleware, |
| allow_origins=["http://localhost:5173"], |
| allow_credentials=True, |
| allow_methods=["*"], |
| allow_headers=["*"], |
| ) |
|
|
|
|
| @app.post("/chat") |
| async def chat(req: Request): |
| body = await req.json() |
| prompt = body.get("prompt") |
| return StreamingResponse(generate_response(prompt), media_type="text/plain") |
|
|