"""Launch the llama-cpp-python FastAPI server for a local GGUF model.

The module builds the ASGI ``app`` at import time, attaches a permissive
CORS policy, and redirects the root URL to the interactive ``/docs`` page.
Running the file as a script starts uvicorn on port 7860.
"""

import os

from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import HTMLResponse
from fastapi.responses import RedirectResponse
from llama_cpp.server.app import create_app, Settings


# Location of the GGUF model file handed to the llama.cpp server settings.
model_path = "/home/user/model/gguf-model.gguf"


# Build the server application. The keyword values are passed straight to
# llama-cpp-python's ``Settings``; n_gpu_layers presumably controls how many
# layers are offloaded to the GPU -- confirm against the installed version.
app = create_app(
    Settings(
        n_threads=4,
        model=model_path,
        embedding=True,
        n_gpu_layers=33,
    )
)

# Allow cross-origin requests from any origin, with any method and header.
# NOTE(review): a wildcard origin combined with allow_credentials=True is
# discouraged by the FastAPI CORS documentation; if credentialed requests
# are actually needed, list the trusted origins explicitly.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)


@app.get("/")
async def redirect_root_to_docs():
    """Redirect requests for the site root to the ``/docs`` page."""
    return RedirectResponse("/docs")


if __name__ == "__main__":
    # Imported here so uvicorn is only required when run as a script.
    import uvicorn

    # Listen on all interfaces so the server is reachable from outside the host.
    uvicorn.run(app, host="0.0.0.0", port=7860)