| | from llama_cpp.server.app import create_app, Settings |
| | from fastapi.responses import HTMLResponse |
| | from fastapi.middleware.cors import CORSMiddleware |
| | from fastapi.responses import RedirectResponse |
| | import os |
| |
|
# Location of the GGUF model file handed to the server settings.
# The MODEL_PATH environment variable, when set, overrides the built-in
# default so the script can run on machines with a different directory layout.
model_path = os.environ.get("MODEL_PATH", "/home/user/model/gguf-model.gguf")
| |
|
# Gather the server settings first, then build the application from them.
# The values below are passed straight through to llama_cpp's Settings.
_server_settings = Settings(
    model=model_path,
    n_gpu_layers=33,
    n_threads=4,
    embedding=True,
)
app = create_app(_server_settings)
# Allow browser clients from any origin to call the API, with any method
# and any request header.
# Credentials (cookies) are deliberately NOT allowed: FastAPI's CORS
# documentation states that wildcard ("*") origins, methods, or headers must
# not be combined with allow_credentials=True. To support credentialed
# cross-origin requests, replace the "*" lists with explicit values first.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=False,
    allow_methods=["*"],
    allow_headers=["*"],
)
| |
|
# Handler for GET "/": answers with a redirect to the "/docs" path so that
# requests to the bare root URL land on the docs page.
@app.get("/")
async def redirect_root_to_docs():
    docs_location = "/docs"
    return RedirectResponse(url=docs_location)
| |
|
if __name__ == "__main__":
    # uvicorn is imported only when the file is executed as a script.
    from uvicorn import run as serve

    # Serve the app on all network interfaces, port 7860.
    serve(app, port=7860, host="0.0.0.0")
| |
|