"""Launch the llama_cpp server application with permissive CORS.

The module builds the FastAPI ``app`` via ``llama_cpp.server.app.create_app``,
registers a CORS middleware that accepts every origin, method and header, and
redirects the root path to ``/docs``. When executed as a script it serves the
app with uvicorn on all interfaces, port 7860.
"""

import os

from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import HTMLResponse
from fastapi.responses import RedirectResponse
from llama_cpp.server.app import Settings
from llama_cpp.server.app import create_app

# Model/server configuration handed to ``create_app``.
_settings = Settings(
    model="model/gguf-model.gguf",
    n_threads=4,
    n_gpu_layers=33,
    embedding=True,
)

app = create_app(_settings)

# NOTE(review): wildcard origins together with ``allow_credentials=True`` is a
# very permissive policy -- confirm this is intended for the deployment.
_cors_options = {
    "allow_origins": ["*"],
    "allow_credentials": True,
    "allow_methods": ["*"],
    "allow_headers": ["*"],
}
app.add_middleware(CORSMiddleware, **_cors_options)


@app.get("/")
async def redirect_root_to_docs():
    """Redirect requests for the root path to ``/docs``."""
    return RedirectResponse(url="/docs")


if __name__ == "__main__":
    # uvicorn is only needed when the module is run directly as a script.
    import uvicorn

    bind_host = "0.0.0.0"
    bind_port = 7860
    uvicorn.run(app, host=bind_host, port=bind_port)