Spaces:

Alovestocode
/

router-router-zero

Running on Zero

Alovestocode committed on Nov 6

Commit

6a8403c

verified ·

1 Parent(s): 00b5731

Load model during startup for GPU reservation

Files changed (2) hide show

__pycache__/app.cpython-313.pyc CHANGED Viewed

Binary files a/__pycache__/app.cpython-313.pyc and b/__pycache__/app.cpython-313.pyc differ

app.py CHANGED Viewed

@@ -141,6 +141,16 @@ def healthcheck() -> dict[str, str]:
     return {"status": "ok", "model": MODEL_ID}
 @fastapi_app.post("/v1/generate", response_model=GenerateResponse)
 def generate_endpoint(payload: GeneratePayload) -> GenerateResponse:
     try:

     return {"status": "ok", "model": MODEL_ID}
+@fastapi_app.on_event("startup")
+def warm_start() -> None:
+    """Ensure the GPU reservation is established during startup."""
+    try:
+        get_model()
+    except Exception as exc:
+        # Surface the failure early so the container exits with a useful log.
+        raise RuntimeError(f"Model warm-up failed: {exc}") from exc
 @fastapi_app.post("/v1/generate", response_model=GenerateResponse)
 def generate_endpoint(payload: GeneratePayload) -> GenerateResponse:
     try: