Commit
·
b5db444
1
Parent(s):
b215cfc
Initial model server setup
Browse files- Dockerfile +13 -0
- app.py +40 -0
- requirements.txt +6 -0
Dockerfile
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
FROM python:3.10-slim

# Create an unprivileged account so the API process does not run as root.
# NOTE(review): UID 1000 is chosen to match the user Hugging Face Docker
# Spaces run containers as - confirm against the deployment target.
RUN useradd --create-home --uid 1000 user

WORKDIR /code

# Copy the dependency list first so the pip layer is cached until it changes.
COPY ./requirements.txt /code/requirements.txt

RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt

COPY ./app.py /code/app.py

# Drop privileges for everything that runs from here on (i.e. the server).
USER user

EXPOSE 7860

CMD ["uvicorn","app:app","--host","0.0.0.0","--port","7860"]
|
app.py
ADDED
|
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from fastapi import FastAPI, HTTPException
|
| 2 |
+
from pydantic import BaseModel
|
| 3 |
+
from sentence_transformers import SentenceTransformer
|
| 4 |
+
import logging
|
| 5 |
+
|
| 6 |
+
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

logger.info("Server Starting")

# Load the embedding model once at import time. A failure is tolerated so the
# process still starts; `model` is left as None for the endpoints to check.
logger.info("Loading model")
try:
    model = SentenceTransformer("Sid-the-sloth/leetcode_unixcoder_final")
except Exception:
    # `except Exception` (not a bare `except:`) lets KeyboardInterrupt and
    # SystemExit propagate; logger.exception records the traceback so the
    # cause of the failed load is visible in the logs.
    logger.exception("Failed to load Model")
    model = None
else:
    logger.info("Model Loaded")
|
| 17 |
+
|
| 18 |
+
app=FastAPI()
|
| 19 |
+
|
| 20 |
+
#Req and Response Pydantic models
|
| 21 |
+
# Request body accepted by POST /embed.
class EmbedRequest(BaseModel):
    # Input string that is passed to the model's encode() call.
    text: str
|
| 23 |
+
|
| 24 |
+
# Response body returned by POST /embed.
class EmbedResponse(BaseModel):
    # Encoded vector, converted to a plain list of floats.
    embedding: list[float]
|
| 26 |
+
|
| 27 |
+
@app.get("/")
def root_status():
    # Status probe: always reports "ok" and whether the module-level model
    # object was loaded successfully (i.e. is not None).
    model_loaded = model is not None
    return {"status": "ok", "model": model_loaded}
|
| 30 |
+
|
| 31 |
+
@app.post("/embed", response_model=EmbedResponse)
def get_embedding(request: EmbedRequest):
    """Encode ``request.text`` with the loaded model and return the vector.

    Responds with 503 when the model was not loaded at startup and with 500
    when encoding fails.
    """
    if model is None:
        # The exception must be raised: merely constructing it is a no-op and
        # execution would fall through to `model.encode` on None.
        raise HTTPException(status_code=503, detail="Model could not be loaded")

    try:
        embedding = model.encode(request.text).tolist()
    except Exception as e:
        logger.exception("Error during embedding generation %s", e)
        # Raise (not return) so FastAPI produces a real 500 response instead
        # of trying to serialize the exception object as an EmbedResponse.
        raise HTTPException(
            status_code=500, detail="Error generating embeddings"
        ) from e

    return EmbedResponse(embedding=embedding)
|
requirements.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
fastapi==0.116.1
|
| 2 |
+
uvicorn==0.35.0
|
| 3 |
+
sentence-transformers==5.1.0
|
| 4 |
+
torch==2.8.0
|
| 5 |
+
python-dotenv==1.1.1
|
| 6 |
+
pydantic>=2,<3  # bound the major version; every other dependency here is pinned
|