| from fastapi import FastAPI, HTTPException |
| from pydantic import BaseModel |
| from sentence_transformers import SentenceTransformer |
| import numpy as np |
|
|
| |
| app = FastAPI() |
|
|
| |
| |
| model = SentenceTransformer("Alibaba-NLP/gte-base-en-v1.5", trust_remote_code=True) |
|
|
| |
| class TextInput(BaseModel): |
| text: str |
|
|
| |
| @app.get("/") |
| async def home(): |
| return {"message": "Welcome to embedded model"} |
|
|
| |
| @app.post("/embed") |
| async def generate_embedding(text_input: TextInput): |
| """ |
| Generate a 768-dimensional embedding for the input text. |
| Returns the embedding in a structured format with rounded values. |
| """ |
| try: |
| |
| embedding = model.encode(text_input.text, convert_to_tensor=True).cpu().numpy() |
|
|
| |
| rounded_embedding = np.round(embedding, decimals=2).tolist() |
|
|
| |
| dimensions = len(rounded_embedding) |
|
|
| |
| return { |
| "dimensions": dimensions, |
| "embeddings": [rounded_embedding] |
| } |
| except Exception as e: |
| |
| raise HTTPException(status_code=500, detail=str(e)) |
|
|
| |
| if __name__ == "__main__": |
| import uvicorn |
| uvicorn.run(app, host="0.0.0.0", port=7860) |