# rag-demo / main.py
# Page header captured from the Hugging Face file viewer (user: moraxgiga;
# commit a067681 "Update main.py", verified; file size 512 Bytes).
import os
import platform
from typing import List

from fastapi import FastAPI, HTTPException
from fastapi.concurrency import run_in_threadpool
from pydantic import BaseModel, root_validator
from transformers import AutoModel
# Directory used to cache the downloaded model files.
CACHE_DIR = 'E:/Documents/AI/.Cache'

# Kept so anything that reads the variable later still sees it.  On its own
# this assignment does not redirect the download: ``transformers`` has already
# been imported by the time it runs, and the library resolves its default cache
# path while importing.  The directory is therefore also passed explicitly via
# ``cache_dir`` below.
os.environ['TRANSFORMERS_CACHE'] = CACHE_DIR

# NOTE(review): ``trust_remote_code=True`` lets the model repository supply
# Python code that is executed locally; consider pinning a ``revision``.
model = AutoModel.from_pretrained(
    'moraxgiga/jina',
    trust_remote_code=True,
    cache_dir=CACHE_DIR,
)

# ASGI application object that the route decorators register against.
app = FastAPI()
# Request schema with a single field, ``prompt``, holding a list of strings.
# No route in the visible part of this file references it.
class Validation(BaseModel):
    # Strings supplied by the caller.
    prompt: List[str]
#Endpoint
@app.post("/jina_embedding")
async def generate_embeddings(text):
    """Encode ``text`` with the module-level ``model`` and return the result.

    Args:
        text: Input forwarded unchanged to ``model.encode``.
            NOTE(review): the parameter has no annotation, so FastAPI is
            expected to read it as a required query parameter rather than a
            JSON body; the ``Validation`` model declared in this file is not
            used here -- confirm which request shape was intended.

    Returns:
        A dict with one key, ``"embeddings"``, holding ``.tolist()`` of
        whatever ``model.encode`` returned (presumably a NumPy array or
        tensor -- verify against the model implementation).
    """
    # ``model.encode`` is a plain synchronous call.  Running it directly in
    # this coroutine would hold the event loop (and every other in-flight
    # request) until inference finishes, so it is handed to the worker
    # thread pool and awaited instead.
    vectors = await run_in_threadpool(model.encode, text)
    return {"embeddings": vectors.tolist()}