Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
File size: 914 Bytes
4aebf77 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 |
from sentence_transformers import SentenceTransformer
from openai import OpenAI
from dotenv import load_dotenv
# Load variables from a .env file into the process environment before any
# client object is constructed.
load_dotenv()

# Step 1: SentenceTransformer checkpoint backing the local embedding path.
# The multilingual MPNet checkpoint replaced the earlier MiniLM one
# ("sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2").
_HF_MODEL_NAME = "sentence-transformers/paraphrase-multilingual-mpnet-base-v2"
model = SentenceTransformer(_HF_MODEL_NAME)

# OpenAI client built with no explicit arguments; presumably it takes its
# credentials from the environment populated above -- confirm against the
# deployment configuration.
client = OpenAI()
def _get_hf_embedding(text: str) -> list:
    """Embed ``text`` with the module-level SentenceTransformer ``model``.

    Args:
        text: The string to encode.

    Returns:
        The output of ``model.encode(text)`` converted via ``.tolist()``.
    """
    vector = model.encode(text)
    return vector.tolist()
def _get_openai_embedding(text: str) -> list:
    """Embed ``text`` through the OpenAI embeddings endpoint.

    Sends ``text`` as the single input to the ``text-embedding-3-large``
    model using the module-level ``client``.

    Args:
        text: The string to embed.

    Returns:
        The ``embedding`` attribute of the first entry in the response's
        ``data`` list.
    """
    request_args = {
        "model": "text-embedding-3-large",
        "input": text,
    }
    result = client.embeddings.create(**request_args)
    # Only one input was sent, so only the first result entry is read.
    first_entry = result.data[0]
    return first_entry.embedding
def get_embedding(text: str, *, backend: str = "openai") -> list:
    """Return an embedding for ``text`` from the selected backend.

    The backend is chosen per call instead of by editing this function.
    The default keeps the previous behaviour (OpenAI).

    Args:
        text: The string to embed.
        backend: ``"openai"`` to use ``_get_openai_embedding`` (default) or
            ``"hf"`` to use ``_get_hf_embedding``.

    Returns:
        The embedding returned by the chosen backend function.

    Raises:
        ValueError: If ``backend`` is not one of the supported names.
    """
    # NOTE(review): vectors from different backends should presumably not be
    # mixed in one index -- confirm callers use a single backend per store.
    if backend == "openai":
        return _get_openai_embedding(text)
    if backend == "hf":
        return _get_hf_embedding(text)
    raise ValueError(
        f"Unknown embedding backend {backend!r}; expected 'openai' or 'hf'"
    )