File size: 768 Bytes
05a2a0c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
## Mini Encoder 

from sentence_transformers import SentenceTransformer

## Model 1: mini-encoder
# Instantiated once at import time; get_embeddings() reuses this instance.
model = SentenceTransformer('sentence-transformers/all-MiniLM-L6-v2')

def get_embeddings(sentences):
    """Encode ``sentences`` with the module-level ``model``.

    Args:
        sentences: Forwarded unchanged to ``model.encode``.

    Returns:
        Whatever ``model.encode(sentences)`` returns.
    """
    return model.encode(sentences)

## Model 2: sentence-transformers/gtr-t5-large
from sentence_transformers import SentenceTransformer

# Instantiated once at import time; get_embeddings_big() reuses this instance.
modelbig = SentenceTransformer("sentence-transformers/gtr-t5-large")

"""
sentences = [
    "That is a happy person",
    "That is a happy dog",
    "That is a very happy person",
    "Today is a sunny day"
]
embeddings = model.encode(sentences)
similarities = model.similarity(embeddings, embeddings)
print(similarities.shape)
# [4, 4]

"""
def get_embeddings_big(sentences):
    """Encode ``sentences`` with the module-level ``modelbig``.

    Args:
        sentences: Forwarded unchanged to ``modelbig.encode``.

    Returns:
        Whatever ``modelbig.encode(sentences)`` returns.
    """
    return modelbig.encode(sentences)