MVPilgrim
restore
6b502ec
raw
history blame
3.17 kB
// _ _
// __ _____ __ ___ ___ __ _| |_ ___
// \ \ /\ / / _ \/ _` \ \ / / |/ _` | __/ _ \
// \ V V / __/ (_| |\ V /| | (_| | || __/
// \_/\_/ \___|\__,_| \_/ |_|\__,_|\__\___|
//
// Copyright © 2016 - 2024 Weaviate B.V. All rights reserved.
//
// CONTACT: [email protected]
//
package clients
import (
"bytes"
"context"
"encoding/json"
"fmt"
"io"
"net/http"
"time"
"github.com/pkg/errors"
"github.com/sirupsen/logrus"
"github.com/weaviate/weaviate/modules/text2vec-transformers/ent"
)
type vectorizer struct {
originPassage string
originQuery string
httpClient *http.Client
logger logrus.FieldLogger
}
func New(originPassage, originQuery string, timeout time.Duration, logger logrus.FieldLogger) *vectorizer {
return &vectorizer{
originPassage: originPassage,
originQuery: originQuery,
httpClient: &http.Client{
Timeout: timeout,
},
logger: logger,
}
}
func (v *vectorizer) VectorizeObject(ctx context.Context, input string,
config ent.VectorizationConfig,
) (*ent.VectorizationResult, error) {
return v.vectorize(ctx, input, config, v.urlPassage)
}
func (v *vectorizer) VectorizeQuery(ctx context.Context, input string,
config ent.VectorizationConfig,
) (*ent.VectorizationResult, error) {
return v.vectorize(ctx, input, config, v.urlQuery)
}
func (v *vectorizer) vectorize(ctx context.Context, input string,
config ent.VectorizationConfig, url func(string) string,
) (*ent.VectorizationResult, error) {
body, err := json.Marshal(vecRequest{
Text: input,
Config: vecRequestConfig{
PoolingStrategy: config.PoolingStrategy,
},
})
if err != nil {
return nil, errors.Wrapf(err, "marshal body")
}
req, err := http.NewRequestWithContext(ctx, "POST", url("/vectors"),
bytes.NewReader(body))
if err != nil {
return nil, errors.Wrap(err, "create POST request")
}
res, err := v.httpClient.Do(req)
if err != nil {
return nil, errors.Wrap(err, "send POST request")
}
defer res.Body.Close()
bodyBytes, err := io.ReadAll(res.Body)
if err != nil {
return nil, errors.Wrap(err, "read response body")
}
var resBody vecRequest
if err := json.Unmarshal(bodyBytes, &resBody); err != nil {
return nil, errors.Wrap(err, "unmarshal response body")
}
if res.StatusCode > 399 {
return nil, errors.Errorf("fail with status %d: %s", res.StatusCode,
resBody.Error)
}
return &ent.VectorizationResult{
Text: resBody.Text,
Dimensions: resBody.Dims,
Vector: resBody.Vector,
}, nil
}
func (v *vectorizer) urlPassage(path string) string {
return fmt.Sprintf("%s%s", v.originPassage, path)
}
func (v *vectorizer) urlQuery(path string) string {
return fmt.Sprintf("%s%s", v.originQuery, path)
}
type vecRequest struct {
Text string `json:"text"`
Dims int `json:"dims"`
Vector []float32 `json:"vector"`
Error string `json:"error"`
Config vecRequestConfig `json:"config"`
}
type vecRequestConfig struct {
PoolingStrategy string `json:"pooling_strategy"`
}