Spaces:
Running
Running
File size: 2,821 Bytes
6b502ec |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 |
// _ _
// __ _____ __ ___ ___ __ _| |_ ___
// \ \ /\ / / _ \/ _` \ \ / / |/ _` | __/ _ \
// \ V V / __/ (_| |\ V /| | (_| | || __/
// \_/\_/ \___|\__,_| \_/ |_|\__,_|\__\___|
//
// Copyright © 2016 - 2024 Weaviate B.V. All rights reserved.
//
// CONTACT: [email protected]
//
package vectorizer
import (
"context"
"testing"
"github.com/stretchr/testify/assert"
"github.com/stretchr/testify/require"
)
// TestVectorizingTexts is a table-driven test for the Texts method of the
// value returned by New, as used in the nearText searcher.
//
// Each case feeds one or more input strings plus a class config carrying a
// pooling strategy, and checks that:
//   - no error is returned,
//   - the returned vector equals the fixed vector {0, 1, 2, 3}
//     (presumably what fakeClient yields; it is defined elsewhere), and
//   - the pooling strategy recorded in the client's last config matches the
//     expected one.
//
// NOTE(review): several case names mention how sentences are joined, but the
// joined text itself is not asserted here.
func TestVectorizingTexts(t *testing.T) {
	type testCase struct {
		name                    string
		input                   []string
		expectedPoolingStrategy string
		poolingStrategy         string
	}

	tests := []testCase{
		{
			name:                    "single word",
			input:                   []string{"hello"},
			poolingStrategy:         "cls",
			expectedPoolingStrategy: "cls",
		},
		{
			name:                    "multiple words",
			input:                   []string{"hello world, this is me!"},
			poolingStrategy:         "cls",
			expectedPoolingStrategy: "cls",
		},
		{
			name:                    "multiple sentences (joined with a dot)",
			input:                   []string{"this is sentence 1", "and here's number 2"},
			poolingStrategy:         "cls",
			expectedPoolingStrategy: "cls",
		},
		{
			name:                    "multiple sentences already containing a dot",
			input:                   []string{"this is sentence 1.", "and here's number 2"},
			poolingStrategy:         "cls",
			expectedPoolingStrategy: "cls",
		},
		{
			name:                    "multiple sentences already containing a question mark",
			input:                   []string{"this is sentence 1?", "and here's number 2"},
			poolingStrategy:         "cls",
			expectedPoolingStrategy: "cls",
		},
		{
			name:                    "multiple sentences already containing an exclamation mark",
			input:                   []string{"this is sentence 1!", "and here's number 2"},
			poolingStrategy:         "cls",
			expectedPoolingStrategy: "cls",
		},
		{
			name:                    "multiple sentences already containing comma",
			input:                   []string{"this is sentence 1,", "and here's number 2"},
			poolingStrategy:         "cls",
			expectedPoolingStrategy: "cls",
		},
	}

	for _, test := range tests {
		t.Run(test.name, func(t *testing.T) {
			// A fresh fake client per subtest so lastConfig only reflects
			// this case's call.
			client := &fakeClient{}
			v := New(client)

			settings := &fakeClassConfig{
				poolingStrategy: test.poolingStrategy,
			}
			vec, err := v.Texts(context.Background(), test.input, settings)

			// Stop the subtest on error; the remaining assertions would be
			// meaningless without a successful call.
			require.NoError(t, err)
			assert.Equal(t, []float32{0, 1, 2, 3}, vec)
			// testify's argument order is (expected, actual); keeping it
			// right makes failure output label the values correctly.
			assert.Equal(t, test.expectedPoolingStrategy, client.lastConfig.PoolingStrategy)
		})
	}
}
|