Spaces:
Running
Running
File size: 5,561 Bytes
b110593 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 |
//                           _       _
// __      _____  __ ___   ___  __ _| |_ ___
// \ \ /\ / / _ \/ _` \ \ / / |/ _` | __/ _ \
//  \ V  V /  __/ (_| |\ V /| | (_| | ||  __/
//   \_/\_/ \___|\__,_| \_/ |_|\__,_|\__\___|
//
// Copyright © 2016 - 2024 Weaviate B.V. All rights reserved.
//
//  CONTACT: hello@weaviate.io
//
package vectorizer
import (
"context"
"testing"
"github.com/stretchr/testify/assert"
"github.com/stretchr/testify/require"
)
// TestVectorizingTexts exercises the vectorizer's Texts method, as used in the
// nearText searcher. For every table entry it builds a vectorizer around a
// fresh fake client, passes the class-level settings (type, model,
// modelVersion) through a fake class config, and then asserts that:
//   - no error is returned,
//   - the returned vector equals the fixed vector the test expects,
//   - the client received the input texts unchanged, and
//   - the client received the expected type, model and model version.
func TestVectorizingTexts(t *testing.T) {
	type testCase struct {
		name  string
		input []string

		// Settings placed into the class config handed to Texts.
		//
		// Every case uses a modelVersion that doesn't exist on purpose to rule
		// out that it was set by a default, but validate that the version was
		// set explicitly due to
		// https://github.com/weaviate/weaviate/issues/2458
		openAIType   string
		openAIModel  string
		modelVersion string

		// Values the client is expected to have received.
		expectedOpenAIType   string
		expectedOpenAIModel  string
		expectedModelVersion string
	}

	tests := []testCase{
		{
			name:                 "single word",
			input:                []string{"hello"},
			openAIType:           "text",
			expectedOpenAIType:   "text",
			openAIModel:          "ada",
			expectedOpenAIModel:  "ada",
			modelVersion:         "003",
			expectedModelVersion: "003",
		},
		{
			name:                 "multiple words",
			input:                []string{"hello world, this is me!"},
			openAIType:           "text",
			expectedOpenAIType:   "text",
			openAIModel:          "ada",
			expectedOpenAIModel:  "ada",
			modelVersion:         "003",
			expectedModelVersion: "003",
		},
		{
			name:                 "multiple sentences (joined with a dot)",
			input:                []string{"this is sentence 1", "and here's number 2"},
			openAIType:           "text",
			expectedOpenAIType:   "text",
			openAIModel:          "ada",
			expectedOpenAIModel:  "ada",
			modelVersion:         "003",
			expectedModelVersion: "003",
		},
		{
			name:                 "multiple sentences already containing a dot",
			input:                []string{"this is sentence 1.", "and here's number 2"},
			openAIType:           "text",
			expectedOpenAIType:   "text",
			openAIModel:          "ada",
			expectedOpenAIModel:  "ada",
			modelVersion:         "003",
			expectedModelVersion: "003",
		},
		{
			name:                 "multiple sentences already containing a question mark",
			input:                []string{"this is sentence 1?", "and here's number 2"},
			openAIType:           "text",
			expectedOpenAIType:   "text",
			openAIModel:          "ada",
			expectedOpenAIModel:  "ada",
			modelVersion:         "003",
			expectedModelVersion: "003",
		},
		{
			name:                 "multiple sentences already containing an exclamation mark",
			input:                []string{"this is sentence 1!", "and here's number 2"},
			openAIType:           "text",
			expectedOpenAIType:   "text",
			openAIModel:          "ada",
			expectedOpenAIModel:  "ada",
			modelVersion:         "003",
			expectedModelVersion: "003",
		},
		{
			name:                 "multiple sentences already containing comma",
			input:                []string{"this is sentence 1,", "and here's number 2"},
			openAIType:           "text",
			expectedOpenAIType:   "text",
			openAIModel:          "ada",
			expectedOpenAIModel:  "ada",
			modelVersion:         "003",
			expectedModelVersion: "003",
		},
	}

	for _, test := range tests {
		t.Run(test.name, func(t *testing.T) {
			// A fresh fake client per subtest so the recorded lastInput and
			// lastConfig cannot leak from one case into the next.
			client := &fakeClient{}
			v := New(client)

			cfg := &fakeClassConfig{
				classConfig: map[string]interface{}{
					"type":         test.openAIType,
					"model":        test.openAIModel,
					"modelVersion": test.modelVersion,
				},
			}

			vec, err := v.Texts(context.Background(), test.input, cfg)

			// Abort the subtest on error: the remaining assertions inspect
			// state that is only meaningful after a successful call.
			require.NoError(t, err)

			// testify's signature is (t, expected, actual); keeping that order
			// makes failure output label the two values correctly.
			assert.Equal(t, []float32{0.1, 1.1, 2.1, 3.1}, vec)
			assert.Equal(t, test.input, client.lastInput)
			assert.Equal(t, test.expectedOpenAIType, client.lastConfig.Type)
			assert.Equal(t, test.expectedOpenAIModel, client.lastConfig.Model)
			assert.Equal(t, test.expectedModelVersion, client.lastConfig.ModelVersion)
		})
	}
}
|