Spaces:
Running
Running
File size: 4,376 Bytes
b110593 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 |
// _ _
// __ _____ __ ___ ___ __ _| |_ ___
// \ \ /\ / / _ \/ _` \ \ / / |/ _` | __/ _ \
// \ V V / __/ (_| |\ V /| | (_| | || __/
// \_/\_/ \___|\__,_| \_/ |_|\__,_|\__\___|
//
// Copyright © 2016 - 2024 Weaviate B.V. All rights reserved.
//
// CONTACT: [email protected]
//
package aggregator
import (
"context"
"fmt"
"github.com/pkg/errors"
"github.com/sirupsen/logrus"
"github.com/weaviate/weaviate/adapters/repos/db/helpers"
"github.com/weaviate/weaviate/adapters/repos/db/inverted"
"github.com/weaviate/weaviate/adapters/repos/db/inverted/stopwords"
"github.com/weaviate/weaviate/adapters/repos/db/lsmkv"
"github.com/weaviate/weaviate/entities/aggregation"
"github.com/weaviate/weaviate/entities/schema"
schemaUC "github.com/weaviate/weaviate/usecases/schema"
)
type vectorIndex interface {
SearchByVectorDistance(vector []float32, targetDistance float32, maxLimit int64,
allowList helpers.AllowList) ([]uint64, []float32, error)
SearchByVector(vector []float32, k int, allowList helpers.AllowList) ([]uint64, []float32, error)
}
type Aggregator struct {
logger logrus.FieldLogger
store *lsmkv.Store
params aggregation.Params
getSchema schemaUC.SchemaGetter
classSearcher inverted.ClassSearcher // to support ref-filters
vectorIndex vectorIndex
stopwords stopwords.StopwordDetector
shardVersion uint16
propLenTracker *inverted.JsonShardMetaData
isFallbackToSearchable inverted.IsFallbackToSearchable
tenant string
nestedCrossRefLimit int64
}
func New(store *lsmkv.Store, params aggregation.Params,
getSchema schemaUC.SchemaGetter, classSearcher inverted.ClassSearcher,
stopwords stopwords.StopwordDetector, shardVersion uint16,
vectorIndex vectorIndex, logger logrus.FieldLogger,
propLenTracker *inverted.JsonShardMetaData,
isFallbackToSearchable inverted.IsFallbackToSearchable,
tenant string, nestedCrossRefLimit int64,
) *Aggregator {
return &Aggregator{
logger: logger,
store: store,
params: params,
getSchema: getSchema,
classSearcher: classSearcher,
stopwords: stopwords,
shardVersion: shardVersion,
vectorIndex: vectorIndex,
propLenTracker: propLenTracker,
isFallbackToSearchable: isFallbackToSearchable,
tenant: tenant,
nestedCrossRefLimit: nestedCrossRefLimit,
}
}
func (a *Aggregator) GetPropertyLengthTracker() *inverted.JsonShardMetaData {
return a.propLenTracker
}
func (a *Aggregator) Do(ctx context.Context) (*aggregation.Result, error) {
if a.params.GroupBy != nil {
return newGroupedAggregator(a).Do(ctx)
}
if a.params.Filters != nil || len(a.params.SearchVector) > 0 || a.params.Hybrid != nil {
return newFilteredAggregator(a).Do(ctx)
}
return newUnfilteredAggregator(a).Do(ctx)
}
func (a *Aggregator) aggTypeOfProperty(
name schema.PropertyName,
) (aggregation.PropertyType, schema.DataType, error) {
s := a.getSchema.GetSchemaSkipAuth()
schemaProp, err := s.GetProperty(a.params.ClassName, name)
if err != nil {
return "", "", errors.Wrapf(err, "property %s", name)
}
if schema.IsRefDataType(schemaProp.DataType) {
return aggregation.PropertyTypeReference, schema.DataTypeCRef, nil
}
dt := schema.DataType(schemaProp.DataType[0])
switch dt {
case schema.DataTypeInt, schema.DataTypeNumber, schema.DataTypeIntArray,
schema.DataTypeNumberArray:
return aggregation.PropertyTypeNumerical, dt, nil
case schema.DataTypeBoolean, schema.DataTypeBooleanArray:
return aggregation.PropertyTypeBoolean, dt, nil
case schema.DataTypeText, schema.DataTypeTextArray:
return aggregation.PropertyTypeText, dt, nil
case schema.DataTypeDate, schema.DataTypeDateArray:
return aggregation.PropertyTypeDate, dt, nil
case schema.DataTypeGeoCoordinates:
return "", "", fmt.Errorf("dataType geoCoordinates can't be aggregated")
case schema.DataTypePhoneNumber:
return "", "", fmt.Errorf("dataType phoneNumber can't be aggregated")
default:
return "", "", fmt.Errorf("unrecoginzed dataType %v", schemaProp.DataType[0])
}
}
|