Spaces:
Running
Running
File size: 811 Bytes
b110593 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 |
// _ _
// __ _____ __ ___ ___ __ _| |_ ___
// \ \ /\ / / _ \/ _` \ \ / / |/ _` | __/ _ \
// \ V V / __/ (_| |\ V /| | (_| | || __/
// \_/\_/ \___|\__,_| \_/ |_|\__,_|\__\___|
//
// Copyright © 2016 - 2024 Weaviate B.V. All rights reserved.
//
// CONTACT: hello@weaviate.io
//
package classification
// TODO: This code is duplicated across weaviate and contextionary, which makes
// changes risky. Can we find a single source of truth for this logic?
import (
"strings"
"unicode"
)
// newSplitter returns a pointer to a fresh splitter. The type has no fields,
// so there is nothing to configure.
func newSplitter() *splitter {
	return new(splitter)
}
// splitter tokenizes free text into words. It carries no state, so the zero
// value is ready to use.
type splitter struct{}

// Split cuts corpus into tokens made up solely of Unicode letters and
// numbers. Every other rune (whitespace, punctuation, symbols, ...) acts as a
// separator, and runs of separators never produce empty tokens. If corpus
// contains no letter or number at all, the result is an empty slice.
func (s *splitter) Split(corpus string) []string {
	// A rune separates tokens unless it is a letter or a number.
	isSeparator := func(r rune) bool {
		if unicode.IsLetter(r) || unicode.IsNumber(r) {
			return false
		}
		return true
	}

	return strings.FieldsFunc(corpus, isSeparator)
}
|