KevinStephenson
Adding in weaviate code
b110593
raw
history blame
1.2 kB
// _ _
// __ _____ __ ___ ___ __ _| |_ ___
// \ \ /\ / / _ \/ _` \ \ / / |/ _` | __/ _ \
// \ V V / __/ (_| |\ V /| | (_| | || __/
// \_/\_/ \___|\__,_| \_/ |_|\__,_|\__\___|
//
// Copyright © 2016 - 2024 Weaviate B.V. All rights reserved.
//
// CONTACT: [email protected]
//
package clients
import (
"fmt"
"strings"
"github.com/pkoukk/tiktoken-go"
)
func getTokensCount(model string, messages []message) (int, error) {
tke, err := tiktoken.EncodingForModel(model)
if err != nil {
return 0, fmt.Errorf("encoding for model %s: %w", model, err)
}
tokensPerMessage := 3
if strings.HasPrefix(model, "gpt-3.5-turbo") {
tokensPerMessage = 4
}
tokensPerName := 1
if strings.HasPrefix(model, "gpt-3.5-turbo") {
tokensPerName = -1
}
tokensCount := 3
for _, message := range messages {
tokensCount += tokensPerMessage
tokensCount += len(tke.Encode(message.Role, nil, nil))
tokensCount += len(tke.Encode(message.Content, nil, nil))
if message.Name != "" {
tokensCount += tokensPerName
tokensCount += len(tke.Encode(message.Name, nil, nil))
}
}
return tokensCount, nil
}