Spaces:
Running
Running
// _ _ | |
// __ _____ __ ___ ___ __ _| |_ ___ | |
// \ \ /\ / / _ \/ _` \ \ / / |/ _` | __/ _ \ | |
// \ V V / __/ (_| |\ V /| | (_| | || __/ | |
// \_/\_/ \___|\__,_| \_/ |_|\__,_|\__\___| | |
// | |
// Copyright © 2016 - 2024 Weaviate B.V. All rights reserved. | |
// | |
// CONTACT: [email protected] | |
// | |
package scaler | |
import ( | |
"context" | |
"fmt" | |
"io" | |
"os" | |
"path/filepath" | |
"github.com/weaviate/weaviate/entities/backup" | |
"golang.org/x/sync/errgroup" | |
) | |
// client the client interface is used to communicate with remote nodes | |
type client interface { | |
PutFile(ctx context.Context, hostName, indexName, | |
shardName, fileName string, payload io.ReadSeekCloser) error | |
// CreateShard creates an empty shard on the remote node. | |
// This is required in order to sync files to a specific shard on the remote node. | |
CreateShard(ctx context.Context, | |
hostName, indexName, shardName string) error | |
// ReInitShard re-initialized new shard after all files has been synced to the remote node | |
// Otherwise, it would not recognize the files when | |
// serving traffic later. | |
ReInitShard(ctx context.Context, | |
hostName, indexName, shardName string) error | |
IncreaseReplicationFactor(ctx context.Context, host, class string, dist ShardDist) error | |
} | |
// rsync synchronizes shards with remote nodes | |
type rsync struct { | |
client client | |
cluster cluster | |
persistenceRoot string | |
} | |
func newRSync(c client, cl cluster, rootPath string) *rsync { | |
return &rsync{client: c, cluster: cl, persistenceRoot: rootPath} | |
} | |
// Push pushes local shards of a class to remote nodes | |
func (r *rsync) Push(ctx context.Context, shardsBackups []*backup.ShardDescriptor, dist ShardDist, className string) error { | |
var g errgroup.Group | |
g.SetLimit(_NUMCPU * 2) | |
for _, desc := range shardsBackups { | |
shardName := desc.Name | |
additions := dist[shardName] | |
desc := desc | |
g.Go(func() error { | |
return r.PushShard(ctx, className, desc, additions) | |
}) | |
} | |
return g.Wait() | |
} | |
// PushShard replicates a shard on a set of nodes | |
func (r *rsync) PushShard(ctx context.Context, className string, desc *backup.ShardDescriptor, nodes []string) error { | |
// Iterate over the new target nodes and copy files | |
for _, node := range nodes { | |
host, ok := r.cluster.NodeHostname(node) | |
if !ok { | |
return fmt.Errorf("%w: %q", ErrUnresolvedName, node) | |
} | |
if err := r.client.CreateShard(ctx, host, className, desc.Name); err != nil { | |
return fmt.Errorf("create new shard on remote node %q: %w", node, err) | |
} | |
// Transfer each file that's part of the backup. | |
for _, file := range desc.Files { | |
err := r.PutFile(ctx, file, host, className, desc.Name) | |
if err != nil { | |
return fmt.Errorf("copy files to remote node %q: %w", node, err) | |
} | |
} | |
// Transfer shard metadata files | |
err := r.PutFile(ctx, desc.ShardVersionPath, host, className, desc.Name) | |
if err != nil { | |
return fmt.Errorf("copy shard version to remote node %q: %w", node, err) | |
} | |
err = r.PutFile(ctx, desc.DocIDCounterPath, host, className, desc.Name) | |
if err != nil { | |
return fmt.Errorf("copy index counter to remote node %q: %w", node, err) | |
} | |
err = r.PutFile(ctx, desc.PropLengthTrackerPath, host, className, desc.Name) | |
if err != nil { | |
return fmt.Errorf("copy prop length tracker to remote node %q: %w", node, err) | |
} | |
// Now that all files are on the remote node's new shard, the shard needs | |
// to be reinitialized. Otherwise, it would not recognize the files when | |
// serving traffic later. | |
if err := r.client.ReInitShard(ctx, host, className, desc.Name); err != nil { | |
return fmt.Errorf("create new shard on remote node %q: %w", node, err) | |
} | |
} | |
return nil | |
} | |
func (r *rsync) PutFile(ctx context.Context, sourceFileName string, | |
hostname, className, shardName string, | |
) error { | |
absPath := filepath.Join(r.persistenceRoot, sourceFileName) | |
f, err := os.Open(absPath) | |
if err != nil { | |
return fmt.Errorf("open file %q for reading: %w", absPath, err) | |
} | |
return r.client.PutFile(ctx, hostname, className, shardName, sourceFileName, f) | |
} | |