seaweedfs/weed/server/volume_grpc_client_to_master.go

267 lines
8.5 KiB
Go
Raw Normal View History

2017-01-10 17:01:12 +08:00
package weed_server
import (
"fmt"
2022-05-16 10:41:18 +08:00
"os"
2019-04-15 14:00:37 +08:00
"time"
"github.com/seaweedfs/seaweedfs/weed/operation"
2022-05-16 10:41:18 +08:00
"google.golang.org/grpc"
"github.com/seaweedfs/seaweedfs/weed/pb"
"github.com/seaweedfs/seaweedfs/weed/security"
"github.com/seaweedfs/seaweedfs/weed/storage/backend"
"github.com/seaweedfs/seaweedfs/weed/storage/erasure_coding"
"golang.org/x/net/context"
2017-01-10 17:01:12 +08:00
"github.com/seaweedfs/seaweedfs/weed/glog"
"github.com/seaweedfs/seaweedfs/weed/pb/master_pb"
"github.com/seaweedfs/seaweedfs/weed/util"
2017-01-10 17:01:12 +08:00
)
// GetMaster returns the master address currently stored in vs.currentMaster.
// That field is assigned by doHeartbeat once a heartbeat stream to a master
// has been opened.
func (vs *VolumeServer) GetMaster() pb.ServerAddress {
return vs.currentMaster
}
func (vs *VolumeServer) checkWithMaster() (err error) {
2021-09-11 17:06:30 +08:00
for {
for _, master := range vs.SeedMasterNodes {
err = operation.WithMasterServerClient(false, master, vs.grpcDialOption, func(masterClient master_pb.SeaweedClient) error {
resp, err := masterClient.GetMasterConfiguration(context.Background(), &master_pb.GetMasterConfigurationRequest{})
if err != nil {
return fmt.Errorf("get master %s configuration: %v", master, err)
}
vs.metricsAddress, vs.metricsIntervalSec = resp.MetricsAddress, int(resp.MetricsIntervalSeconds)
backend.LoadFromPbStorageBackends(resp.StorageBackends)
return nil
})
if err == nil {
return
} else {
glog.V(0).Infof("checkWithMaster %s: %v", master, err)
}
}
time.Sleep(1790 * time.Millisecond)
}
}
2017-01-10 17:01:12 +08:00
func (vs *VolumeServer) heartbeat() {
glog.V(0).Infof("Volume server start with seed master nodes: %v", vs.SeedMasterNodes)
2017-01-10 17:01:12 +08:00
vs.store.SetDataCenter(vs.dataCenter)
vs.store.SetRack(vs.rack)
grpcDialOption := security.LoadClientTLS(util.GetViper(), "grpc.volume")
2019-02-19 04:11:52 +08:00
var err error
var newLeader pb.ServerAddress
2020-09-14 12:25:51 +08:00
for vs.isHeartbeating {
for _, master := range vs.SeedMasterNodes {
if newLeader != "" {
// the new leader may actually is the same master
// need to wait a bit before adding itself
time.Sleep(3 * time.Second)
master = newLeader
}
2019-05-28 13:54:58 +08:00
vs.store.MasterAddress = master
newLeader, err = vs.doHeartbeat(master, grpcDialOption, time.Duration(vs.pulseSeconds)*time.Second)
if err != nil {
2022-09-19 09:14:24 +08:00
glog.V(0).Infof("heartbeat to %s error: %v", master, err)
time.Sleep(time.Duration(vs.pulseSeconds) * time.Second)
2019-04-16 00:09:46 +08:00
newLeader = ""
2019-05-28 13:54:58 +08:00
vs.store.MasterAddress = ""
}
2020-09-14 12:25:51 +08:00
if !vs.isHeartbeating {
break
}
2017-01-10 17:01:12 +08:00
}
}
}
2020-09-14 12:25:51 +08:00
func (vs *VolumeServer) StopHeartbeat() (isAlreadyStopping bool) {
if !vs.isHeartbeating {
return true
}
vs.isHeartbeating = false
close(vs.stopChan)
2020-09-14 12:25:51 +08:00
return false
}
func (vs *VolumeServer) doHeartbeat(masterAddress pb.ServerAddress, grpcDialOption grpc.DialOption, sleepInterval time.Duration) (newLeader pb.ServerAddress, err error) {
2017-01-10 17:01:12 +08:00
ctx, cancel := context.WithCancel(context.Background())
defer cancel()
grpcConnection, err := pb.GrpcDial(ctx, masterAddress.ToGrpcAddress(), false, grpcDialOption)
2017-01-10 17:01:12 +08:00
if err != nil {
return "", fmt.Errorf("fail to dial %s : %v", masterAddress, err)
2017-01-10 17:01:12 +08:00
}
defer grpcConnection.Close()
2017-01-10 17:01:12 +08:00
client := master_pb.NewSeaweedClient(grpcConnection)
stream, err := client.SendHeartbeat(ctx)
2017-01-10 17:01:12 +08:00
if err != nil {
glog.V(0).Infof("SendHeartbeat to %s: %v", masterAddress, err)
return "", err
2017-01-10 17:01:12 +08:00
}
glog.V(0).Infof("Heartbeat to: %v", masterAddress)
vs.currentMaster = masterAddress
2017-01-10 17:01:12 +08:00
doneChan := make(chan error, 1)
2017-01-10 17:01:12 +08:00
go func() {
for {
in, err := stream.Recv()
if err != nil {
doneChan <- err
2017-01-10 17:01:12 +08:00
return
}
if len(in.DuplicatedUuids) > 0 {
2022-06-10 22:03:11 +08:00
var duplicateDir []string
for _, loc := range vs.store.Locations {
for _, uuid := range in.DuplicatedUuids {
if uuid == loc.DirectoryUuid {
2022-06-10 22:03:11 +08:00
duplicateDir = append(duplicateDir, loc.Directory)
}
}
}
2022-06-10 22:03:11 +08:00
glog.Errorf("Shut down Volume Server due to duplicate volume directories: %v", duplicateDir)
os.Exit(1)
2022-05-16 10:41:18 +08:00
}
if in.GetVolumeSizeLimit() != 0 && vs.store.GetVolumeSizeLimit() != in.GetVolumeSizeLimit() {
2019-04-15 14:00:37 +08:00
vs.store.SetVolumeSizeLimit(in.GetVolumeSizeLimit())
if vs.store.MaybeAdjustVolumeMax() {
if err = stream.Send(vs.store.CollectHeartbeat()); err != nil {
glog.V(0).Infof("Volume Server Failed to talk with master %s: %v", vs.currentMaster, err)
2021-09-11 17:06:43 +08:00
return
}
}
}
if in.GetLeader() != "" && string(vs.currentMaster) != in.GetLeader() {
glog.V(0).Infof("Volume Server found a new master newLeader: %v instead of %v", in.GetLeader(), vs.currentMaster)
newLeader = pb.ServerAddress(in.GetLeader())
doneChan <- nil
return
}
2017-01-10 17:01:12 +08:00
}
}()
if err = stream.Send(vs.store.CollectHeartbeat()); err != nil {
glog.V(0).Infof("Volume Server Failed to talk with master %s: %v", masterAddress, err)
return "", err
}
if err = stream.Send(vs.store.CollectErasureCodingHeartbeat()); err != nil {
glog.V(0).Infof("Volume Server Failed to talk with master %s: %v", masterAddress, err)
return "", err
}
volumeTickChan := time.NewTicker(sleepInterval)
ecShardTickChan := time.NewTicker(17 * sleepInterval)
dataCenter := vs.store.GetDataCenter()
rack := vs.store.GetRack()
ip := vs.store.Ip
port := uint32(vs.store.Port)
2017-01-10 17:01:12 +08:00
for {
select {
2019-04-21 02:35:20 +08:00
case volumeMessage := <-vs.store.NewVolumesChan:
deltaBeat := &master_pb.Heartbeat{
Ip: ip,
Port: port,
DataCenter: dataCenter,
Rack: rack,
2019-04-30 11:22:19 +08:00
NewVolumes: []*master_pb.VolumeShortInformationMessage{
2019-04-21 02:35:20 +08:00
&volumeMessage,
},
}
2021-09-12 03:59:15 +08:00
glog.V(0).Infof("volume server %s:%d adds volume %d", vs.store.Ip, vs.store.Port, volumeMessage.Id)
if err = stream.Send(deltaBeat); err != nil {
glog.V(0).Infof("Volume Server Failed to update to master %s: %v", masterAddress, err)
return "", err
}
case ecShardMessage := <-vs.store.NewEcShardsChan:
deltaBeat := &master_pb.Heartbeat{
Ip: ip,
Port: port,
DataCenter: dataCenter,
Rack: rack,
NewEcShards: []*master_pb.VolumeEcShardInformationMessage{
&ecShardMessage,
},
}
2021-09-12 03:59:15 +08:00
glog.V(0).Infof("volume server %s:%d adds ec shard %d:%d", vs.store.Ip, vs.store.Port, ecShardMessage.Id,
erasure_coding.ShardBits(ecShardMessage.EcIndexBits).ShardIds())
if err = stream.Send(deltaBeat); err != nil {
glog.V(0).Infof("Volume Server Failed to update to master %s: %v", masterAddress, err)
return "", err
}
2019-04-21 02:35:20 +08:00
case volumeMessage := <-vs.store.DeletedVolumesChan:
deltaBeat := &master_pb.Heartbeat{
Ip: ip,
Port: port,
DataCenter: dataCenter,
Rack: rack,
2019-04-30 11:22:19 +08:00
DeletedVolumes: []*master_pb.VolumeShortInformationMessage{
2019-04-21 02:35:20 +08:00
&volumeMessage,
},
}
2021-09-12 03:59:15 +08:00
glog.V(0).Infof("volume server %s:%d deletes volume %d", vs.store.Ip, vs.store.Port, volumeMessage.Id)
if err = stream.Send(deltaBeat); err != nil {
glog.V(0).Infof("Volume Server Failed to update to master %s: %v", masterAddress, err)
return "", err
}
case ecShardMessage := <-vs.store.DeletedEcShardsChan:
deltaBeat := &master_pb.Heartbeat{
Ip: ip,
Port: port,
DataCenter: dataCenter,
Rack: rack,
DeletedEcShards: []*master_pb.VolumeEcShardInformationMessage{
&ecShardMessage,
},
}
2021-09-12 03:59:15 +08:00
glog.V(0).Infof("volume server %s:%d deletes ec shard %d:%d", vs.store.Ip, vs.store.Port, ecShardMessage.Id,
erasure_coding.ShardBits(ecShardMessage.EcIndexBits).ShardIds())
if err = stream.Send(deltaBeat); err != nil {
glog.V(0).Infof("Volume Server Failed to update to master %s: %v", masterAddress, err)
return "", err
}
case <-volumeTickChan.C:
2020-09-14 12:25:51 +08:00
glog.V(4).Infof("volume server %s:%d heartbeat", vs.store.Ip, vs.store.Port)
vs.store.MaybeAdjustVolumeMax()
2020-09-14 12:25:51 +08:00
if err = stream.Send(vs.store.CollectHeartbeat()); err != nil {
glog.V(0).Infof("Volume Server Failed to talk with master %s: %v", masterAddress, err)
2020-09-14 12:25:51 +08:00
return "", err
}
case <-ecShardTickChan.C:
2020-08-31 11:12:04 +08:00
glog.V(4).Infof("volume server %s:%d ec heartbeat", vs.store.Ip, vs.store.Port)
if err = stream.Send(vs.store.CollectErasureCodingHeartbeat()); err != nil {
glog.V(0).Infof("Volume Server Failed to talk with master %s: %v", masterAddress, err)
return "", err
}
case err = <-doneChan:
return
2020-09-14 12:25:51 +08:00
case <-vs.stopChan:
var volumeMessages []*master_pb.VolumeInformationMessage
emptyBeat := &master_pb.Heartbeat{
Ip: ip,
Port: port,
2021-02-18 12:57:08 +08:00
PublicUrl: vs.store.PublicUrl,
MaxFileKey: uint64(0),
DataCenter: dataCenter,
Rack: rack,
2021-02-18 12:57:08 +08:00
Volumes: volumeMessages,
HasNoVolumes: len(volumeMessages) == 0,
}
2020-10-31 06:21:54 +08:00
glog.V(1).Infof("volume server %s:%d stops and deletes all volumes", vs.store.Ip, vs.store.Port)
if err = stream.Send(emptyBeat); err != nil {
glog.V(0).Infof("Volume Server Failed to update to master %s: %v", masterAddress, err)
return "", err
}
2020-09-14 12:25:51 +08:00
return
2017-01-10 17:01:12 +08:00
}
}
}