2017-01-10 09:01:12 +00:00
|
|
|
package weed_server
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
2019-04-15 06:00:37 +00:00
|
|
|
"time"
|
|
|
|
|
2020-01-29 17:09:55 +00:00
|
|
|
"google.golang.org/grpc"
|
|
|
|
|
2020-03-04 08:39:47 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/pb"
|
2019-02-18 20:11:52 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/security"
|
2019-11-29 09:05:09 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/storage/backend"
|
2019-05-24 20:28:44 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/storage/erasure_coding"
|
2020-01-29 17:09:55 +00:00
|
|
|
|
|
|
|
"golang.org/x/net/context"
|
2017-01-10 09:01:12 +00:00
|
|
|
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/glog"
|
2018-05-10 06:11:54 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/pb/master_pb"
|
2018-07-04 02:07:55 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/util"
|
2017-01-10 09:01:12 +00:00
|
|
|
)
|
|
|
|
|
2018-06-01 07:39:39 +00:00
|
|
|
func (vs *VolumeServer) GetMaster() string {
|
|
|
|
return vs.currentMaster
|
|
|
|
}
|
2017-01-10 09:01:12 +00:00
|
|
|
func (vs *VolumeServer) heartbeat() {
|
|
|
|
|
2019-05-28 04:22:23 +00:00
|
|
|
glog.V(0).Infof("Volume server start with seed master nodes: %v", vs.SeedMasterNodes)
|
2017-01-10 09:01:12 +00:00
|
|
|
vs.store.SetDataCenter(vs.dataCenter)
|
|
|
|
vs.store.SetRack(vs.rack)
|
|
|
|
|
2020-01-29 17:09:55 +00:00
|
|
|
grpcDialOption := security.LoadClientTLS(util.GetViper(), "grpc.volume")
|
2019-02-18 20:11:52 +00:00
|
|
|
|
2018-06-01 07:39:39 +00:00
|
|
|
var err error
|
|
|
|
var newLeader string
|
2017-01-10 09:01:12 +00:00
|
|
|
for {
|
2019-05-28 04:22:23 +00:00
|
|
|
for _, master := range vs.SeedMasterNodes {
|
2018-06-01 07:39:39 +00:00
|
|
|
if newLeader != "" {
|
2020-04-29 00:29:10 +00:00
|
|
|
// the new leader may actually is the same master
|
|
|
|
// need to wait a bit before adding itself
|
|
|
|
time.Sleep(3 * time.Second)
|
2018-06-01 07:39:39 +00:00
|
|
|
master = newLeader
|
|
|
|
}
|
2020-03-04 08:39:47 +00:00
|
|
|
masterGrpcAddress, parseErr := pb.ParseServerToGrpcAddress(master)
|
2019-01-18 22:14:47 +00:00
|
|
|
if parseErr != nil {
|
2019-04-16 08:15:30 +00:00
|
|
|
glog.V(0).Infof("failed to parse master grpc %v: %v", masterGrpcAddress, parseErr)
|
2019-01-18 22:14:47 +00:00
|
|
|
continue
|
|
|
|
}
|
2019-05-28 05:54:58 +00:00
|
|
|
vs.store.MasterAddress = master
|
2020-02-26 06:23:59 +00:00
|
|
|
newLeader, err = vs.doHeartbeat(master, masterGrpcAddress, grpcDialOption, time.Duration(vs.pulseSeconds)*time.Second)
|
2018-06-01 07:39:39 +00:00
|
|
|
if err != nil {
|
|
|
|
glog.V(0).Infof("heartbeat error: %v", err)
|
|
|
|
time.Sleep(time.Duration(vs.pulseSeconds) * time.Second)
|
2019-04-15 16:09:46 +00:00
|
|
|
newLeader = ""
|
2019-05-28 05:54:58 +00:00
|
|
|
vs.store.MasterAddress = ""
|
2018-06-01 07:39:39 +00:00
|
|
|
}
|
2017-01-10 09:01:12 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-02-26 06:23:59 +00:00
|
|
|
func (vs *VolumeServer) doHeartbeat(masterNode, masterGrpcAddress string, grpcDialOption grpc.DialOption, sleepInterval time.Duration) (newLeader string, err error) {
|
2017-01-10 09:01:12 +00:00
|
|
|
|
2020-03-04 08:39:47 +00:00
|
|
|
grpcConection, err := pb.GrpcDial(context.Background(), masterGrpcAddress, grpcDialOption)
|
2017-01-10 09:01:12 +00:00
|
|
|
if err != nil {
|
2019-01-11 10:23:31 +00:00
|
|
|
return "", fmt.Errorf("fail to dial %s : %v", masterNode, err)
|
2017-01-10 09:01:12 +00:00
|
|
|
}
|
|
|
|
defer grpcConection.Close()
|
|
|
|
|
2018-05-10 06:11:54 +00:00
|
|
|
client := master_pb.NewSeaweedClient(grpcConection)
|
2020-02-26 06:23:59 +00:00
|
|
|
stream, err := client.SendHeartbeat(context.Background())
|
2017-01-10 09:01:12 +00:00
|
|
|
if err != nil {
|
2018-06-01 07:39:39 +00:00
|
|
|
glog.V(0).Infof("SendHeartbeat to %s: %v", masterNode, err)
|
|
|
|
return "", err
|
2017-01-10 09:01:12 +00:00
|
|
|
}
|
2018-06-01 07:39:39 +00:00
|
|
|
glog.V(0).Infof("Heartbeat to: %v", masterNode)
|
|
|
|
vs.currentMaster = masterNode
|
2017-01-10 09:01:12 +00:00
|
|
|
|
2017-01-10 09:30:00 +00:00
|
|
|
doneChan := make(chan error, 1)
|
|
|
|
|
2017-01-10 09:01:12 +00:00
|
|
|
go func() {
|
|
|
|
for {
|
|
|
|
in, err := stream.Recv()
|
|
|
|
if err != nil {
|
2017-01-10 09:30:00 +00:00
|
|
|
doneChan <- err
|
2017-01-10 09:01:12 +00:00
|
|
|
return
|
|
|
|
}
|
2020-03-22 23:21:42 +00:00
|
|
|
if in.GetVolumeSizeLimit() != 0 && vs.store.GetVolumeSizeLimit() != in.GetVolumeSizeLimit() {
|
2019-04-15 06:00:37 +00:00
|
|
|
vs.store.SetVolumeSizeLimit(in.GetVolumeSizeLimit())
|
2020-03-22 23:21:42 +00:00
|
|
|
if vs.store.MaybeAdjustVolumeMax() {
|
|
|
|
if err = stream.Send(vs.store.CollectHeartbeat()); err != nil {
|
2020-08-06 16:48:54 +00:00
|
|
|
glog.V(0).Infof("Volume Server Failed to talk with master %s: %v", vs.currentMaster, err)
|
2020-03-22 23:21:42 +00:00
|
|
|
}
|
|
|
|
}
|
2017-01-23 05:36:36 +00:00
|
|
|
}
|
2020-08-06 16:48:54 +00:00
|
|
|
if in.GetLeader() != "" && vs.currentMaster != in.GetLeader() {
|
|
|
|
glog.V(0).Infof("Volume Server found a new master newLeader: %v instead of %v", in.GetLeader(), vs.currentMaster)
|
2018-06-01 07:39:39 +00:00
|
|
|
newLeader = in.GetLeader()
|
2017-01-18 17:34:27 +00:00
|
|
|
doneChan <- nil
|
|
|
|
return
|
|
|
|
}
|
2019-06-17 21:51:47 +00:00
|
|
|
if in.GetMetricsAddress() != "" && vs.MetricsAddress != in.GetMetricsAddress() {
|
|
|
|
vs.MetricsAddress = in.GetMetricsAddress()
|
|
|
|
vs.MetricsIntervalSec = int(in.GetMetricsIntervalSeconds())
|
|
|
|
}
|
2019-11-29 09:05:09 +00:00
|
|
|
if len(in.StorageBackends) > 0 {
|
|
|
|
backend.LoadFromPbStorageBackends(in.StorageBackends)
|
|
|
|
}
|
2017-01-10 09:01:12 +00:00
|
|
|
}
|
|
|
|
}()
|
|
|
|
|
2017-01-10 09:30:00 +00:00
|
|
|
if err = stream.Send(vs.store.CollectHeartbeat()); err != nil {
|
|
|
|
glog.V(0).Infof("Volume Server Failed to talk with master %s: %v", masterNode, err)
|
2018-06-01 07:39:39 +00:00
|
|
|
return "", err
|
2017-01-10 09:30:00 +00:00
|
|
|
}
|
|
|
|
|
2019-05-22 05:41:20 +00:00
|
|
|
if err = stream.Send(vs.store.CollectErasureCodingHeartbeat()); err != nil {
|
|
|
|
glog.V(0).Infof("Volume Server Failed to talk with master %s: %v", masterNode, err)
|
|
|
|
return "", err
|
|
|
|
}
|
|
|
|
|
|
|
|
volumeTickChan := time.Tick(sleepInterval)
|
|
|
|
ecShardTickChan := time.Tick(17 * sleepInterval)
|
2017-01-10 09:30:00 +00:00
|
|
|
|
2017-01-10 09:01:12 +00:00
|
|
|
for {
|
2017-01-10 09:30:00 +00:00
|
|
|
select {
|
2019-04-20 18:35:20 +00:00
|
|
|
case volumeMessage := <-vs.store.NewVolumesChan:
|
2018-08-24 08:26:56 +00:00
|
|
|
deltaBeat := &master_pb.Heartbeat{
|
2019-04-30 03:22:19 +00:00
|
|
|
NewVolumes: []*master_pb.VolumeShortInformationMessage{
|
2019-04-20 18:35:20 +00:00
|
|
|
&volumeMessage,
|
|
|
|
},
|
2018-08-24 08:26:56 +00:00
|
|
|
}
|
2019-04-20 18:35:20 +00:00
|
|
|
glog.V(1).Infof("volume server %s:%d adds volume %d", vs.store.Ip, vs.store.Port, volumeMessage.Id)
|
2018-08-24 08:26:56 +00:00
|
|
|
if err = stream.Send(deltaBeat); err != nil {
|
|
|
|
glog.V(0).Infof("Volume Server Failed to update to master %s: %v", masterNode, err)
|
|
|
|
return "", err
|
|
|
|
}
|
2019-05-22 05:41:20 +00:00
|
|
|
case ecShardMessage := <-vs.store.NewEcShardsChan:
|
|
|
|
deltaBeat := &master_pb.Heartbeat{
|
|
|
|
NewEcShards: []*master_pb.VolumeEcShardInformationMessage{
|
|
|
|
&ecShardMessage,
|
|
|
|
},
|
|
|
|
}
|
2019-05-24 20:28:44 +00:00
|
|
|
glog.V(1).Infof("volume server %s:%d adds ec shard %d:%d", vs.store.Ip, vs.store.Port, ecShardMessage.Id,
|
|
|
|
erasure_coding.ShardBits(ecShardMessage.EcIndexBits).ShardIds())
|
2019-05-22 05:41:20 +00:00
|
|
|
if err = stream.Send(deltaBeat); err != nil {
|
|
|
|
glog.V(0).Infof("Volume Server Failed to update to master %s: %v", masterNode, err)
|
|
|
|
return "", err
|
|
|
|
}
|
2019-04-20 18:35:20 +00:00
|
|
|
case volumeMessage := <-vs.store.DeletedVolumesChan:
|
2018-08-24 08:26:56 +00:00
|
|
|
deltaBeat := &master_pb.Heartbeat{
|
2019-04-30 03:22:19 +00:00
|
|
|
DeletedVolumes: []*master_pb.VolumeShortInformationMessage{
|
2019-04-20 18:35:20 +00:00
|
|
|
&volumeMessage,
|
|
|
|
},
|
2018-08-24 08:26:56 +00:00
|
|
|
}
|
2019-04-20 18:35:20 +00:00
|
|
|
glog.V(1).Infof("volume server %s:%d deletes volume %d", vs.store.Ip, vs.store.Port, volumeMessage.Id)
|
2018-08-24 08:26:56 +00:00
|
|
|
if err = stream.Send(deltaBeat); err != nil {
|
|
|
|
glog.V(0).Infof("Volume Server Failed to update to master %s: %v", masterNode, err)
|
|
|
|
return "", err
|
|
|
|
}
|
2019-05-22 05:41:20 +00:00
|
|
|
case ecShardMessage := <-vs.store.DeletedEcShardsChan:
|
|
|
|
deltaBeat := &master_pb.Heartbeat{
|
|
|
|
DeletedEcShards: []*master_pb.VolumeEcShardInformationMessage{
|
|
|
|
&ecShardMessage,
|
|
|
|
},
|
|
|
|
}
|
2019-05-24 20:28:44 +00:00
|
|
|
glog.V(1).Infof("volume server %s:%d deletes ec shard %d:%d", vs.store.Ip, vs.store.Port, ecShardMessage.Id,
|
|
|
|
erasure_coding.ShardBits(ecShardMessage.EcIndexBits).ShardIds())
|
2019-05-22 05:41:20 +00:00
|
|
|
if err = stream.Send(deltaBeat); err != nil {
|
|
|
|
glog.V(0).Infof("Volume Server Failed to update to master %s: %v", masterNode, err)
|
|
|
|
return "", err
|
|
|
|
}
|
|
|
|
case <-volumeTickChan:
|
2020-08-26 11:16:11 +00:00
|
|
|
if vs.SendHeartbeat {
|
2020-08-31 03:12:04 +00:00
|
|
|
glog.V(4).Infof("volume server %s:%d heartbeat", vs.store.Ip, vs.store.Port)
|
2020-08-26 11:16:11 +00:00
|
|
|
if err = stream.Send(vs.store.CollectHeartbeat()); err != nil {
|
|
|
|
glog.V(0).Infof("Volume Server Failed to talk with master %s: %v", masterNode, err)
|
|
|
|
return "", err
|
|
|
|
}
|
|
|
|
} else {
|
2020-08-31 03:12:04 +00:00
|
|
|
glog.V(4).Infof("volume server %s:%d skip send heartbeat", vs.store.Ip, vs.store.Port)
|
2017-01-10 09:30:00 +00:00
|
|
|
}
|
2019-05-22 05:41:20 +00:00
|
|
|
case <-ecShardTickChan:
|
2020-08-31 03:12:04 +00:00
|
|
|
glog.V(4).Infof("volume server %s:%d ec heartbeat", vs.store.Ip, vs.store.Port)
|
2019-05-22 05:41:20 +00:00
|
|
|
if err = stream.Send(vs.store.CollectErasureCodingHeartbeat()); err != nil {
|
|
|
|
glog.V(0).Infof("Volume Server Failed to talk with master %s: %v", masterNode, err)
|
|
|
|
return "", err
|
|
|
|
}
|
2019-01-07 08:09:15 +00:00
|
|
|
case err = <-doneChan:
|
2018-06-01 07:39:39 +00:00
|
|
|
return
|
2017-01-10 09:01:12 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|