mirror of
https://github.com/seaweedfs/seaweedfs.git
synced 2024-01-19 02:48:24 +00:00
Merge pull request #3338 from kmlebedev/issues/3083
Roll back the onPeerUpdate-based implementation of automatic clean-up of failed raft servers in favor of a synchronous ping
This commit is contained in:
commit
b59bc607bf
|
@ -102,7 +102,7 @@ func (ma *MetaAggregator) loopSubscribeToOneFiler(f *Filer, self pb.ServerAddres
|
||||||
if err != nil {
|
if err != nil {
|
||||||
errLvl := glog.Level(0)
|
errLvl := glog.Level(0)
|
||||||
if strings.Contains(err.Error(), "duplicated local subscription detected") {
|
if strings.Contains(err.Error(), "duplicated local subscription detected") {
|
||||||
errLvl = glog.Level(1)
|
errLvl = glog.Level(4)
|
||||||
}
|
}
|
||||||
glog.V(errLvl).Infof("subscribing remote %s meta change: %v", peer, err)
|
glog.V(errLvl).Infof("subscribing remote %s meta change: %v", peer, err)
|
||||||
}
|
}
|
||||||
|
|
|
@ -1,7 +1,6 @@
|
||||||
package weed_server
|
package weed_server
|
||||||
|
|
||||||
import (
|
import (
|
||||||
"context"
|
|
||||||
"fmt"
|
"fmt"
|
||||||
"github.com/seaweedfs/seaweedfs/weed/stats"
|
"github.com/seaweedfs/seaweedfs/weed/stats"
|
||||||
"net/http"
|
"net/http"
|
||||||
|
@ -32,9 +31,8 @@ import (
|
||||||
)
|
)
|
||||||
|
|
||||||
const (
|
const (
|
||||||
SequencerType = "master.sequencer.type"
|
SequencerType = "master.sequencer.type"
|
||||||
SequencerSnowflakeId = "master.sequencer.sequencer_snowflake_id"
|
SequencerSnowflakeId = "master.sequencer.sequencer_snowflake_id"
|
||||||
RaftServerRemovalTime = 72 * time.Minute
|
|
||||||
)
|
)
|
||||||
|
|
||||||
type MasterOption struct {
|
type MasterOption struct {
|
||||||
|
@ -65,9 +63,6 @@ type MasterServer struct {
|
||||||
|
|
||||||
boundedLeaderChan chan int
|
boundedLeaderChan chan int
|
||||||
|
|
||||||
onPeerUpdateDoneCn chan string
|
|
||||||
onPeerUpdateDoneCnExist bool
|
|
||||||
|
|
||||||
// notifying clients
|
// notifying clients
|
||||||
clientChansLock sync.RWMutex
|
clientChansLock sync.RWMutex
|
||||||
clientChans map[string]chan *master_pb.KeepConnectedResponse
|
clientChans map[string]chan *master_pb.KeepConnectedResponse
|
||||||
|
@ -118,7 +113,6 @@ func NewMasterServer(r *mux.Router, option *MasterOption, peers map[string]pb.Se
|
||||||
Cluster: cluster.NewCluster(),
|
Cluster: cluster.NewCluster(),
|
||||||
}
|
}
|
||||||
ms.boundedLeaderChan = make(chan int, 16)
|
ms.boundedLeaderChan = make(chan int, 16)
|
||||||
ms.onPeerUpdateDoneCn = make(chan string)
|
|
||||||
|
|
||||||
ms.MasterClient.OnPeerUpdate = ms.OnPeerUpdate
|
ms.MasterClient.OnPeerUpdate = ms.OnPeerUpdate
|
||||||
|
|
||||||
|
@ -351,50 +345,18 @@ func (ms *MasterServer) OnPeerUpdate(update *master_pb.ClusterNodeUpdate, startF
|
||||||
peerAddress := pb.ServerAddress(update.Address)
|
peerAddress := pb.ServerAddress(update.Address)
|
||||||
peerName := string(peerAddress)
|
peerName := string(peerAddress)
|
||||||
isLeader := ms.Topo.HashicorpRaft.State() == hashicorpRaft.Leader
|
isLeader := ms.Topo.HashicorpRaft.State() == hashicorpRaft.Leader
|
||||||
if update.IsAdd {
|
if update.IsAdd && isLeader {
|
||||||
if isLeader {
|
raftServerFound := false
|
||||||
raftServerFound := false
|
for _, server := range ms.Topo.HashicorpRaft.GetConfiguration().Configuration().Servers {
|
||||||
for _, server := range ms.Topo.HashicorpRaft.GetConfiguration().Configuration().Servers {
|
if string(server.ID) == peerName {
|
||||||
if string(server.ID) == peerName {
|
raftServerFound = true
|
||||||
raftServerFound = true
|
|
||||||
}
|
|
||||||
}
|
|
||||||
if !raftServerFound {
|
|
||||||
glog.V(0).Infof("adding new raft server: %s", peerName)
|
|
||||||
ms.Topo.HashicorpRaft.AddVoter(
|
|
||||||
hashicorpRaft.ServerID(peerName),
|
|
||||||
hashicorpRaft.ServerAddress(peerAddress.ToGrpcAddress()), 0, 0)
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if ms.onPeerUpdateDoneCnExist {
|
if !raftServerFound {
|
||||||
ms.onPeerUpdateDoneCn <- peerName
|
glog.V(0).Infof("adding new raft server: %s", peerName)
|
||||||
|
ms.Topo.HashicorpRaft.AddVoter(
|
||||||
|
hashicorpRaft.ServerID(peerName),
|
||||||
|
hashicorpRaft.ServerAddress(peerAddress.ToGrpcAddress()), 0, 0)
|
||||||
}
|
}
|
||||||
} else if isLeader {
|
|
||||||
go func(peerName string) {
|
|
||||||
raftServerRemovalTimeAfter := time.After(RaftServerRemovalTime)
|
|
||||||
for {
|
|
||||||
select {
|
|
||||||
case <-raftServerRemovalTimeAfter:
|
|
||||||
err := ms.MasterClient.WithClient(false, func(client master_pb.SeaweedClient) error {
|
|
||||||
_, err := client.RaftRemoveServer(context.Background(), &master_pb.RaftRemoveServerRequest{
|
|
||||||
Id: peerName,
|
|
||||||
Force: false,
|
|
||||||
})
|
|
||||||
return err
|
|
||||||
})
|
|
||||||
if err != nil {
|
|
||||||
glog.Warningf("failed to removing old raft server %s: %v", peerName, err)
|
|
||||||
}
|
|
||||||
glog.V(0).Infof("old raft server %s removed", peerName)
|
|
||||||
return
|
|
||||||
case peerDone := <-ms.onPeerUpdateDoneCn:
|
|
||||||
if peerName == peerDone {
|
|
||||||
glog.V(0).Infof("raft server %s remove canceled", peerName)
|
|
||||||
return
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}(peerName)
|
|
||||||
ms.onPeerUpdateDoneCnExist = true
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in a new issue