volume servers always connect to the master leader

This commit is contained in:
Chris Lu 2017-01-13 10:20:40 -08:00
parent d953ed442c
commit 3065506b38
4 changed files with 25 additions and 38 deletions

View file

@ -13,20 +13,20 @@ type ClusterStatusResult struct {
Peers []string `json:"Peers,omitempty"` Peers []string `json:"Peers,omitempty"`
} }
func ListMasters(server string) ([]string, error) { func ListMasters(server string) (leader string, peers []string, err error) {
jsonBlob, err := util.Get("http://" + server + "/cluster/status") jsonBlob, err := util.Get("http://" + server + "/cluster/status")
glog.V(2).Info("list masters result :", string(jsonBlob)) glog.V(2).Info("list masters result :", string(jsonBlob))
if err != nil { if err != nil {
return nil, err return "", nil, err
} }
var ret ClusterStatusResult var ret ClusterStatusResult
err = json.Unmarshal(jsonBlob, &ret) err = json.Unmarshal(jsonBlob, &ret)
if err != nil { if err != nil {
return nil, err return "", nil, err
} }
masters := ret.Peers peers = ret.Peers
if ret.IsLeader { if ret.IsLeader {
masters = append(masters, ret.Leader) peers = append(peers, ret.Leader)
} }
return masters, nil return ret.Leader, peers, nil
} }

View file

@ -117,17 +117,6 @@ func NewFilerServer(r *http.ServeMux, ip string, port int, master string, dir st
fs.masterNodes = storage.NewMasterNodes(fs.master) fs.masterNodes = storage.NewMasterNodes(fs.master)
glog.V(0).Infof("Filer server bootstraps with master %s", fs.getMasterNode()) glog.V(0).Infof("Filer server bootstraps with master %s", fs.getMasterNode())
//force initialize with all available master nodes
for {
_, err := fs.masterNodes.FindMaster()
if err != nil {
glog.Infof("filer server failed to get master cluster info:%s", err.Error())
time.Sleep(3 * time.Second)
} else {
break
}
}
for { for {
glog.V(4).Infof("Filer server sending to master %s", fs.getMasterNode()) glog.V(4).Infof("Filer server sending to master %s", fs.getMasterNode())
master, err := fs.detectHealthyMaster(fs.getMasterNode()) master, err := fs.detectHealthyMaster(fs.getMasterNode())

View file

@ -23,13 +23,14 @@ func (vs *VolumeServer) heartbeat() {
err := vs.doHeartbeat(time.Duration(vs.pulseSeconds) * time.Second) err := vs.doHeartbeat(time.Duration(vs.pulseSeconds) * time.Second)
if err != nil { if err != nil {
glog.V(0).Infof("heartbeat error: %v", err) glog.V(0).Infof("heartbeat error: %v", err)
time.Sleep(time.Duration(3*vs.pulseSeconds) * time.Second) time.Sleep(time.Duration(vs.pulseSeconds) * time.Second)
} }
} }
} }
func (vs *VolumeServer) doHeartbeat(sleepInterval time.Duration) error { func (vs *VolumeServer) doHeartbeat(sleepInterval time.Duration) error {
vs.masterNodes.Reset()
masterNode, err := vs.masterNodes.FindMaster() masterNode, err := vs.masterNodes.FindMaster()
if err != nil { if err != nil {
return fmt.Errorf("No master found: %v", err) return fmt.Errorf("No master found: %v", err)

View file

@ -3,7 +3,6 @@ package storage
import ( import (
"errors" "errors"
"fmt" "fmt"
"math/rand"
"strconv" "strconv"
"strings" "strings"
@ -18,48 +17,46 @@ const (
type MasterNodes struct { type MasterNodes struct {
nodes []string nodes []string
lastNode int leader string
} }
func (mn *MasterNodes) String() string { func (mn *MasterNodes) String() string {
return fmt.Sprintf("nodes:%v, lastNode:%d", mn.nodes, mn.lastNode) return fmt.Sprintf("nodes:%v, leader:%s", mn.nodes, mn.leader)
} }
func NewMasterNodes(bootstrapNode string) (mn *MasterNodes) { func NewMasterNodes(bootstrapNode string) (mn *MasterNodes) {
mn = &MasterNodes{nodes: []string{bootstrapNode}, lastNode: -1} mn = &MasterNodes{nodes: []string{bootstrapNode}, leader: ""}
return return
} }
func (mn *MasterNodes) Reset() { func (mn *MasterNodes) Reset() {
glog.V(4).Infof("Resetting master nodes: %v", mn) if mn.leader != "" {
if len(mn.nodes) > 1 && mn.lastNode >= 0 { mn.leader = ""
glog.V(0).Infof("Reset master %s from: %v", mn.nodes[mn.lastNode], mn.nodes) glog.V(0).Infof("Resetting master nodes: %v", mn)
mn.lastNode = -mn.lastNode - 1
} }
} }
func (mn *MasterNodes) FindMaster() (string, error) { func (mn *MasterNodes) FindMaster() (leader string, err error) {
if len(mn.nodes) == 0 { if len(mn.nodes) == 0 {
return "", errors.New("No master node found!") return "", errors.New("No master node found!")
} }
if mn.lastNode < 0 { if mn.leader == "" {
for _, m := range mn.nodes { for _, m := range mn.nodes {
glog.V(4).Infof("Listing masters on %s", m) glog.V(4).Infof("Listing masters on %s", m)
if masters, e := operation.ListMasters(m); e == nil { if leader, masters, e := operation.ListMasters(m); e == nil {
if len(masters) == 0 { if leader != "" {
continue
}
mn.nodes = append(masters, m) mn.nodes = append(masters, m)
mn.lastNode = rand.Intn(len(mn.nodes)) mn.leader = leader
glog.V(2).Infof("current master nodes is %v", mn) glog.V(2).Infof("current master nodes is %v", mn)
break break
}
} else { } else {
glog.V(4).Infof("Failed listing masters on %s: %v", m, e) glog.V(4).Infof("Failed listing masters on %s: %v", m, e)
} }
} }
} }
if mn.lastNode < 0 { if mn.leader == "" {
return "", errors.New("No master node available!") return "", errors.New("No master node available!")
} }
return mn.nodes[mn.lastNode], nil return mn.leader, nil
} }
/* /*