| | |
| | | * See the License for the specific language governing permissions and |
| | | * limitations under the License. |
| | | */ |
| | | package serf |
| | | package syncdb |
| | | |
| | | import ( |
| | | "context" |
| | | "encoding/json" |
| | | "errors" |
| | | "fmt" |
| | | "github.com/hashicorp/memberlist" |
| | | "net" |
| | | "strconv" |
| | | |
| | | "time" |
| | | |
| | | "github.com/apache/servicecomb-service-center/pkg/log" |
| | | "github.com/hashicorp/serf/cmd/serf/command/agent" |
| | | "github.com/hashicorp/serf/serf" |
| | | "basic.com/valib/serf.git/cmd/serf/command/agent" |
| | | "basic.com/valib/serf.git/serf" |
| | | //"github.com/apache/servicecomb-service-center/pkg/log" |
| | | "basic.com/valib/logger.git" |
| | | ) |
| | | |
| | | // Agent warps the serf agent |
| | | type Agent struct { |
| | | *agent.Agent |
| | | conf *Config |
| | | readyCh chan struct{} |
| | | errorCh chan error |
| | | conf *Config |
| | | readyCh chan struct{} |
| | | errorCh chan error |
| | | handleEv HandleEventFunc |
| | | } |
| | | |
| | | //用户自定义事件处理 |
| | | type HandleEventFunc func(event serf.Event) |
| | | |
| | | type NodeInfo struct { |
| | | ClusterID string `json:"clusterID"` |
| | | NodeID string `json:"nodeID"` |
| | | NodeAddress string `json:"nodeAddress"` |
| | | IsAlive int `json:"isAlive"` |
| | | } |
| | | |
| | | // Create create serf agent with config |
| | | func Create(conf *Config) (*Agent, error) { |
| | | func Create(conf *Config, snapshotPath string) (*Agent, error) { |
| | | // config cover to serf config |
| | | serfConf, err := conf.convertToSerf() |
| | | serfConf, err := conf.convertToSerf(snapshotPath) |
| | | if err != nil { |
| | | return nil, err |
| | | } |
| | | |
| | | // create serf agent with serf config |
| | | serfAgent, err := agent.Create(conf.Config, serfConf, nil) |
| | | logger.Info("conf.Config.EncryptKey:", conf.EncryptKey) |
| | | serfAgent, err := agent.Create(conf.Config, serfConf, logger.GetLogFile()) |
| | | if err != nil { |
| | | return nil, err |
| | | } |
| | | // Create the keyring |
| | | keyring, err := memberlist.NewKeyring(nil, []byte(conf.EncryptKey)) |
| | | if err != nil { |
| | | logger.Error("Failed to restore keyring: %s", err) |
| | | return nil, err |
| | | } |
| | | serfConf.MemberlistConfig.Keyring = keyring |
| | | |
| | | logger.Info("[INFO] agent: Restored keyring with %d keys from %s", |
| | | len(conf.EncryptKey), conf.EncryptKey) |
| | | |
| | | return &Agent{ |
| | | Agent: serfAgent, |
| | | conf: conf, |
| | |
| | | }, nil |
| | | } |
| | | |
| | | func (a *Agent) RegisterHandleEventFunc(f HandleEventFunc) { |
| | | if f != nil { |
| | | a.handleEv = f |
| | | } |
| | | } |
| | | |
| | | // Start agent |
| | | func (a *Agent) Start(ctx context.Context) { |
| | | err := a.Agent.Start() |
| | | if err != nil { |
| | | log.Errorf(err, "start serf agent failed") |
| | | logger.Error(err, "start serf agent failed") |
| | | a.errorCh <- err |
| | | return |
| | | } |
| | |
| | | |
| | | err = a.retryJoin(ctx) |
| | | if err != nil { |
| | | log.Errorf(err, "start serf agent failed") |
| | | logger.Error(err, "start serf agent failed") |
| | | if err != ctx.Err() && a.errorCh != nil { |
| | | a.errorCh <- err |
| | | } |
| | | } |
| | | |
| | | go a.BroadcastMemberlist(BroadcastInterval * time.Second) |
| | | } |
| | | |
| | | // HandleEvent Handles serf.EventMemberJoin events, |
| | |
| | | // when the startup mode is "ModeCluster", |
| | | // used for logical grouping of serf nodes |
| | | func (a *Agent) HandleEvent(event serf.Event) { |
| | | if event.EventType() != serf.EventMemberJoin { |
| | | return |
| | | if a.handleEv != nil { |
| | | a.handleEv(event) |
| | | } |
| | | } |
| | | |
| | | if a.conf.Mode == ModeCluster { |
| | | if len(a.GroupMembers(a.conf.ClusterName)) < groupExpect { |
| | | return |
| | | } |
| | | |
| | | func (a *Agent) BroadcastMemberlist(delay time.Duration) { |
| | | //serf := a.serf |
| | | serf := a.Agent.Serf() |
| | | mb := serf.LocalMember() |
| | | mblist := serf.Memberlist() |
| | | logger.Info("mb:", mb) |
| | | |
| | | // copy local node |
| | | localNode := *mblist.LocalNode() |
| | | nodeID := a.conf.NodeName |
| | | nodeAddress := localNode.Address() |
| | | clusterID := mb.Tags[tagKeyClusterID] |
| | | isAlive := int(mb.Status) |
| | | |
| | | message, _ := json.Marshal(NodeInfo{ |
| | | clusterID, |
| | | nodeID, |
| | | nodeAddress, |
| | | isAlive, |
| | | }) |
| | | |
| | | // replace node address |
| | | localNode.Addr = net.ParseIP(BroadcastIP) |
| | | //localNode.Addr = net.IPv4(255,255,255,255) |
| | | localNode.Port = BroadcastPort |
| | | for { |
| | | // logger.Info("localNode: %v %v\n", nodeName, nodeAddress) |
| | | mblist.SendBestEffort(&localNode, []byte(message)) |
| | | time.Sleep(delay) |
| | | } |
| | | a.DeregisterEventHandler(a) |
| | | close(a.readyCh) |
| | | } |
| | | |
| | | // Ready Returns a channel that will be closed when serf is ready |
| | |
| | | // Stop serf agent |
| | | func (a *Agent) Stop() { |
| | | if a.errorCh != nil { |
| | | a.Leave() |
| | | a.Shutdown() |
| | | logger.Info("a.Shutdown()", a.Leave()) |
| | | logger.Info("a.Shutdown()", a.Shutdown()) |
| | | close(a.errorCh) |
| | | a.errorCh = nil |
| | | } |
| | |
| | | return nil |
| | | } |
| | | |
| | | // GroupMembers returns a point-in-time snapshot of the members of by groupName |
| | | func (a *Agent) GroupMembers(groupName string) (members []serf.Member) { |
| | | // GroupMembers returns a point-in-time snapshot of the members of by clusterID |
| | | func (a *Agent) GroupMembers(clusterID string) (members []serf.Member) { |
| | | serfAgent := a.Agent.Serf() |
| | | if serfAgent != nil { |
| | | for _, member := range serfAgent.Members() { |
| | | log.Debugf("member = %s, groupName = %s", member.Name, member.Tags[tagKeyClusterName]) |
| | | if member.Tags[tagKeyClusterName] == groupName { |
| | | logger.Info("member = %s, clusterID = %s", member.Name, member.Tags[tagKeyClusterID]) |
| | | if member.Tags[tagKeyClusterID] == clusterID { |
| | | members = append(members, member) |
| | | } |
| | | } |
| | |
| | | |
| | | func (a *Agent) retryJoin(ctx context.Context) (err error) { |
| | | if len(a.conf.RetryJoin) == 0 { |
| | | log.Infof("retry join mumber %d", len(a.conf.RetryJoin)) |
| | | logger.Error("retry join mumber %d", len(a.conf.RetryJoin)) |
| | | return nil |
| | | } |
| | | |
| | |
| | | attempt := 0 |
| | | ticker := time.NewTicker(a.conf.RetryInterval) |
| | | for { |
| | | log.Infof("serf: Joining cluster...(replay: %v)", a.conf.ReplayOnJoin) |
| | | logger.Info("serf: Joining cluster...(replay: %v)", a.conf.ReplayOnJoin) |
| | | var n int |
| | | |
| | | // Try to join the specified serf nodes |
| | | n, err = a.Join(a.conf.RetryJoin, a.conf.ReplayOnJoin) |
| | | if err == nil { |
| | | log.Infof("serf: Join completed. Synced with %d initial agents", n) |
| | | logger.Error("serf: Join completed. Synced with %d initial agents", n) |
| | | break |
| | | } |
| | | attempt++ |
| | |
| | | // else agent will try to join other nodes until successful always |
| | | if a.conf.RetryMaxAttempts > 0 && attempt > a.conf.RetryMaxAttempts { |
| | | err = errors.New("serf: maximum retry join attempts made, exiting") |
| | | log.Errorf(err, err.Error()) |
| | | logger.Error(err, err.Error()) |
| | | break |
| | | } |
| | | select { |
| | |
| | | ticker.Stop() |
| | | return |
| | | } |
| | | |
| | | //Init serf Init |
| | | func Init(clusterID string, password string, nodeID string, addrs []string, snapshotPath string, hef HandleEventFunc) (*Agent, error) { |
| | | agent, err := InitNode(clusterID, password, nodeID, snapshotPath, hef) |
| | | if err != nil { |
| | | logger.Error("InitNode failed, error: %s", err) |
| | | return agent, err |
| | | } |
| | | |
| | | err = agent.JoinByNodeAddrs(addrs) |
| | | if err != nil { |
| | | logger.Error("JoinByNodeIP failed, error: %s", err) |
| | | return agent, err |
| | | } |
| | | |
| | | return agent, err |
| | | } |
| | | |
| | | //InitNode web后台收到创建集群的请求, |
| | | func InitNode(clusterID string, password string, nodeID string, snapshotPath string, hef HandleEventFunc) (*Agent, error) { |
| | | conf := DefaultConfig() |
| | | logger.Info("clusterID:", clusterID, "password:", password, "nodeID:", nodeID) |
| | | conf.ClusterID = clusterID |
| | | conf.NodeName = nodeID |
| | | if password == "" { |
| | | conf.EncryptKey = DefaultEncryptKey |
| | | } else { |
| | | if len(password) >= 16 { |
| | | password = password[:16] |
| | | } else { |
| | | password = fmt.Sprintf("%016s", password)[:16] |
| | | //return nil, fmt.Errorf("error password") |
| | | } |
| | | conf.EncryptKey = password |
| | | } |
| | | agent, err := Create(conf, snapshotPath) |
| | | if err != nil { |
| | | logger.Error("create agent failed, error: %s", err) |
| | | return agent, err |
| | | } |
| | | |
| | | agent.Start(context.Background()) |
| | | //<- agent.readyCh |
| | | go func() { |
| | | agent.ShutdownCh() |
| | | }() |
| | | time.Sleep(time.Second) |
| | | logger.Info("Stats:", agent.Agent.Serf().Stats()) |
| | | logger.Info("EncryptionEnabled:", agent.Agent.Serf().EncryptionEnabled()) |
| | | logger.Info("create agent sucess!!") |
| | | |
| | | return agent, nil |
| | | } |
| | | |
| | | func (a *Agent) JoinByNodeAddrs(addrs []string) error { |
| | | var nodes []string |
| | | |
| | | if len(addrs) == 0 { |
| | | return fmt.Errorf("No Nodes To Join!") |
| | | } |
| | | for _, addr := range addrs { |
| | | nodes = append(nodes, addr) |
| | | } |
| | | |
| | | a.Agent.Join(nodes, true) |
| | | |
| | | return nil |
| | | } |
| | | |
| | | //func (a *Agent) JoinByNodeIP(ips []string) error { |
| | | // var nodes []string |
| | | // |
| | | // if len(ips) == 0 { |
| | | // return fmt.Errorf("No Nodes To Join!") |
| | | // } |
| | | // for _, ip := range ips { |
| | | // node := fmt.Sprintf("%s:%d", ip, DefaultBindPort) |
| | | // nodes = append(nodes, node) |
| | | // } |
| | | // |
| | | // n, err := a.Agent.Join(nodes, true) |
| | | // if err != nil || n == 0 { |
| | | // return fmt.Errorf("Error Encrypt Key!") |
| | | // } |
| | | // |
| | | // return err |
| | | //} |
| | | |
| | | func (a *Agent) GetNodes() (nodes []NodeInfo) { |
| | | var node NodeInfo |
| | | logger.Info("a.conf.ClusterID:", a.conf.ClusterID) |
| | | mbs := a.GroupMembers(a.conf.ClusterID) |
| | | for _, mb := range mbs { |
| | | node.NodeID = mb.Name |
| | | node.NodeAddress = mb.Addr.String() + ":" + strconv.Itoa(int(mb.Port)) |
| | | node.IsAlive = int(mb.Status) |
| | | node.ClusterID = mb.Tags[tagKeyClusterID] |
| | | |
| | | nodes = append(nodes, node) |
| | | } |
| | | |
| | | return nodes |
| | | } |