123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199 |
- package weed_server
- import (
- "encoding/json"
- "io"
- "math/rand/v2"
- "os"
- "path"
- "time"
- transport "github.com/Jille/raft-grpc-transport"
- "google.golang.org/grpc"
- "github.com/seaweedfs/seaweedfs/weed/pb"
- hashicorpRaft "github.com/hashicorp/raft"
- "github.com/seaweedfs/raft"
- "github.com/seaweedfs/seaweedfs/weed/glog"
- "github.com/seaweedfs/seaweedfs/weed/topology"
- )
- type RaftServerOption struct {
- GrpcDialOption grpc.DialOption
- Peers map[string]pb.ServerAddress
- ServerAddr pb.ServerAddress
- DataDir string
- Topo *topology.Topology
- RaftResumeState bool
- HeartbeatInterval time.Duration
- ElectionTimeout time.Duration
- RaftBootstrap bool
- }
- type RaftServer struct {
- peers map[string]pb.ServerAddress // initial peers to join with
- raftServer raft.Server
- RaftHashicorp *hashicorpRaft.Raft
- TransportManager *transport.Manager
- dataDir string
- serverAddr pb.ServerAddress
- topo *topology.Topology
- *raft.GrpcServer
- }
- type StateMachine struct {
- raft.StateMachine
- topo *topology.Topology
- }
- var _ hashicorpRaft.FSM = &StateMachine{}
- func (s StateMachine) Save() ([]byte, error) {
- state := topology.MaxVolumeIdCommand{
- MaxVolumeId: s.topo.GetMaxVolumeId(),
- }
- glog.V(1).Infof("Save raft state %+v", state)
- return json.Marshal(state)
- }
- func (s StateMachine) Recovery(data []byte) error {
- state := topology.MaxVolumeIdCommand{}
- err := json.Unmarshal(data, &state)
- if err != nil {
- return err
- }
- glog.V(1).Infof("Recovery raft state %+v", state)
- s.topo.UpAdjustMaxVolumeId(state.MaxVolumeId)
- return nil
- }
- func (s *StateMachine) Apply(l *hashicorpRaft.Log) interface{} {
- before := s.topo.GetMaxVolumeId()
- state := topology.MaxVolumeIdCommand{}
- err := json.Unmarshal(l.Data, &state)
- if err != nil {
- return err
- }
- s.topo.UpAdjustMaxVolumeId(state.MaxVolumeId)
- glog.V(1).Infoln("max volume id", before, "==>", s.topo.GetMaxVolumeId())
- return nil
- }
- func (s *StateMachine) Snapshot() (hashicorpRaft.FSMSnapshot, error) {
- return &topology.MaxVolumeIdCommand{
- MaxVolumeId: s.topo.GetMaxVolumeId(),
- }, nil
- }
- func (s *StateMachine) Restore(r io.ReadCloser) error {
- b, err := io.ReadAll(r)
- if err != nil {
- return err
- }
- if err := s.Recovery(b); err != nil {
- return err
- }
- return nil
- }
- func NewRaftServer(option *RaftServerOption) (*RaftServer, error) {
- s := &RaftServer{
- peers: option.Peers,
- serverAddr: option.ServerAddr,
- dataDir: option.DataDir,
- topo: option.Topo,
- }
- if glog.V(4) {
- raft.SetLogLevel(2)
- }
- raft.RegisterCommand(&topology.MaxVolumeIdCommand{})
- var err error
- transporter := raft.NewGrpcTransporter(option.GrpcDialOption)
- glog.V(0).Infof("Starting RaftServer with %v", option.ServerAddr)
- // always clear previous log to avoid server is promotable
- os.RemoveAll(path.Join(s.dataDir, "log"))
- if !option.RaftResumeState {
- // always clear previous metadata
- os.RemoveAll(path.Join(s.dataDir, "conf"))
- os.RemoveAll(path.Join(s.dataDir, "snapshot"))
- }
- if err := os.MkdirAll(path.Join(s.dataDir, "snapshot"), os.ModePerm); err != nil {
- return nil, err
- }
- stateMachine := StateMachine{topo: option.Topo}
- s.raftServer, err = raft.NewServer(string(s.serverAddr), s.dataDir, transporter, stateMachine, option.Topo, s.serverAddr.ToGrpcAddress())
- if err != nil {
- glog.V(0).Infoln(err)
- return nil, err
- }
- heartbeatInterval := time.Duration(float64(option.HeartbeatInterval) * (rand.Float64()*0.25 + 1))
- s.raftServer.SetHeartbeatInterval(heartbeatInterval)
- s.raftServer.SetElectionTimeout(option.ElectionTimeout)
- if err := s.raftServer.LoadSnapshot(); err != nil {
- return nil, err
- }
- if err := s.raftServer.Start(); err != nil {
- return nil, err
- }
- for name, peer := range s.peers {
- if err := s.raftServer.AddPeer(name, peer.ToGrpcAddress()); err != nil {
- return nil, err
- }
- }
- // Remove deleted peers
- for existsPeerName := range s.raftServer.Peers() {
- if existingPeer, found := s.peers[existsPeerName]; !found {
- if err := s.raftServer.RemovePeer(existsPeerName); err != nil {
- glog.V(0).Infoln(err)
- return nil, err
- } else {
- glog.V(0).Infof("removing old peer: %s", existingPeer)
- }
- }
- }
- s.GrpcServer = raft.NewGrpcServer(s.raftServer)
- glog.V(0).Infof("current cluster leader: %v", s.raftServer.Leader())
- return s, nil
- }
- func (s *RaftServer) Peers() (members []string) {
- if s.raftServer != nil {
- peers := s.raftServer.Peers()
- for _, p := range peers {
- members = append(members, p.Name)
- }
- } else if s.RaftHashicorp != nil {
- cfg := s.RaftHashicorp.GetConfiguration()
- for _, p := range cfg.Configuration().Servers {
- members = append(members, string(p.ID))
- }
- }
- return
- }
- func (s *RaftServer) DoJoinCommand() {
- glog.V(0).Infoln("Initializing new cluster")
- if _, err := s.raftServer.Do(&raft.DefaultJoinCommand{
- Name: s.raftServer.Name(),
- ConnectionString: s.serverAddr.ToGrpcAddress(),
- }); err != nil {
- glog.Errorf("fail to send join command: %v", err)
- }
- }
|