123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417 |
- package weed_server
- import (
- "context"
- "fmt"
- "net/http"
- "net/http/httputil"
- "net/url"
- "os"
- "regexp"
- "strings"
- "sync"
- "time"
- "github.com/seaweedfs/seaweedfs/weed/stats"
- "github.com/seaweedfs/seaweedfs/weed/cluster"
- "github.com/seaweedfs/seaweedfs/weed/pb"
- "github.com/gorilla/mux"
- hashicorpRaft "github.com/hashicorp/raft"
- "github.com/seaweedfs/raft"
- "google.golang.org/grpc"
- "github.com/seaweedfs/seaweedfs/weed/glog"
- "github.com/seaweedfs/seaweedfs/weed/pb/master_pb"
- "github.com/seaweedfs/seaweedfs/weed/security"
- "github.com/seaweedfs/seaweedfs/weed/sequence"
- "github.com/seaweedfs/seaweedfs/weed/shell"
- "github.com/seaweedfs/seaweedfs/weed/topology"
- "github.com/seaweedfs/seaweedfs/weed/util"
- "github.com/seaweedfs/seaweedfs/weed/wdclient"
- )
// SequencerType is the configuration key whose value selects the sequencer
// implementation built by createSequencer.
const SequencerType = "master.sequencer.type"

// SequencerSnowflakeId is the configuration key holding the integer id that is
// handed to sequence.NewSnowflakeSequencer when the snowflake sequencer is
// selected.
const SequencerSnowflakeId = "master.sequencer.sequencer_snowflake_id"
- type MasterOption struct {
- Master pb.ServerAddress
- MetaFolder string
- VolumeSizeLimitMB uint32
- VolumePreallocate bool
- // PulseSeconds int
- DefaultReplicaPlacement string
- GarbageThreshold float64
- WhiteList []string
- DisableHttp bool
- MetricsAddress string
- MetricsIntervalSec int
- IsFollower bool
- }
- type MasterServer struct {
- master_pb.UnimplementedSeaweedServer
- option *MasterOption
- guard *security.Guard
- preallocateSize int64
- Topo *topology.Topology
- vg *topology.VolumeGrowth
- volumeGrowthRequestChan chan *topology.VolumeGrowRequest
- boundedLeaderChan chan int
- // notifying clients
- clientChansLock sync.RWMutex
- clientChans map[string]chan *master_pb.KeepConnectedResponse
- grpcDialOption grpc.DialOption
- MasterClient *wdclient.MasterClient
- adminLocks *AdminLocks
- Cluster *cluster.Cluster
- }
- func NewMasterServer(r *mux.Router, option *MasterOption, peers map[string]pb.ServerAddress) *MasterServer {
- v := util.GetViper()
- signingKey := v.GetString("jwt.signing.key")
- v.SetDefault("jwt.signing.expires_after_seconds", 10)
- expiresAfterSec := v.GetInt("jwt.signing.expires_after_seconds")
- readSigningKey := v.GetString("jwt.signing.read.key")
- v.SetDefault("jwt.signing.read.expires_after_seconds", 60)
- readExpiresAfterSec := v.GetInt("jwt.signing.read.expires_after_seconds")
- v.SetDefault("master.replication.treat_replication_as_minimums", false)
- replicationAsMin := v.GetBool("master.replication.treat_replication_as_minimums")
- v.SetDefault("master.volume_growth.copy_1", 7)
- v.SetDefault("master.volume_growth.copy_2", 6)
- v.SetDefault("master.volume_growth.copy_3", 3)
- v.SetDefault("master.volume_growth.copy_other", 1)
- v.SetDefault("master.volume_growth.threshold", 0.9)
- topology.VolumeGrowStrategy.Copy1Count = v.GetInt("master.volume_growth.copy_1")
- topology.VolumeGrowStrategy.Copy2Count = v.GetInt("master.volume_growth.copy_2")
- topology.VolumeGrowStrategy.Copy3Count = v.GetInt("master.volume_growth.copy_3")
- topology.VolumeGrowStrategy.CopyOtherCount = v.GetInt("master.volume_growth.copy_other")
- topology.VolumeGrowStrategy.Threshold = v.GetFloat64("master.volume_growth.threshold")
- var preallocateSize int64
- if option.VolumePreallocate {
- preallocateSize = int64(option.VolumeSizeLimitMB) * (1 << 20)
- }
- grpcDialOption := security.LoadClientTLS(v, "grpc.master")
- ms := &MasterServer{
- option: option,
- preallocateSize: preallocateSize,
- volumeGrowthRequestChan: make(chan *topology.VolumeGrowRequest, 1<<6),
- clientChans: make(map[string]chan *master_pb.KeepConnectedResponse),
- grpcDialOption: grpcDialOption,
- MasterClient: wdclient.NewMasterClient(grpcDialOption, "", cluster.MasterType, option.Master, "", "", *pb.NewServiceDiscoveryFromMap(peers)),
- adminLocks: NewAdminLocks(),
- Cluster: cluster.NewCluster(),
- }
- ms.boundedLeaderChan = make(chan int, 16)
- ms.MasterClient.SetOnPeerUpdateFn(ms.OnPeerUpdate)
- seq := ms.createSequencer(option)
- if nil == seq {
- glog.Fatalf("create sequencer failed.")
- }
- ms.Topo = topology.NewTopology("topo", seq, uint64(ms.option.VolumeSizeLimitMB)*1024*1024, 5, replicationAsMin)
- ms.vg = topology.NewDefaultVolumeGrowth()
- glog.V(0).Infoln("Volume Size Limit is", ms.option.VolumeSizeLimitMB, "MB")
- ms.guard = security.NewGuard(ms.option.WhiteList, signingKey, expiresAfterSec, readSigningKey, readExpiresAfterSec)
- handleStaticResources2(r)
- r.HandleFunc("/", ms.proxyToLeader(ms.uiStatusHandler))
- r.HandleFunc("/ui/index.html", ms.uiStatusHandler)
- if !ms.option.DisableHttp {
- r.HandleFunc("/dir/assign", ms.proxyToLeader(ms.guard.WhiteList(ms.dirAssignHandler)))
- r.HandleFunc("/dir/lookup", ms.guard.WhiteList(ms.dirLookupHandler))
- r.HandleFunc("/dir/status", ms.proxyToLeader(ms.guard.WhiteList(ms.dirStatusHandler)))
- r.HandleFunc("/col/delete", ms.proxyToLeader(ms.guard.WhiteList(ms.collectionDeleteHandler)))
- r.HandleFunc("/vol/grow", ms.proxyToLeader(ms.guard.WhiteList(ms.volumeGrowHandler)))
- r.HandleFunc("/vol/status", ms.proxyToLeader(ms.guard.WhiteList(ms.volumeStatusHandler)))
- r.HandleFunc("/vol/vacuum", ms.proxyToLeader(ms.guard.WhiteList(ms.volumeVacuumHandler)))
- r.HandleFunc("/submit", ms.guard.WhiteList(ms.submitFromMasterServerHandler))
- /*
- r.HandleFunc("/stats/health", ms.guard.WhiteList(statsHealthHandler))
- r.HandleFunc("/stats/counter", ms.guard.WhiteList(statsCounterHandler))
- r.HandleFunc("/stats/memory", ms.guard.WhiteList(statsMemoryHandler))
- */
- r.HandleFunc("/{fileId}", ms.redirectHandler)
- }
- ms.Topo.StartRefreshWritableVolumes(
- ms.grpcDialOption,
- ms.option.GarbageThreshold,
- topology.VolumeGrowStrategy.Threshold,
- ms.preallocateSize,
- )
- ms.ProcessGrowRequest()
- if !option.IsFollower {
- ms.startAdminScripts()
- }
- return ms
- }
- func (ms *MasterServer) SetRaftServer(raftServer *RaftServer) {
- var raftServerName string
- ms.Topo.RaftServerAccessLock.Lock()
- if raftServer.raftServer != nil {
- ms.Topo.RaftServer = raftServer.raftServer
- ms.Topo.RaftServer.AddEventListener(raft.LeaderChangeEventType, func(e raft.Event) {
- glog.V(0).Infof("leader change event: %+v => %+v", e.PrevValue(), e.Value())
- stats.MasterLeaderChangeCounter.WithLabelValues(fmt.Sprintf("%+v", e.Value())).Inc()
- if ms.Topo.RaftServer.Leader() != "" {
- glog.V(0).Infof("[%s] %s becomes leader.", ms.Topo.RaftServer.Name(), ms.Topo.RaftServer.Leader())
- }
- })
- raftServerName = fmt.Sprintf("[%s]", ms.Topo.RaftServer.Name())
- } else if raftServer.RaftHashicorp != nil {
- ms.Topo.HashicorpRaft = raftServer.RaftHashicorp
- leaderCh := raftServer.RaftHashicorp.LeaderCh()
- prevLeader, _ := ms.Topo.HashicorpRaft.LeaderWithID()
- raftServerName = ms.Topo.HashicorpRaft.String()
- go func() {
- for {
- select {
- case isLeader := <-leaderCh:
- ms.Topo.RaftServerAccessLock.RLock()
- leader, _ := ms.Topo.HashicorpRaft.LeaderWithID()
- ms.Topo.RaftServerAccessLock.RUnlock()
- glog.V(0).Infof("is leader %+v change event: %+v => %+v", isLeader, prevLeader, leader)
- stats.MasterLeaderChangeCounter.WithLabelValues(fmt.Sprintf("%+v", leader)).Inc()
- prevLeader = leader
- }
- }
- }()
- }
- ms.Topo.RaftServerAccessLock.Unlock()
- if ms.Topo.IsLeader() {
- glog.V(0).Infof("%s I am the leader!", raftServerName)
- } else {
- var raftServerLeader string
- ms.Topo.RaftServerAccessLock.RLock()
- if ms.Topo.RaftServer != nil {
- raftServerLeader = ms.Topo.RaftServer.Leader()
- } else if ms.Topo.HashicorpRaft != nil {
- raftServerName = ms.Topo.HashicorpRaft.String()
- raftServerLeaderAddr, _ := ms.Topo.HashicorpRaft.LeaderWithID()
- raftServerLeader = string(raftServerLeaderAddr)
- }
- ms.Topo.RaftServerAccessLock.RUnlock()
- glog.V(0).Infof("%s %s - is the leader.", raftServerName, raftServerLeader)
- }
- }
- func (ms *MasterServer) proxyToLeader(f http.HandlerFunc) http.HandlerFunc {
- return func(w http.ResponseWriter, r *http.Request) {
- if ms.Topo.IsLeader() {
- f(w, r)
- return
- }
- // get the current raft leader
- leaderAddr, _ := ms.Topo.MaybeLeader()
- raftServerLeader := leaderAddr.ToHttpAddress()
- if raftServerLeader == "" {
- f(w, r)
- return
- }
- ms.boundedLeaderChan <- 1
- defer func() { <-ms.boundedLeaderChan }()
- targetUrl, err := url.Parse("http://" + raftServerLeader)
- if err != nil {
- writeJsonError(w, r, http.StatusInternalServerError,
- fmt.Errorf("Leader URL http://%s Parse Error: %v", raftServerLeader, err))
- return
- }
- // proxy to leader
- glog.V(4).Infoln("proxying to leader", raftServerLeader)
- proxy := httputil.NewSingleHostReverseProxy(targetUrl)
- director := proxy.Director
- proxy.Director = func(req *http.Request) {
- actualHost, err := security.GetActualRemoteHost(req)
- if err == nil {
- req.Header.Set("HTTP_X_FORWARDED_FOR", actualHost)
- }
- director(req)
- }
- proxy.Transport = util.Transport
- proxy.ServeHTTP(w, r)
- }
- }
- func (ms *MasterServer) startAdminScripts() {
- v := util.GetViper()
- adminScripts := v.GetString("master.maintenance.scripts")
- if adminScripts == "" {
- return
- }
- glog.V(0).Infof("adminScripts: %v", adminScripts)
- v.SetDefault("master.maintenance.sleep_minutes", 17)
- sleepMinutes := v.GetInt("master.maintenance.sleep_minutes")
- scriptLines := strings.Split(adminScripts, "\n")
- if !strings.Contains(adminScripts, "lock") {
- scriptLines = append(append([]string{}, "lock"), scriptLines...)
- scriptLines = append(scriptLines, "unlock")
- }
- masterAddress := string(ms.option.Master)
- var shellOptions shell.ShellOptions
- shellOptions.GrpcDialOption = security.LoadClientTLS(v, "grpc.master")
- shellOptions.Masters = &masterAddress
- shellOptions.Directory = "/"
- emptyFilerGroup := ""
- shellOptions.FilerGroup = &emptyFilerGroup
- commandEnv := shell.NewCommandEnv(&shellOptions)
- reg, _ := regexp.Compile(`'.*?'|".*?"|\S+`)
- go commandEnv.MasterClient.KeepConnectedToMaster(context.Background())
- go func() {
- for {
- time.Sleep(time.Duration(sleepMinutes) * time.Minute)
- if ms.Topo.IsLeader() && ms.MasterClient.GetMaster(context.Background()) != "" {
- shellOptions.FilerAddress = ms.GetOneFiler(cluster.FilerGroupName(*shellOptions.FilerGroup))
- if shellOptions.FilerAddress == "" {
- continue
- }
- for _, line := range scriptLines {
- for _, c := range strings.Split(line, ";") {
- processEachCmd(reg, c, commandEnv)
- }
- }
- }
- }
- }()
- }
- func processEachCmd(reg *regexp.Regexp, line string, commandEnv *shell.CommandEnv) {
- cmds := reg.FindAllString(line, -1)
- if len(cmds) == 0 {
- return
- }
- args := make([]string, len(cmds[1:]))
- for i := range args {
- args[i] = strings.Trim(string(cmds[1+i]), "\"'")
- }
- cmd := cmds[0]
- for _, c := range shell.Commands {
- if c.Name() == cmd {
- glog.V(0).Infof("executing: %s %v", cmd, args)
- if err := c.Do(args, commandEnv, os.Stdout); err != nil {
- glog.V(0).Infof("error: %v", err)
- }
- }
- }
- }
- func (ms *MasterServer) createSequencer(option *MasterOption) sequence.Sequencer {
- var seq sequence.Sequencer
- v := util.GetViper()
- seqType := strings.ToLower(v.GetString(SequencerType))
- glog.V(1).Infof("[%s] : [%s]", SequencerType, seqType)
- switch strings.ToLower(seqType) {
- case "snowflake":
- var err error
- snowflakeId := v.GetInt(SequencerSnowflakeId)
- seq, err = sequence.NewSnowflakeSequencer(string(option.Master), snowflakeId)
- if err != nil {
- glog.Error(err)
- seq = nil
- }
- case "raft":
- fallthrough
- default:
- seq = sequence.NewMemorySequencer()
- }
- return seq
- }
- func (ms *MasterServer) OnPeerUpdate(update *master_pb.ClusterNodeUpdate, startFrom time.Time) {
- ms.Topo.RaftServerAccessLock.RLock()
- defer ms.Topo.RaftServerAccessLock.RUnlock()
- if update.NodeType != cluster.MasterType || ms.Topo.HashicorpRaft == nil {
- return
- }
- glog.V(4).Infof("OnPeerUpdate: %+v", update)
- peerAddress := pb.ServerAddress(update.Address)
- peerName := string(peerAddress)
- if ms.Topo.HashicorpRaft.State() != hashicorpRaft.Leader {
- return
- }
- if update.IsAdd {
- raftServerFound := false
- for _, server := range ms.Topo.HashicorpRaft.GetConfiguration().Configuration().Servers {
- if string(server.ID) == peerName {
- raftServerFound = true
- }
- }
- if !raftServerFound {
- glog.V(0).Infof("adding new raft server: %s", peerName)
- ms.Topo.HashicorpRaft.AddVoter(
- hashicorpRaft.ServerID(peerName),
- hashicorpRaft.ServerAddress(peerAddress.ToGrpcAddress()), 0, 0)
- }
- } else {
- pb.WithMasterClient(false, peerAddress, ms.grpcDialOption, true, func(client master_pb.SeaweedClient) error {
- ctx, cancel := context.WithTimeout(context.TODO(), 15*time.Second)
- defer cancel()
- if _, err := client.Ping(ctx, &master_pb.PingRequest{Target: string(peerAddress), TargetType: cluster.MasterType}); err != nil {
- glog.V(0).Infof("master %s didn't respond to pings. remove raft server", peerName)
- if err := ms.MasterClient.WithClient(false, func(client master_pb.SeaweedClient) error {
- _, err := client.RaftRemoveServer(context.Background(), &master_pb.RaftRemoveServerRequest{
- Id: peerName,
- Force: false,
- })
- return err
- }); err != nil {
- glog.Warningf("failed removing old raft server: %v", err)
- return err
- }
- } else {
- glog.V(0).Infof("master %s successfully responded to ping", peerName)
- }
- return nil
- })
- }
- }
- func (ms *MasterServer) Shutdown() {
- if ms.Topo == nil || ms.Topo.HashicorpRaft == nil {
- return
- }
- if ms.Topo.HashicorpRaft.State() == hashicorpRaft.Leader {
- ms.Topo.HashicorpRaft.LeadershipTransfer()
- }
- ms.Topo.HashicorpRaft.Shutdown()
- }
|