123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326 |
- package wdclient
- import (
- "context"
- "fmt"
- "math/rand"
- "sync"
- "time"
- "github.com/seaweedfs/seaweedfs/weed/stats"
- "github.com/seaweedfs/seaweedfs/weed/util"
- "google.golang.org/grpc"
- "github.com/seaweedfs/seaweedfs/weed/glog"
- "github.com/seaweedfs/seaweedfs/weed/pb"
- "github.com/seaweedfs/seaweedfs/weed/pb/master_pb"
- )
- type MasterClient struct {
- FilerGroup string
- clientType string
- clientHost pb.ServerAddress
- rack string
- currentMaster pb.ServerAddress
- currentMasterLock sync.RWMutex
- masters map[string]pb.ServerAddress
- grpcDialOption grpc.DialOption
- *vidMap
- vidMapCacheSize int
- OnPeerUpdate func(update *master_pb.ClusterNodeUpdate, startFrom time.Time)
- OnPeerUpdateLock sync.RWMutex
- }
- func NewMasterClient(grpcDialOption grpc.DialOption, filerGroup string, clientType string, clientHost pb.ServerAddress, clientDataCenter string, rack string, masters map[string]pb.ServerAddress) *MasterClient {
- return &MasterClient{
- FilerGroup: filerGroup,
- clientType: clientType,
- clientHost: clientHost,
- rack: rack,
- masters: masters,
- grpcDialOption: grpcDialOption,
- vidMap: newVidMap(clientDataCenter),
- vidMapCacheSize: 5,
- }
- }
- func (mc *MasterClient) SetOnPeerUpdateFn(onPeerUpdate func(update *master_pb.ClusterNodeUpdate, startFrom time.Time)) {
- mc.OnPeerUpdateLock.Lock()
- mc.OnPeerUpdate = onPeerUpdate
- mc.OnPeerUpdateLock.Unlock()
- }
- func (mc *MasterClient) GetLookupFileIdFunction() LookupFileIdFunctionType {
- return mc.LookupFileIdWithFallback
- }
- func (mc *MasterClient) LookupFileIdWithFallback(fileId string) (fullUrls []string, err error) {
- fullUrls, err = mc.vidMap.LookupFileId(fileId)
- if err == nil && len(fullUrls) > 0 {
- return
- }
- err = pb.WithMasterClient(false, mc.GetMaster(), mc.grpcDialOption, false, func(client master_pb.SeaweedClient) error {
- resp, err := client.LookupVolume(context.Background(), &master_pb.LookupVolumeRequest{
- VolumeOrFileIds: []string{fileId},
- })
- if err != nil {
- return fmt.Errorf("LookupVolume %s failed: %v", fileId, err)
- }
- for vid, vidLocation := range resp.VolumeIdLocations {
- for _, vidLoc := range vidLocation.Locations {
- loc := Location{
- Url: vidLoc.Url,
- PublicUrl: vidLoc.PublicUrl,
- GrpcPort: int(vidLoc.GrpcPort),
- DataCenter: vidLoc.DataCenter,
- }
- mc.vidMap.addLocation(uint32(vid), loc)
- httpUrl := "http://" + loc.Url + "/" + fileId
- // Prefer same data center
- if mc.DataCenter != "" && mc.DataCenter == loc.DataCenter {
- fullUrls = append([]string{httpUrl}, fullUrls...)
- } else {
- fullUrls = append(fullUrls, httpUrl)
- }
- }
- }
- return nil
- })
- return
- }
- func (mc *MasterClient) getCurrentMaster() pb.ServerAddress {
- mc.currentMasterLock.RLock()
- defer mc.currentMasterLock.RUnlock()
- return mc.currentMaster
- }
- func (mc *MasterClient) setCurrentMaster(master pb.ServerAddress) {
- mc.currentMasterLock.Lock()
- mc.currentMaster = master
- mc.currentMasterLock.Unlock()
- }
- func (mc *MasterClient) GetMaster() pb.ServerAddress {
- mc.WaitUntilConnected()
- return mc.getCurrentMaster()
- }
- func (mc *MasterClient) GetMasters() map[string]pb.ServerAddress {
- mc.WaitUntilConnected()
- return mc.masters
- }
- func (mc *MasterClient) WaitUntilConnected() {
- for {
- if mc.getCurrentMaster() != "" {
- return
- }
- time.Sleep(time.Duration(rand.Int31n(200)) * time.Millisecond)
- }
- }
- func (mc *MasterClient) KeepConnectedToMaster() {
- glog.V(1).Infof("%s.%s masterClient bootstraps with masters %v", mc.FilerGroup, mc.clientType, mc.masters)
- for {
- mc.tryAllMasters()
- time.Sleep(time.Second)
- }
- }
- func (mc *MasterClient) FindLeaderFromOtherPeers(myMasterAddress pb.ServerAddress) (leader string) {
- for _, master := range mc.masters {
- if master == myMasterAddress {
- continue
- }
- if grpcErr := pb.WithMasterClient(false, master, mc.grpcDialOption, false, func(client master_pb.SeaweedClient) error {
- ctx, cancel := context.WithTimeout(context.Background(), 120*time.Millisecond)
- defer cancel()
- resp, err := client.GetMasterConfiguration(ctx, &master_pb.GetMasterConfigurationRequest{})
- if err != nil {
- return err
- }
- leader = resp.Leader
- return nil
- }); grpcErr != nil {
- glog.V(0).Infof("connect to %s: %v", master, grpcErr)
- }
- if leader != "" {
- glog.V(0).Infof("existing leader is %s", leader)
- return
- }
- }
- glog.V(0).Infof("No existing leader found!")
- return
- }
- func (mc *MasterClient) tryAllMasters() {
- var nextHintedLeader pb.ServerAddress
- for _, master := range mc.masters {
- nextHintedLeader = mc.tryConnectToMaster(master)
- for nextHintedLeader != "" {
- nextHintedLeader = mc.tryConnectToMaster(nextHintedLeader)
- }
- mc.setCurrentMaster("")
- }
- }
- func (mc *MasterClient) tryConnectToMaster(master pb.ServerAddress) (nextHintedLeader pb.ServerAddress) {
- glog.V(1).Infof("%s.%s masterClient Connecting to master %v", mc.FilerGroup, mc.clientType, master)
- stats.MasterClientConnectCounter.WithLabelValues("total").Inc()
- gprcErr := pb.WithMasterClient(true, master, mc.grpcDialOption, false, func(client master_pb.SeaweedClient) error {
- ctx, cancel := context.WithCancel(context.Background())
- defer cancel()
- stream, err := client.KeepConnected(ctx)
- if err != nil {
- glog.V(1).Infof("%s.%s masterClient failed to keep connected to %s: %v", mc.FilerGroup, mc.clientType, master, err)
- stats.MasterClientConnectCounter.WithLabelValues(stats.FailedToKeepConnected).Inc()
- return err
- }
- if err = stream.Send(&master_pb.KeepConnectedRequest{
- FilerGroup: mc.FilerGroup,
- DataCenter: mc.DataCenter,
- Rack: mc.rack,
- ClientType: mc.clientType,
- ClientAddress: string(mc.clientHost),
- Version: util.Version(),
- }); err != nil {
- glog.V(0).Infof("%s.%s masterClient failed to send to %s: %v", mc.FilerGroup, mc.clientType, master, err)
- stats.MasterClientConnectCounter.WithLabelValues(stats.FailedToSend).Inc()
- return err
- }
- glog.V(1).Infof("%s.%s masterClient Connected to %v", mc.FilerGroup, mc.clientType, master)
- resp, err := stream.Recv()
- if err != nil {
- glog.V(0).Infof("%s.%s masterClient failed to receive from %s: %v", mc.FilerGroup, mc.clientType, master, err)
- stats.MasterClientConnectCounter.WithLabelValues(stats.FailedToReceive).Inc()
- return err
- }
- // check if it is the leader to determine whether to reset the vidMap
- if resp.VolumeLocation != nil {
- if resp.VolumeLocation.Leader != "" && string(master) != resp.VolumeLocation.Leader {
- glog.V(0).Infof("master %v redirected to leader %v", master, resp.VolumeLocation.Leader)
- nextHintedLeader = pb.ServerAddress(resp.VolumeLocation.Leader)
- stats.MasterClientConnectCounter.WithLabelValues(stats.RedirectedToLeader).Inc()
- return nil
- }
- mc.resetVidMap()
- mc.updateVidMap(resp)
- } else {
- mc.resetVidMap()
- }
- mc.setCurrentMaster(master)
- for {
- resp, err := stream.Recv()
- if err != nil {
- glog.V(0).Infof("%s.%s masterClient failed to receive from %s: %v", mc.FilerGroup, mc.clientType, master, err)
- stats.MasterClientConnectCounter.WithLabelValues(stats.FailedToReceive).Inc()
- return err
- }
- if resp.VolumeLocation != nil {
- // maybe the leader is changed
- if resp.VolumeLocation.Leader != "" && string(mc.GetMaster()) != resp.VolumeLocation.Leader {
- glog.V(0).Infof("currentMaster %v redirected to leader %v", mc.GetMaster(), resp.VolumeLocation.Leader)
- nextHintedLeader = pb.ServerAddress(resp.VolumeLocation.Leader)
- stats.MasterClientConnectCounter.WithLabelValues(stats.RedirectedToLeader).Inc()
- return nil
- }
- mc.updateVidMap(resp)
- }
- if resp.ClusterNodeUpdate != nil {
- update := resp.ClusterNodeUpdate
- mc.OnPeerUpdateLock.RLock()
- if mc.OnPeerUpdate != nil {
- if update.FilerGroup == mc.FilerGroup {
- if update.IsAdd {
- glog.V(0).Infof("+ %s.%s %s leader:%v\n", update.FilerGroup, update.NodeType, update.Address, update.IsLeader)
- } else {
- glog.V(0).Infof("- %s.%s %s leader:%v\n", update.FilerGroup, update.NodeType, update.Address, update.IsLeader)
- }
- stats.MasterClientConnectCounter.WithLabelValues(stats.OnPeerUpdate).Inc()
- mc.OnPeerUpdate(update, time.Now())
- }
- }
- mc.OnPeerUpdateLock.RUnlock()
- }
- }
- })
- if gprcErr != nil {
- stats.MasterClientConnectCounter.WithLabelValues(stats.Failed).Inc()
- glog.V(1).Infof("%s.%s masterClient failed to connect with master %v: %v", mc.FilerGroup, mc.clientType, master, gprcErr)
- }
- return
- }
- func (mc *MasterClient) updateVidMap(resp *master_pb.KeepConnectedResponse) {
- if resp.VolumeLocation.IsEmptyUrl() {
- glog.V(0).Infof("updateVidMap ignore short heartbeat: %+v", resp)
- return
- }
- // process new volume location
- loc := Location{
- Url: resp.VolumeLocation.Url,
- PublicUrl: resp.VolumeLocation.PublicUrl,
- DataCenter: resp.VolumeLocation.DataCenter,
- GrpcPort: int(resp.VolumeLocation.GrpcPort),
- }
- for _, newVid := range resp.VolumeLocation.NewVids {
- glog.V(2).Infof("%s.%s: %s masterClient adds volume %d", mc.FilerGroup, mc.clientType, loc.Url, newVid)
- mc.addLocation(newVid, loc)
- }
- for _, deletedVid := range resp.VolumeLocation.DeletedVids {
- glog.V(2).Infof("%s.%s: %s masterClient removes volume %d", mc.FilerGroup, mc.clientType, loc.Url, deletedVid)
- mc.deleteLocation(deletedVid, loc)
- }
- for _, newEcVid := range resp.VolumeLocation.NewEcVids {
- glog.V(2).Infof("%s.%s: %s masterClient adds ec volume %d", mc.FilerGroup, mc.clientType, loc.Url, newEcVid)
- mc.addEcLocation(newEcVid, loc)
- }
- for _, deletedEcVid := range resp.VolumeLocation.DeletedEcVids {
- glog.V(2).Infof("%s.%s: %s masterClient removes ec volume %d", mc.FilerGroup, mc.clientType, loc.Url, deletedEcVid)
- mc.deleteEcLocation(deletedEcVid, loc)
- }
- glog.V(1).Infof("updateVidMap(%s) %s.%s: %s volume add: %d, del: %d, add ec: %d del ec: %d",
- resp.VolumeLocation.DataCenter, mc.FilerGroup, mc.clientType, loc.Url,
- len(resp.VolumeLocation.NewVids), len(resp.VolumeLocation.DeletedVids),
- len(resp.VolumeLocation.NewEcVids), len(resp.VolumeLocation.DeletedEcVids))
- }
- func (mc *MasterClient) WithClient(streamingMode bool, fn func(client master_pb.SeaweedClient) error) error {
- return util.Retry("master grpc", func() error {
- return pb.WithMasterClient(streamingMode, mc.GetMaster(), mc.grpcDialOption, false, func(client master_pb.SeaweedClient) error {
- return fn(client)
- })
- })
- }
- func (mc *MasterClient) resetVidMap() {
- tail := &vidMap{
- vid2Locations: mc.vid2Locations,
- ecVid2Locations: mc.ecVid2Locations,
- DataCenter: mc.DataCenter,
- cache: mc.cache,
- }
- nvm := newVidMap(mc.DataCenter)
- nvm.cache = tail
- mc.vidMap = nvm
- //trim
- for i := 0; i < mc.vidMapCacheSize && tail.cache != nil; i++ {
- if i == mc.vidMapCacheSize-1 {
- tail.cache = nil
- } else {
- tail = tail.cache
- }
- }
- }
|