123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229 |
- package topology
import (
	"encoding/json"
	"errors"
	"fmt"
	"net/http"
	"net/url"
	"sort"
	"strconv"
	"strings"
	"time"

	"github.com/seaweedfs/seaweedfs/weed/glog"
	"github.com/seaweedfs/seaweedfs/weed/operation"
	"github.com/seaweedfs/seaweedfs/weed/security"
	"github.com/seaweedfs/seaweedfs/weed/stats"
	"github.com/seaweedfs/seaweedfs/weed/storage"
	"github.com/seaweedfs/seaweedfs/weed/storage/needle"
	"github.com/seaweedfs/seaweedfs/weed/storage/types"
	"github.com/seaweedfs/seaweedfs/weed/util"
	"github.com/seaweedfs/seaweedfs/weed/util/buffer_pool"
	util_http "github.com/seaweedfs/seaweedfs/weed/util/http"
	"google.golang.org/grpc"
)
- func ReplicatedWrite(masterFn operation.GetMasterFn, grpcDialOption grpc.DialOption, s *storage.Store, volumeId needle.VolumeId, n *needle.Needle, r *http.Request, contentMd5 string) (isUnchanged bool, err error) {
- //check JWT
- jwt := security.GetJwt(r)
- // check whether this is a replicated write request
- var remoteLocations []operation.Location
- if r.FormValue("type") != "replicate" {
- // this is the initial request
- remoteLocations, err = GetWritableRemoteReplications(s, grpcDialOption, volumeId, masterFn)
- if err != nil {
- glog.V(0).Infoln(err)
- return
- }
- }
- // read fsync value
- fsync := false
- if r.FormValue("fsync") == "true" {
- fsync = true
- }
- if s.GetVolume(volumeId) != nil {
- start := time.Now()
- isUnchanged, err = s.WriteVolumeNeedle(volumeId, n, true, fsync)
- stats.VolumeServerRequestHistogram.WithLabelValues(stats.WriteToLocalDisk).Observe(time.Since(start).Seconds())
- if err != nil {
- stats.VolumeServerHandlerCounter.WithLabelValues(stats.ErrorWriteToLocalDisk).Inc()
- err = fmt.Errorf("failed to write to local disk: %v", err)
- glog.V(0).Infoln(err)
- return
- }
- }
- if len(remoteLocations) > 0 { //send to other replica locations
- start := time.Now()
- err = DistributedOperation(remoteLocations, func(location operation.Location) error {
- u := url.URL{
- Scheme: "http",
- Host: location.Url,
- Path: r.URL.Path,
- }
- q := url.Values{
- "type": {"replicate"},
- "ttl": {n.Ttl.String()},
- }
- if n.LastModified > 0 {
- q.Set("ts", strconv.FormatUint(n.LastModified, 10))
- }
- if n.IsChunkedManifest() {
- q.Set("cm", "true")
- }
- u.RawQuery = q.Encode()
- pairMap := make(map[string]string)
- if n.HasPairs() {
- tmpMap := make(map[string]string)
- err := json.Unmarshal(n.Pairs, &tmpMap)
- if err != nil {
- stats.VolumeServerHandlerCounter.WithLabelValues(stats.ErrorUnmarshalPairs).Inc()
- glog.V(0).Infoln("Unmarshal pairs error:", err)
- }
- for k, v := range tmpMap {
- pairMap[needle.PairNamePrefix+k] = v
- }
- }
- bytesBuffer := buffer_pool.SyncPoolGetBuffer()
- defer buffer_pool.SyncPoolPutBuffer(bytesBuffer)
- // volume server do not know about encryption
- // TODO optimize here to compress data only once
- uploadOption := &operation.UploadOption{
- UploadUrl: u.String(),
- Filename: string(n.Name),
- Cipher: false,
- IsInputCompressed: n.IsCompressed(),
- MimeType: string(n.Mime),
- PairMap: pairMap,
- Jwt: jwt,
- Md5: contentMd5,
- BytesBuffer: bytesBuffer,
- }
- uploader, err := operation.NewUploader()
- if err != nil {
- glog.Errorf("replication-UploadData, err:%v, url:%s", err, u.String())
- return err
- }
- _, err = uploader.UploadData(n.Data, uploadOption)
- if err != nil {
- glog.Errorf("replication-UploadData, err:%v, url:%s", err, u.String())
- }
- return err
- })
- stats.VolumeServerRequestHistogram.WithLabelValues(stats.WriteToReplicas).Observe(time.Since(start).Seconds())
- if err != nil {
- stats.VolumeServerHandlerCounter.WithLabelValues(stats.ErrorWriteToReplicas).Inc()
- err = fmt.Errorf("failed to write to replicas for volume %d: %v", volumeId, err)
- glog.V(0).Infoln(err)
- return false, err
- }
- }
- return
- }
- func ReplicatedDelete(masterFn operation.GetMasterFn, grpcDialOption grpc.DialOption, store *storage.Store, volumeId needle.VolumeId, n *needle.Needle, r *http.Request) (size types.Size, err error) {
- //check JWT
- jwt := security.GetJwt(r)
- var remoteLocations []operation.Location
- if r.FormValue("type") != "replicate" {
- remoteLocations, err = GetWritableRemoteReplications(store, grpcDialOption, volumeId, masterFn)
- if err != nil {
- glog.V(0).Infoln(err)
- return
- }
- }
- size, err = store.DeleteVolumeNeedle(volumeId, n)
- if err != nil {
- glog.V(0).Infoln("delete error:", err)
- return
- }
- if len(remoteLocations) > 0 { //send to other replica locations
- if err = DistributedOperation(remoteLocations, func(location operation.Location) error {
- return util_http.Delete("http://"+location.Url+r.URL.Path+"?type=replicate", string(jwt))
- }); err != nil {
- size = 0
- }
- }
- return
- }
// DistributedOperationResult maps a remote host to the error returned by the
// operation run against it. A nil value records that the host succeeded.
type DistributedOperationResult map[string]error

// Error folds the per-host failures into a single error, or returns nil when
// no host failed. Each failure is rendered as "[host]: error" and the entries
// are joined with newlines.
//
// Hosts are reported in ascending order. Go randomizes map iteration order,
// so sorting is what keeps the message identical from one call to the next.
func (dr DistributedOperationResult) Error() error {
	failedHosts := make([]string, 0, len(dr))
	for host, err := range dr {
		if err != nil {
			failedHosts = append(failedHosts, host)
		}
	}
	if len(failedHosts) == 0 {
		return nil
	}
	sort.Strings(failedHosts)

	lines := make([]string, len(failedHosts))
	for i, host := range failedHosts {
		lines[i] = fmt.Sprintf("[%s]: %v", host, dr[host])
	}
	return errors.New(strings.Join(lines, "\n"))
}
// RemoteResult pairs a remote host with the outcome of the operation that was
// run against it.
type RemoteResult struct {
	// Host identifies the remote the operation was run against.
	Host string
	// Error is what the operation returned for Host; nil means it succeeded.
	Error error
}
- func DistributedOperation(locations []operation.Location, op func(location operation.Location) error) error {
- length := len(locations)
- results := make(chan RemoteResult)
- for _, location := range locations {
- go func(location operation.Location, results chan RemoteResult) {
- results <- RemoteResult{location.Url, op(location)}
- }(location, results)
- }
- ret := DistributedOperationResult(make(map[string]error))
- for i := 0; i < length; i++ {
- result := <-results
- ret[result.Host] = result.Error
- }
- return ret.Error()
- }
- func GetWritableRemoteReplications(s *storage.Store, grpcDialOption grpc.DialOption, volumeId needle.VolumeId, masterFn operation.GetMasterFn) (remoteLocations []operation.Location, err error) {
- v := s.GetVolume(volumeId)
- if v != nil && v.ReplicaPlacement.GetCopyCount() == 1 {
- return
- }
- // not on local store, or has replications
- lookupResult, lookupErr := operation.LookupVolumeId(masterFn, grpcDialOption, volumeId.String())
- if lookupErr == nil {
- selfUrl := util.JoinHostPort(s.Ip, s.Port)
- for _, location := range lookupResult.Locations {
- if location.Url != selfUrl {
- remoteLocations = append(remoteLocations, location)
- }
- }
- } else {
- err = fmt.Errorf("replicating lookup failed for %d: %v", volumeId, lookupErr)
- return
- }
- if v != nil {
- // has one local and has remote replications
- copyCount := v.ReplicaPlacement.GetCopyCount()
- if len(lookupResult.Locations) < copyCount {
- err = fmt.Errorf("replicating operations [%d] is less than volume %d replication copy count [%d]",
- len(lookupResult.Locations), volumeId, copyCount)
- }
- }
- return
- }
|