You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							240 lines
						
					
					
						
							7.0 KiB
						
					
					
				
			
		
		
		
			
			
			
		
		
	
	
							240 lines
						
					
					
						
							7.0 KiB
						
					
					
				
								package topology
							 | 
						|
								
							 | 
						|
								import (
									"context"
									"encoding/json"
									"errors"
									"fmt"
									"net/http"
									"net/url"
									"sort"
									"strconv"
									"strings"
									"time"

									"github.com/seaweedfs/seaweedfs/weed/glog"
									"github.com/seaweedfs/seaweedfs/weed/operation"
									"github.com/seaweedfs/seaweedfs/weed/security"
									"github.com/seaweedfs/seaweedfs/weed/stats"
									"github.com/seaweedfs/seaweedfs/weed/storage"
									"github.com/seaweedfs/seaweedfs/weed/storage/needle"
									"github.com/seaweedfs/seaweedfs/weed/storage/types"
									"github.com/seaweedfs/seaweedfs/weed/util"
									"github.com/seaweedfs/seaweedfs/weed/util/buffer_pool"
									util_http "github.com/seaweedfs/seaweedfs/weed/util/http"
									"google.golang.org/grpc"
								)
							 | 
						|
								
							 | 
						|
								func ReplicatedWrite(ctx context.Context, masterFn operation.GetMasterFn, grpcDialOption grpc.DialOption, s *storage.Store, volumeId needle.VolumeId, n *needle.Needle, r *http.Request, contentMd5 string) (isUnchanged bool, err error) {
							 | 
						|
								
							 | 
						|
									//check JWT
							 | 
						|
									jwt := security.GetJwt(r)
							 | 
						|
								
							 | 
						|
									// check whether this is a replicated write request
							 | 
						|
									var remoteLocations []operation.Location
							 | 
						|
									if r.FormValue("type") != "replicate" {
							 | 
						|
										// this is the initial request
							 | 
						|
										remoteLocations, err = GetWritableRemoteReplications(s, grpcDialOption, volumeId, masterFn)
							 | 
						|
										if err != nil {
							 | 
						|
											glog.V(0).Infoln(err)
							 | 
						|
											return
							 | 
						|
										}
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									// read fsync value
							 | 
						|
									fsync := false
							 | 
						|
									if r.FormValue("fsync") == "true" {
							 | 
						|
										fsync = true
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									if s.GetVolume(volumeId) != nil {
							 | 
						|
										start := time.Now()
							 | 
						|
								
							 | 
						|
										inFlightGauge := stats.VolumeServerInFlightRequestsGauge.WithLabelValues(stats.WriteToLocalDisk)
							 | 
						|
										inFlightGauge.Inc()
							 | 
						|
										defer inFlightGauge.Dec()
							 | 
						|
								
							 | 
						|
										isUnchanged, err = s.WriteVolumeNeedle(volumeId, n, true, fsync)
							 | 
						|
										stats.VolumeServerRequestHistogram.WithLabelValues(stats.WriteToLocalDisk).Observe(time.Since(start).Seconds())
							 | 
						|
										if err != nil {
							 | 
						|
											stats.VolumeServerHandlerCounter.WithLabelValues(stats.ErrorWriteToLocalDisk).Inc()
							 | 
						|
											err = fmt.Errorf("failed to write to local disk: %w", err)
							 | 
						|
											glog.V(0).Infoln(err)
							 | 
						|
											return
							 | 
						|
										}
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									if len(remoteLocations) > 0 { //send to other replica locations
							 | 
						|
										start := time.Now()
							 | 
						|
								
							 | 
						|
										inFlightGauge := stats.VolumeServerInFlightRequestsGauge.WithLabelValues(stats.WriteToReplicas)
							 | 
						|
										inFlightGauge.Inc()
							 | 
						|
										defer inFlightGauge.Dec()
							 | 
						|
								
							 | 
						|
										err = DistributedOperation(remoteLocations, func(location operation.Location) error {
							 | 
						|
											u := url.URL{
							 | 
						|
												Scheme: "http",
							 | 
						|
												Host:   location.Url,
							 | 
						|
												Path:   r.URL.Path,
							 | 
						|
											}
							 | 
						|
											q := url.Values{
							 | 
						|
												"type": {"replicate"},
							 | 
						|
												"ttl":  {n.Ttl.String()},
							 | 
						|
											}
							 | 
						|
											if n.LastModified > 0 {
							 | 
						|
												q.Set("ts", strconv.FormatUint(n.LastModified, 10))
							 | 
						|
											}
							 | 
						|
											if n.IsChunkedManifest() {
							 | 
						|
												q.Set("cm", "true")
							 | 
						|
											}
							 | 
						|
											u.RawQuery = q.Encode()
							 | 
						|
								
							 | 
						|
											pairMap := make(map[string]string)
							 | 
						|
											if n.HasPairs() {
							 | 
						|
												tmpMap := make(map[string]string)
							 | 
						|
												err := json.Unmarshal(n.Pairs, &tmpMap)
							 | 
						|
												if err != nil {
							 | 
						|
													stats.VolumeServerHandlerCounter.WithLabelValues(stats.ErrorUnmarshalPairs).Inc()
							 | 
						|
													glog.V(0).Infoln("Unmarshal pairs error:", err)
							 | 
						|
												}
							 | 
						|
												for k, v := range tmpMap {
							 | 
						|
													pairMap[needle.PairNamePrefix+k] = v
							 | 
						|
												}
							 | 
						|
											}
							 | 
						|
											bytesBuffer := buffer_pool.SyncPoolGetBuffer()
							 | 
						|
											defer buffer_pool.SyncPoolPutBuffer(bytesBuffer)
							 | 
						|
								
							 | 
						|
											// volume server do not know about encryption
							 | 
						|
											// TODO optimize here to compress data only once
							 | 
						|
											uploadOption := &operation.UploadOption{
							 | 
						|
												UploadUrl:         u.String(),
							 | 
						|
												Filename:          string(n.Name),
							 | 
						|
												Cipher:            false,
							 | 
						|
												IsInputCompressed: n.IsCompressed(),
							 | 
						|
												MimeType:          string(n.Mime),
							 | 
						|
												PairMap:           pairMap,
							 | 
						|
												Jwt:               jwt,
							 | 
						|
												Md5:               contentMd5,
							 | 
						|
												BytesBuffer:       bytesBuffer,
							 | 
						|
											}
							 | 
						|
								
							 | 
						|
											uploader, err := operation.NewUploader()
							 | 
						|
											if err != nil {
							 | 
						|
												glog.Errorf("replication-UploadData, err:%v, url:%s", err, u.String())
							 | 
						|
												return err
							 | 
						|
											}
							 | 
						|
											_, err = uploader.UploadData(ctx, n.Data, uploadOption)
							 | 
						|
											if err != nil {
							 | 
						|
												glog.Errorf("replication-UploadData, err:%v, url:%s", err, u.String())
							 | 
						|
											}
							 | 
						|
											return err
							 | 
						|
										})
							 | 
						|
										stats.VolumeServerRequestHistogram.WithLabelValues(stats.WriteToReplicas).Observe(time.Since(start).Seconds())
							 | 
						|
										if err != nil {
							 | 
						|
											stats.VolumeServerHandlerCounter.WithLabelValues(stats.ErrorWriteToReplicas).Inc()
							 | 
						|
											err = fmt.Errorf("failed to write to replicas for volume %d: %v", volumeId, err)
							 | 
						|
											glog.V(0).Infoln(err)
							 | 
						|
											return false, err
							 | 
						|
										}
							 | 
						|
									}
							 | 
						|
									return
							 | 
						|
								}
							 | 
						|
								
							 | 
						|
								func ReplicatedDelete(masterFn operation.GetMasterFn, grpcDialOption grpc.DialOption, store *storage.Store, volumeId needle.VolumeId, n *needle.Needle, r *http.Request) (size types.Size, err error) {
							 | 
						|
								
							 | 
						|
									//check JWT
							 | 
						|
									jwt := security.GetJwt(r)
							 | 
						|
								
							 | 
						|
									var remoteLocations []operation.Location
							 | 
						|
									if r.FormValue("type") != "replicate" {
							 | 
						|
										remoteLocations, err = GetWritableRemoteReplications(store, grpcDialOption, volumeId, masterFn)
							 | 
						|
										if err != nil {
							 | 
						|
											glog.V(0).Infoln(err)
							 | 
						|
											return
							 | 
						|
										}
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									size, err = store.DeleteVolumeNeedle(volumeId, n)
							 | 
						|
									if err != nil {
							 | 
						|
										glog.V(0).Infoln("delete error:", err)
							 | 
						|
										return
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									if len(remoteLocations) > 0 { //send to other replica locations
							 | 
						|
										if err = DistributedOperation(remoteLocations, func(location operation.Location) error {
							 | 
						|
											return util_http.Delete("http://"+location.Url+r.URL.Path+"?type=replicate", string(jwt))
							 | 
						|
										}); err != nil {
							 | 
						|
											size = 0
							 | 
						|
										}
							 | 
						|
									}
							 | 
						|
									return
							 | 
						|
								}
							 | 
						|
								
							 | 
						|
								// DistributedOperationResult maps a host to the error its operation returned;
								// a nil value means the operation succeeded on that host.
								type DistributedOperationResult map[string]error

								// Error combines all non-nil per-host errors into a single error, one
								// "[host]: err" line per failing host, joined by newlines. It returns nil
								// when no host failed.
								//
								// Hosts are reported in sorted order: map iteration order is unspecified, so
								// without sorting the same set of failures could produce differently ordered
								// messages from one call to the next.
								func (dr DistributedOperationResult) Error() error {
									failedHosts := make([]string, 0, len(dr))
									for host, hostErr := range dr {
										if hostErr != nil {
											failedHosts = append(failedHosts, host)
										}
									}
									if len(failedHosts) == 0 {
										return nil
									}
									sort.Strings(failedHosts)

									lines := make([]string, 0, len(failedHosts))
									for _, host := range failedHosts {
										lines = append(lines, fmt.Sprintf("[%s]: %v", host, dr[host]))
									}
									return errors.New(strings.Join(lines, "\n"))
								}
							 | 
						|
								
							 | 
						|
								// RemoteResult is the outcome of running an operation against one remote
								// location; DistributedOperation sends one per location over its result
								// channel.
								type RemoteResult struct {
									// Host is the Url of the location the operation ran against.
									Host  string
									// Error is the error returned by the operation, nil on success.
									Error error
								}
							 | 
						|
								
							 | 
						|
								func DistributedOperation(locations []operation.Location, op func(location operation.Location) error) error {
							 | 
						|
									length := len(locations)
							 | 
						|
									results := make(chan RemoteResult)
							 | 
						|
									for _, location := range locations {
							 | 
						|
										go func(location operation.Location, results chan RemoteResult) {
							 | 
						|
											results <- RemoteResult{location.Url, op(location)}
							 | 
						|
										}(location, results)
							 | 
						|
									}
							 | 
						|
									ret := DistributedOperationResult(make(map[string]error))
							 | 
						|
									for i := 0; i < length; i++ {
							 | 
						|
										result := <-results
							 | 
						|
										ret[result.Host] = result.Error
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									return ret.Error()
							 | 
						|
								}
							 | 
						|
								
							 | 
						|
								func GetWritableRemoteReplications(s *storage.Store, grpcDialOption grpc.DialOption, volumeId needle.VolumeId, masterFn operation.GetMasterFn) (remoteLocations []operation.Location, err error) {
							 | 
						|
								
							 | 
						|
									v := s.GetVolume(volumeId)
							 | 
						|
									if v != nil && v.ReplicaPlacement.GetCopyCount() == 1 {
							 | 
						|
										return
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									// not on local store, or has replications
							 | 
						|
									lookupResult, lookupErr := operation.LookupVolumeId(masterFn, grpcDialOption, volumeId.String())
							 | 
						|
									if lookupErr == nil {
							 | 
						|
										selfUrl := util.JoinHostPort(s.Ip, s.Port)
							 | 
						|
										for _, location := range lookupResult.Locations {
							 | 
						|
											if location.Url != selfUrl {
							 | 
						|
												remoteLocations = append(remoteLocations, location)
							 | 
						|
											}
							 | 
						|
										}
							 | 
						|
									} else {
							 | 
						|
										err = fmt.Errorf("replicating lookup failed for %d: %v", volumeId, lookupErr)
							 | 
						|
										return
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									if v != nil {
							 | 
						|
										// has one local and has remote replications
							 | 
						|
										copyCount := v.ReplicaPlacement.GetCopyCount()
							 | 
						|
										if len(lookupResult.Locations) < copyCount {
							 | 
						|
											err = fmt.Errorf("replicating operations [%d] is less than volume %d replication copy count [%d]",
							 | 
						|
												len(lookupResult.Locations), volumeId, copyCount)
							 | 
						|
										}
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									return
							 | 
						|
								}
							 |