You cannot select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							240 lines
						
					
					
						
							7.0 KiB
						
					
					
				
			
		
		
		
			
			
			
		
		
	
	
							240 lines
						
					
					
						
							7.0 KiB
						
					
					
				| package topology | |
| 
 | |
import (
	"context"
	"encoding/json"
	"errors"
	"fmt"
	"net/http"
	"net/url"
	"sort"
	"strconv"
	"strings"
	"time"

	"google.golang.org/grpc"

	"github.com/seaweedfs/seaweedfs/weed/glog"
	"github.com/seaweedfs/seaweedfs/weed/operation"
	"github.com/seaweedfs/seaweedfs/weed/security"
	"github.com/seaweedfs/seaweedfs/weed/stats"
	"github.com/seaweedfs/seaweedfs/weed/storage"
	"github.com/seaweedfs/seaweedfs/weed/storage/needle"
	"github.com/seaweedfs/seaweedfs/weed/storage/types"
	"github.com/seaweedfs/seaweedfs/weed/util"
	"github.com/seaweedfs/seaweedfs/weed/util/buffer_pool"
	util_http "github.com/seaweedfs/seaweedfs/weed/util/http"
)
| 
 | |
| func ReplicatedWrite(ctx context.Context, masterFn operation.GetMasterFn, grpcDialOption grpc.DialOption, s *storage.Store, volumeId needle.VolumeId, n *needle.Needle, r *http.Request, contentMd5 string) (isUnchanged bool, err error) { | |
| 
 | |
| 	//check JWT | |
| 	jwt := security.GetJwt(r) | |
| 
 | |
| 	// check whether this is a replicated write request | |
| 	var remoteLocations []operation.Location | |
| 	if r.FormValue("type") != "replicate" { | |
| 		// this is the initial request | |
| 		remoteLocations, err = GetWritableRemoteReplications(s, grpcDialOption, volumeId, masterFn) | |
| 		if err != nil { | |
| 			glog.V(0).Infoln(err) | |
| 			return | |
| 		} | |
| 	} | |
| 
 | |
| 	// read fsync value | |
| 	fsync := false | |
| 	if r.FormValue("fsync") == "true" { | |
| 		fsync = true | |
| 	} | |
| 
 | |
| 	if s.GetVolume(volumeId) != nil { | |
| 		start := time.Now() | |
| 
 | |
| 		inFlightGauge := stats.VolumeServerInFlightRequestsGauge.WithLabelValues(stats.WriteToLocalDisk) | |
| 		inFlightGauge.Inc() | |
| 		defer inFlightGauge.Dec() | |
| 
 | |
| 		isUnchanged, err = s.WriteVolumeNeedle(volumeId, n, true, fsync) | |
| 		stats.VolumeServerRequestHistogram.WithLabelValues(stats.WriteToLocalDisk).Observe(time.Since(start).Seconds()) | |
| 		if err != nil { | |
| 			stats.VolumeServerHandlerCounter.WithLabelValues(stats.ErrorWriteToLocalDisk).Inc() | |
| 			err = fmt.Errorf("failed to write to local disk: %v", err) | |
| 			glog.V(0).Infoln(err) | |
| 			return | |
| 		} | |
| 	} | |
| 
 | |
| 	if len(remoteLocations) > 0 { //send to other replica locations | |
| 		start := time.Now() | |
| 
 | |
| 		inFlightGauge := stats.VolumeServerInFlightRequestsGauge.WithLabelValues(stats.WriteToReplicas) | |
| 		inFlightGauge.Inc() | |
| 		defer inFlightGauge.Dec() | |
| 
 | |
| 		err = DistributedOperation(remoteLocations, func(location operation.Location) error { | |
| 			u := url.URL{ | |
| 				Scheme: "http", | |
| 				Host:   location.Url, | |
| 				Path:   r.URL.Path, | |
| 			} | |
| 			q := url.Values{ | |
| 				"type": {"replicate"}, | |
| 				"ttl":  {n.Ttl.String()}, | |
| 			} | |
| 			if n.LastModified > 0 { | |
| 				q.Set("ts", strconv.FormatUint(n.LastModified, 10)) | |
| 			} | |
| 			if n.IsChunkedManifest() { | |
| 				q.Set("cm", "true") | |
| 			} | |
| 			u.RawQuery = q.Encode() | |
| 
 | |
| 			pairMap := make(map[string]string) | |
| 			if n.HasPairs() { | |
| 				tmpMap := make(map[string]string) | |
| 				err := json.Unmarshal(n.Pairs, &tmpMap) | |
| 				if err != nil { | |
| 					stats.VolumeServerHandlerCounter.WithLabelValues(stats.ErrorUnmarshalPairs).Inc() | |
| 					glog.V(0).Infoln("Unmarshal pairs error:", err) | |
| 				} | |
| 				for k, v := range tmpMap { | |
| 					pairMap[needle.PairNamePrefix+k] = v | |
| 				} | |
| 			} | |
| 			bytesBuffer := buffer_pool.SyncPoolGetBuffer() | |
| 			defer buffer_pool.SyncPoolPutBuffer(bytesBuffer) | |
| 
 | |
| 			// volume server do not know about encryption | |
| 			// TODO optimize here to compress data only once | |
| 			uploadOption := &operation.UploadOption{ | |
| 				UploadUrl:         u.String(), | |
| 				Filename:          string(n.Name), | |
| 				Cipher:            false, | |
| 				IsInputCompressed: n.IsCompressed(), | |
| 				MimeType:          string(n.Mime), | |
| 				PairMap:           pairMap, | |
| 				Jwt:               jwt, | |
| 				Md5:               contentMd5, | |
| 				BytesBuffer:       bytesBuffer, | |
| 			} | |
| 
 | |
| 			uploader, err := operation.NewUploader() | |
| 			if err != nil { | |
| 				glog.Errorf("replication-UploadData, err:%v, url:%s", err, u.String()) | |
| 				return err | |
| 			} | |
| 			_, err = uploader.UploadData(ctx, n.Data, uploadOption) | |
| 			if err != nil { | |
| 				glog.Errorf("replication-UploadData, err:%v, url:%s", err, u.String()) | |
| 			} | |
| 			return err | |
| 		}) | |
| 		stats.VolumeServerRequestHistogram.WithLabelValues(stats.WriteToReplicas).Observe(time.Since(start).Seconds()) | |
| 		if err != nil { | |
| 			stats.VolumeServerHandlerCounter.WithLabelValues(stats.ErrorWriteToReplicas).Inc() | |
| 			err = fmt.Errorf("failed to write to replicas for volume %d: %v", volumeId, err) | |
| 			glog.V(0).Infoln(err) | |
| 			return false, err | |
| 		} | |
| 	} | |
| 	return | |
| } | |
| 
 | |
| func ReplicatedDelete(masterFn operation.GetMasterFn, grpcDialOption grpc.DialOption, store *storage.Store, volumeId needle.VolumeId, n *needle.Needle, r *http.Request) (size types.Size, err error) { | |
| 
 | |
| 	//check JWT | |
| 	jwt := security.GetJwt(r) | |
| 
 | |
| 	var remoteLocations []operation.Location | |
| 	if r.FormValue("type") != "replicate" { | |
| 		remoteLocations, err = GetWritableRemoteReplications(store, grpcDialOption, volumeId, masterFn) | |
| 		if err != nil { | |
| 			glog.V(0).Infoln(err) | |
| 			return | |
| 		} | |
| 	} | |
| 
 | |
| 	size, err = store.DeleteVolumeNeedle(volumeId, n) | |
| 	if err != nil { | |
| 		glog.V(0).Infoln("delete error:", err) | |
| 		return | |
| 	} | |
| 
 | |
| 	if len(remoteLocations) > 0 { //send to other replica locations | |
| 		if err = DistributedOperation(remoteLocations, func(location operation.Location) error { | |
| 			return util_http.Delete("http://"+location.Url+r.URL.Path+"?type=replicate", string(jwt)) | |
| 		}); err != nil { | |
| 			size = 0 | |
| 		} | |
| 	} | |
| 	return | |
| } | |
| 
 | |
// DistributedOperationResult maps a remote host to the error returned by the
// operation on that host. A nil value means the operation succeeded there.
type DistributedOperationResult map[string]error

// Error combines every non-nil per-host error into a single error with one
// "[host]: err" line per failed host, or returns nil when no host failed.
//
// Lines are ordered by host name. Map iteration order is randomized in Go, so
// without the sort the same set of failures would produce a differently
// ordered message on each call.
func (dr DistributedOperationResult) Error() error {
	failedHosts := make([]string, 0, len(dr))
	for host, hostErr := range dr {
		if hostErr != nil {
			failedHosts = append(failedHosts, host)
		}
	}
	if len(failedHosts) == 0 {
		return nil
	}
	sort.Strings(failedHosts)

	lines := make([]string, len(failedHosts))
	for i, host := range failedHosts {
		lines[i] = fmt.Sprintf("[%s]: %v", host, dr[host])
	}
	return errors.New(strings.Join(lines, "\n"))
}
| 
 | |
// RemoteResult pairs a remote host with the outcome of one operation run
// against it. DistributedOperation sends one RemoteResult per location over
// its result channel.
type RemoteResult struct {
	// Host identifies the remote location; DistributedOperation fills it
	// with the location's Url.
	Host string
	// Error is the value returned by the operation for Host.
	Error error
}
| 
 | |
| func DistributedOperation(locations []operation.Location, op func(location operation.Location) error) error { | |
| 	length := len(locations) | |
| 	results := make(chan RemoteResult) | |
| 	for _, location := range locations { | |
| 		go func(location operation.Location, results chan RemoteResult) { | |
| 			results <- RemoteResult{location.Url, op(location)} | |
| 		}(location, results) | |
| 	} | |
| 	ret := DistributedOperationResult(make(map[string]error)) | |
| 	for i := 0; i < length; i++ { | |
| 		result := <-results | |
| 		ret[result.Host] = result.Error | |
| 	} | |
| 
 | |
| 	return ret.Error() | |
| } | |
| 
 | |
| func GetWritableRemoteReplications(s *storage.Store, grpcDialOption grpc.DialOption, volumeId needle.VolumeId, masterFn operation.GetMasterFn) (remoteLocations []operation.Location, err error) { | |
| 
 | |
| 	v := s.GetVolume(volumeId) | |
| 	if v != nil && v.ReplicaPlacement.GetCopyCount() == 1 { | |
| 		return | |
| 	} | |
| 
 | |
| 	// not on local store, or has replications | |
| 	lookupResult, lookupErr := operation.LookupVolumeId(masterFn, grpcDialOption, volumeId.String()) | |
| 	if lookupErr == nil { | |
| 		selfUrl := util.JoinHostPort(s.Ip, s.Port) | |
| 		for _, location := range lookupResult.Locations { | |
| 			if location.Url != selfUrl { | |
| 				remoteLocations = append(remoteLocations, location) | |
| 			} | |
| 		} | |
| 	} else { | |
| 		err = fmt.Errorf("replicating lookup failed for %d: %v", volumeId, lookupErr) | |
| 		return | |
| 	} | |
| 
 | |
| 	if v != nil { | |
| 		// has one local and has remote replications | |
| 		copyCount := v.ReplicaPlacement.GetCopyCount() | |
| 		if len(lookupResult.Locations) < copyCount { | |
| 			err = fmt.Errorf("replicating operations [%d] is less than volume %d replication copy count [%d]", | |
| 				len(lookupResult.Locations), volumeId, copyCount) | |
| 		} | |
| 	} | |
| 
 | |
| 	return | |
| }
 |