aboutsummaryrefslogtreecommitdiff
path: root/weed/wdclient/vidmap_client.go
diff options
context:
space:
mode:
Diffstat (limited to 'weed/wdclient/vidmap_client.go')
-rw-r--r--weed/wdclient/vidmap_client.go347
1 files changed, 347 insertions, 0 deletions
diff --git a/weed/wdclient/vidmap_client.go b/weed/wdclient/vidmap_client.go
new file mode 100644
index 000000000..402eaf8c4
--- /dev/null
+++ b/weed/wdclient/vidmap_client.go
@@ -0,0 +1,347 @@
+package wdclient
+
+import (
+ "context"
+ "errors"
+ "fmt"
+ "math/rand"
+ "sort"
+ "strconv"
+ "strings"
+ "sync"
+
+ "golang.org/x/sync/singleflight"
+
+ "github.com/seaweedfs/seaweedfs/weed/glog"
+)
+
+// VolumeLocationProvider is the interface for looking up volume locations
+// This allows different implementations (master subscription, filer queries, etc.)
+type VolumeLocationProvider interface {
+ // LookupVolumeIds looks up volume locations for the given volume IDs
+ // Returns a map of volume ID to locations
+ LookupVolumeIds(ctx context.Context, volumeIds []string) (map[string][]Location, error)
+}
+
+// vidMapClient provides volume location caching with pluggable lookup
+// It wraps the battle-tested vidMap with customizable volume lookup strategies
+type vidMapClient struct {
+ vidMap *vidMap
+ vidMapLock sync.RWMutex
+ vidMapCacheSize int
+ provider VolumeLocationProvider
+ vidLookupGroup singleflight.Group
+}
+
+const (
+ // DefaultVidMapCacheSize is the default number of historical vidMap snapshots to keep
+ // This provides cache history when volumes move between servers
+ DefaultVidMapCacheSize = 5
+)
+
+// newVidMapClient creates a new client with the given provider and data center
+func newVidMapClient(provider VolumeLocationProvider, dataCenter string, cacheSize int) *vidMapClient {
+ if cacheSize <= 0 {
+ cacheSize = DefaultVidMapCacheSize
+ }
+ return &vidMapClient{
+ vidMap: newVidMap(dataCenter),
+ vidMapCacheSize: cacheSize,
+ provider: provider,
+ }
+}
+
+// GetLookupFileIdFunction returns a function that can be used to lookup file IDs
+func (vc *vidMapClient) GetLookupFileIdFunction() LookupFileIdFunctionType {
+ return vc.LookupFileIdWithFallback
+}
+
+// LookupFileIdWithFallback looks up a file ID, checking cache first, then using provider
+func (vc *vidMapClient) LookupFileIdWithFallback(ctx context.Context, fileId string) (fullUrls []string, err error) {
+ // Try cache first - hold read lock during entire vidMap access to prevent swap during operation
+ vc.vidMapLock.RLock()
+ vm := vc.vidMap
+ dataCenter := vm.DataCenter
+ fullUrls, err = vm.LookupFileId(ctx, fileId)
+ vc.vidMapLock.RUnlock()
+
+ // Cache hit - return immediately
+ if err == nil && len(fullUrls) > 0 {
+ return
+ }
+
+ // Cache miss - extract volume ID from file ID (format: "volumeId,needle_id_cookie")
+ parts := strings.Split(fileId, ",")
+ if len(parts) != 2 {
+ return nil, fmt.Errorf("invalid fileId %s", fileId)
+ }
+ volumeId := parts[0]
+
+ // Use shared lookup logic with batching and singleflight
+ vidLocations, err := vc.LookupVolumeIdsWithFallback(ctx, []string{volumeId})
+
+ // Check for partial results first (important for multi-volume batched lookups)
+ locations, found := vidLocations[volumeId]
+ if !found || len(locations) == 0 {
+ // Volume not found - return specific error with context from lookup if available
+ if err != nil {
+ return nil, fmt.Errorf("volume %s not found for fileId %s: %w", volumeId, fileId, err)
+ }
+ return nil, fmt.Errorf("volume %s not found for fileId %s", volumeId, fileId)
+ }
+
+ // Volume found successfully - ignore any errors about other volumes
+ // (not relevant for single-volume lookup, but defensive for future batching)
+
+ // Build HTTP URLs from locations, preferring same data center
+ var sameDcUrls, otherDcUrls []string
+ for _, loc := range locations {
+ httpUrl := "http://" + loc.Url + "/" + fileId
+ if dataCenter != "" && dataCenter == loc.DataCenter {
+ sameDcUrls = append(sameDcUrls, httpUrl)
+ } else {
+ otherDcUrls = append(otherDcUrls, httpUrl)
+ }
+ }
+
+ // Shuffle to distribute load across volume servers
+ rand.Shuffle(len(sameDcUrls), func(i, j int) { sameDcUrls[i], sameDcUrls[j] = sameDcUrls[j], sameDcUrls[i] })
+ rand.Shuffle(len(otherDcUrls), func(i, j int) { otherDcUrls[i], otherDcUrls[j] = otherDcUrls[j], otherDcUrls[i] })
+
+ // Prefer same data center
+ fullUrls = append(sameDcUrls, otherDcUrls...)
+ return fullUrls, nil
+}
+
+// LookupVolumeIdsWithFallback looks up volume locations, querying provider if not in cache.
+// Uses singleflight to coalesce concurrent requests for the same batch of volumes.
+//
+// IMPORTANT: This function may return PARTIAL results with a non-nil error.
+// The result map contains successfully looked up volumes, while the error aggregates
+// failures for volumes that couldn't be found or had lookup errors.
+//
+// Callers MUST check both the result map AND the error:
+// - result != nil && err == nil: All volumes found successfully
+// - result != nil && err != nil: Some volumes found, some failed (check both)
+// - result == nil && err != nil: Complete failure (connection error, etc.)
+//
+// Example usage:
+//
+// locs, err := mc.LookupVolumeIdsWithFallback(ctx, []string{"1", "2", "999"})
+// if len(locs) > 0 {
+// // Process successfully found volumes
+// }
+// if err != nil {
+// // Log/handle failed volumes
+// }
+func (vc *vidMapClient) LookupVolumeIdsWithFallback(ctx context.Context, volumeIds []string) (map[string][]Location, error) {
+ result := make(map[string][]Location)
+ var needsLookup []string
+ var lookupErrors []error
+
+ // Check cache first and parse volume IDs once
+ vidStringToUint := make(map[string]uint32, len(volumeIds))
+
+ // Get stable pointer to vidMap with minimal lock hold time
+ vm := vc.getStableVidMap()
+
+ for _, vidString := range volumeIds {
+ vid, err := strconv.ParseUint(vidString, 10, 32)
+ if err != nil {
+ return nil, fmt.Errorf("invalid volume id %s: %v", vidString, err)
+ }
+ vidStringToUint[vidString] = uint32(vid)
+
+ locations, found := vm.GetLocations(uint32(vid))
+ if found && len(locations) > 0 {
+ result[vidString] = locations
+ } else {
+ needsLookup = append(needsLookup, vidString)
+ }
+ }
+
+ if len(needsLookup) == 0 {
+ return result, nil
+ }
+
+ // Batch query all missing volumes using singleflight on the batch key
+ // Sort for stable key to coalesce identical batches
+ sort.Strings(needsLookup)
+ batchKey := strings.Join(needsLookup, ",")
+
+ sfResult, err, _ := vc.vidLookupGroup.Do(batchKey, func() (interface{}, error) {
+ // Double-check cache for volumes that might have been populated while waiting
+ stillNeedLookup := make([]string, 0, len(needsLookup))
+ batchResult := make(map[string][]Location)
+
+ // Get stable pointer with minimal lock hold time
+ vm := vc.getStableVidMap()
+
+ for _, vidString := range needsLookup {
+ vid := vidStringToUint[vidString] // Use pre-parsed value
+ if locations, found := vm.GetLocations(vid); found && len(locations) > 0 {
+ batchResult[vidString] = locations
+ } else {
+ stillNeedLookup = append(stillNeedLookup, vidString)
+ }
+ }
+
+ if len(stillNeedLookup) == 0 {
+ return batchResult, nil
+ }
+
+ // Query provider with batched volume IDs
+ glog.V(2).Infof("Looking up %d volumes from provider: %v", len(stillNeedLookup), stillNeedLookup)
+
+ providerResults, err := vc.provider.LookupVolumeIds(ctx, stillNeedLookup)
+ if err != nil {
+ return batchResult, fmt.Errorf("provider lookup failed: %v", err)
+ }
+
+ // Update cache with results
+ for vidString, locations := range providerResults {
+ vid, err := strconv.ParseUint(vidString, 10, 32)
+ if err != nil {
+ glog.Warningf("Failed to parse volume id '%s': %v", vidString, err)
+ continue
+ }
+
+ for _, loc := range locations {
+ vc.addLocation(uint32(vid), loc)
+ }
+
+ if len(locations) > 0 {
+ batchResult[vidString] = locations
+ }
+ }
+
+ return batchResult, nil
+ })
+
+ if err != nil {
+ lookupErrors = append(lookupErrors, err)
+ }
+
+ // Merge singleflight batch results
+ if batchLocations, ok := sfResult.(map[string][]Location); ok {
+ for vid, locs := range batchLocations {
+ result[vid] = locs
+ }
+ }
+
+ // Check for volumes that still weren't found
+ for _, vidString := range needsLookup {
+ if _, found := result[vidString]; !found {
+ lookupErrors = append(lookupErrors, fmt.Errorf("volume %s not found", vidString))
+ }
+ }
+
+ // Return aggregated errors
+ return result, errors.Join(lookupErrors...)
+}
+
+// getStableVidMap gets a stable pointer to the vidMap, releasing the lock immediately.
+// WARNING: Use with caution. The returned vidMap pointer is stable (won't be garbage collected
+// due to cache chain), but the vidMapClient.vidMap field may be swapped by resetVidMap().
+// For operations that must use the current vidMap atomically, use withCurrentVidMap() instead.
+func (vc *vidMapClient) getStableVidMap() *vidMap {
+ vc.vidMapLock.RLock()
+ vm := vc.vidMap
+ vc.vidMapLock.RUnlock()
+ return vm
+}
+
+// withCurrentVidMap executes a function with the current vidMap under a read lock.
+// This guarantees the vidMap instance cannot be swapped during the function execution.
+// Use this when you need atomic access to the current vidMap for multiple operations.
+func (vc *vidMapClient) withCurrentVidMap(f func(vm *vidMap)) {
+ vc.vidMapLock.RLock()
+ defer vc.vidMapLock.RUnlock()
+ f(vc.vidMap)
+}
+
+// Public methods for external access
+
+// GetLocations safely retrieves volume locations
+func (vc *vidMapClient) GetLocations(vid uint32) (locations []Location, found bool) {
+ return vc.getStableVidMap().GetLocations(vid)
+}
+
+// GetLocationsClone safely retrieves a clone of volume locations
+func (vc *vidMapClient) GetLocationsClone(vid uint32) (locations []Location, found bool) {
+ return vc.getStableVidMap().GetLocationsClone(vid)
+}
+
+// GetVidLocations safely retrieves volume locations by string ID
+func (vc *vidMapClient) GetVidLocations(vid string) (locations []Location, err error) {
+ return vc.getStableVidMap().GetVidLocations(vid)
+}
+
+// LookupFileId safely looks up URLs for a file ID
+func (vc *vidMapClient) LookupFileId(ctx context.Context, fileId string) (fullUrls []string, err error) {
+ return vc.getStableVidMap().LookupFileId(ctx, fileId)
+}
+
+// LookupVolumeServerUrl safely looks up volume server URLs
+func (vc *vidMapClient) LookupVolumeServerUrl(vid string) (serverUrls []string, err error) {
+ return vc.getStableVidMap().LookupVolumeServerUrl(vid)
+}
+
+// GetDataCenter safely retrieves the data center
+func (vc *vidMapClient) GetDataCenter() string {
+ return vc.getStableVidMap().DataCenter
+}
+
+// Thread-safe helpers for vidMap operations
+
+// addLocation adds a volume location
+func (vc *vidMapClient) addLocation(vid uint32, location Location) {
+ vc.withCurrentVidMap(func(vm *vidMap) {
+ vm.addLocation(vid, location)
+ })
+}
+
+// deleteLocation removes a volume location
+func (vc *vidMapClient) deleteLocation(vid uint32, location Location) {
+ vc.withCurrentVidMap(func(vm *vidMap) {
+ vm.deleteLocation(vid, location)
+ })
+}
+
+// addEcLocation adds an EC volume location
+func (vc *vidMapClient) addEcLocation(vid uint32, location Location) {
+ vc.withCurrentVidMap(func(vm *vidMap) {
+ vm.addEcLocation(vid, location)
+ })
+}
+
+// deleteEcLocation removes an EC volume location
+func (vc *vidMapClient) deleteEcLocation(vid uint32, location Location) {
+ vc.withCurrentVidMap(func(vm *vidMap) {
+ vm.deleteEcLocation(vid, location)
+ })
+}
+
+// resetVidMap resets the volume ID map
+func (vc *vidMapClient) resetVidMap() {
+ vc.vidMapLock.Lock()
+ defer vc.vidMapLock.Unlock()
+
+ // Preserve the existing vidMap in the cache chain
+ tail := vc.vidMap
+
+ nvm := newVidMap(tail.DataCenter)
+ nvm.cache.Store(tail)
+ vc.vidMap = nvm
+
+ // Trim cache chain to vidMapCacheSize
+ node := tail
+ for i := 0; i < vc.vidMapCacheSize-1; i++ {
+ if node.cache.Load() == nil {
+ return
+ }
+ node = node.cache.Load()
+ }
+ // node is guaranteed to be non-nil after the loop
+ node.cache.Store(nil)
+}