High-Performance Cache Design: Client-Side Caching, Metadata Caching, and Data Caching (with Consistency Guarantees)
In a distributed file storage platform, caching is the key component for improving system performance. A well-designed multi-layer cache architecture significantly reduces network latency, lowers the load on the storage system, and improves overall response times. This chapter examines high-performance cache design in depth: how client-side caches, metadata caches, and data caches are implemented, and how their consistency is guaranteed.
7.3.1 Cache Architecture Overview
The cache architecture of a distributed file storage system is usually multi-layered, forming a complete caching hierarchy from the client down to the server.
7.3.1.1 Multi-Layer Cache Architecture
# Example: multi-layer cache architecture
import time
import threading
from typing import Dict, List, Optional, Any
from enum import Enum
from dataclasses import dataclass

class CacheLayer(Enum):
    """Cache layer enumeration"""
    CLIENT = "client"      # client-side cache
    METADATA = "metadata"  # metadata cache
    DATA = "data"          # data cache
    STORAGE = "storage"    # storage (persistence) layer

@dataclass
class CacheEntry:
    """A single cache entry"""
    key: str
    value: Any
    timestamp: float
    expiry: float      # absolute expiry time
    size: int          # entry size
    layer: CacheLayer
    version: int       # version number, used for consistency control

class MultiLayerCache:
    def __init__(self):
        self.layers: Dict[CacheLayer, Dict[str, CacheEntry]] = {
            layer: {} for layer in CacheLayer
        }
        self.layer_locks: Dict[CacheLayer, threading.Lock] = {
            layer: threading.Lock() for layer in CacheLayer
        }
        self.stats: Dict[CacheLayer, Dict[str, int]] = {
            layer: {"hits": 0, "misses": 0, "evictions": 0} for layer in CacheLayer
        }

    def get(self, key: str, preferred_layer: CacheLayer = CacheLayer.CLIENT) -> Optional[Any]:
        """
        Look up a value in the cache.
        :param key: cache key
        :param preferred_layer: layer to check first
        :return: cached value, or None on a miss
        """
        # Check the preferred layer first, then fall back to the remaining layers in order
        layers_to_check = [preferred_layer]
        for layer in CacheLayer:
            if layer not in layers_to_check:
                layers_to_check.append(layer)
        for layer in layers_to_check:
            with self.layer_locks[layer]:
                if key in self.layers[layer]:
                    entry = self.layers[layer][key]
                    # Expiry check
                    if time.time() < entry.expiry:
                        self.stats[layer]["hits"] += 1
                        return entry.value
                    else:
                        # Expired: drop the entry and keep searching lower layers
                        del self.layers[layer][key]
                        self.stats[layer]["evictions"] += 1
        # Missed in every layer; account the miss against the preferred layer
        self.stats[preferred_layer]["misses"] += 1
        return None

    def put(self, key: str, value: Any, layer: CacheLayer, ttl: float = 300.0, size: int = 1) -> bool:
        """
        Insert a value into the given cache layer.
        :param key: cache key
        :param value: cached value
        :param layer: target cache layer
        :param ttl: time to live in seconds
        :param size: entry size
        :return: True on success
        """
        try:
            with self.layer_locks[layer]:
                entry = CacheEntry(
                    key=key,
                    value=value,
                    timestamp=time.time(),
                    expiry=time.time() + ttl,
                    size=size,
                    layer=layer,
                    version=int(time.time() * 1_000_000)  # microsecond-resolution version number
                )
                self.layers[layer][key] = entry
                return True
        except Exception as e:
            print(f"Cache write failed: {e}")
            return False

    def invalidate(self, key: str, layer: Optional[CacheLayer] = None):
        """
        Invalidate a cache entry.
        :param key: cache key
        :param layer: cache layer; if None, invalidate in every layer
        """
        layers_to_invalidate = [layer] if layer else list(CacheLayer)
        for layer in layers_to_invalidate:
            with self.layer_locks[layer]:
                if key in self.layers[layer]:
                    del self.layers[layer][key]
                    self.stats[layer]["evictions"] += 1

    def get_stats(self) -> Dict[str, Any]:
        """Return per-layer cache statistics."""
        total_stats = {}
        for layer, stats in self.stats.items():
            requests = stats["hits"] + stats["misses"]
            total_stats[layer.value] = {
                "hits": stats["hits"],
                "misses": stats["misses"],
                "evictions": stats["evictions"],
                "hit_rate": stats["hits"] / requests if requests > 0 else 0
            }
        return total_stats

# Usage example
print("=== Multi-layer cache demo ===")

# Create a multi-layer cache instance
multi_cache = MultiLayerCache()

# Populate different layers
multi_cache.put("file1_metadata", {"name": "file1.txt", "size": 1024}, CacheLayer.METADATA, ttl=600)
multi_cache.put("file1_data", b"File content data...", CacheLayer.DATA, ttl=300)
multi_cache.put("file1_local", b"Local cached data...", CacheLayer.CLIENT, ttl=60)

# Read back from the corresponding layers
metadata = multi_cache.get("file1_metadata", CacheLayer.METADATA)
data = multi_cache.get("file1_data", CacheLayer.DATA)
local_data = multi_cache.get("file1_local", CacheLayer.CLIENT)
print(f"Metadata: {metadata}")
print(f"Data: {data}")
print(f"Locally cached data: {local_data}")

# Inspect cache statistics
stats = multi_cache.get_stats()
print(f"Cache stats: {stats}")
7.3.1.2 Cache Consistency Challenges
# Cache consistency challenges and mitigations
import threading
import time
from typing import Any, Dict, Optional
from enum import Enum

class ConsistencyModel(Enum):
    """Consistency models"""
    STRONG = "strong"                      # strong consistency
    EVENTUAL = "eventual"                  # eventual consistency
    READ_YOUR_WRITES = "read_your_writes"  # read-your-writes

class CacheConsistencyManager:
    def __init__(self):
        self.version_vector: Dict[str, int] = {}         # per-key version numbers
        self.cache_invalidations: Dict[str, float] = {}  # invalidation timestamps
        self.consistency_model = ConsistencyModel.EVENTUAL

    def generate_version(self, key: str) -> int:
        """Generate a new version number for a cache key."""
        current_time = int(time.time() * 1_000_000)  # microsecond timestamp
        self.version_vector[key] = current_time
        return current_time

    def validate_cache_entry(self, key: str, cached_version: int) -> bool:
        """
        Check whether a cached entry is still valid.
        :param key: cache key
        :param cached_version: version number stored with the cached entry
        :return: True if the entry may still be served
        """
        # Is there a newer version?
        if key in self.version_vector:
            latest_version = self.version_vector[key]
            if cached_version < latest_version:
                return False
        # Was the key invalidated after this entry was written?
        if key in self.cache_invalidations:
            invalidation_time = self.cache_invalidations[key]
            if cached_version < invalidation_time * 1_000_000:  # convert seconds to microseconds
                return False
        return True

    def invalidate_cache(self, key: str):
        """Invalidate the cache entry for the given key."""
        self.cache_invalidations[key] = time.time()
        # Notify the other nodes in the cluster (simplified)
        self._notify_peers(key)

    def _notify_peers(self, key: str):
        """Notify peer nodes of an invalidation (simplified implementation)."""
        print(f"Notifying peers to invalidate cache key: {key}")
        # A real implementation would send invalidation messages over the network

    def set_consistency_model(self, model: ConsistencyModel):
        """Select the consistency model."""
        self.consistency_model = model

class DistributedCacheWithConsistency:
    def __init__(self):
        self.cache_data: Dict[str, Dict] = {}
        self.consistency_manager = CacheConsistencyManager()
        self.cache_lock = threading.RLock()

    def read_with_consistency(self, key: str) -> Optional[Any]:
        """Read with a consistency check."""
        with self.cache_lock:
            if key in self.cache_data:
                cached_entry = self.cache_data[key]
                version = cached_entry.get("version", 0)
                # Validate the cached entry before serving it
                if self.consistency_manager.validate_cache_entry(key, version):
                    return cached_entry["value"]
                else:
                    # Stale entry: drop it
                    del self.cache_data[key]
            # Cache miss (or stale entry): fetch from storage and repopulate
            # the cache under a fresh version so the next read can hit
            value = self._read_from_storage(key)
            if value is not None:
                version = self.consistency_manager.generate_version(key)
                self.cache_data[key] = {
                    "value": value,
                    "version": version,
                    "timestamp": time.time()
                }
            return value

    def write_with_consistency(self, key: str, value: Any) -> bool:
        """Write with a consistency guarantee."""
        with self.cache_lock:
            # Generate a new version number
            version = self.consistency_manager.generate_version(key)
            # Update the local cache
            self.cache_data[key] = {
                "value": value,
                "version": version,
                "timestamp": time.time()
            }
            # Invalidate the copies held elsewhere
            self.consistency_manager.invalidate_cache(key)
            # Write through to the storage layer (simplified)
            return self._write_to_storage(key, value)

    def _read_from_storage(self, key: str) -> Optional[Any]:
        """Read from the storage layer (mock implementation)."""
        print(f"Reading from storage: {key}")
        time.sleep(0.01)  # simulate I/O latency
        return f"Data for {key}"

    def _write_to_storage(self, key: str, value: Any) -> bool:
        """Write to the storage layer (mock implementation)."""
        print(f"Writing to storage: {key} = {value}")
        time.sleep(0.02)  # simulate I/O latency
        return True

# Usage example
print("\n=== Cache consistency demo ===")

# Create a distributed cache with consistency management
dist_cache = DistributedCacheWithConsistency()

# Write
dist_cache.write_with_consistency("file1", "File content 1")
print("Wrote file1")

# First read (the write invalidated its own entry, so this falls through to storage)
data1 = dist_cache.read_with_consistency("file1")
print(f"First read of file1: {data1}")

# Second read (served from the repopulated cache)
data2 = dist_cache.read_with_consistency("file1")
print(f"Second read of file1: {data2}")

# Simulate an update
dist_cache.write_with_consistency("file1", "Updated file content 1")
print("Updated file1")

# Read again (goes to storage, since the update invalidated the cache)
data3 = dist_cache.read_with_consistency("file1")
print(f"Read of file1 after update: {data3}")
7.3.2 Client-Side Cache Design
The client-side cache is the layer closest to the application. Because it faces the application directly, it has an outsized effect on perceived performance.
7.3.2.1 Client-Side Caching Strategies
# Client-side caching strategies
import hashlib
import json
import time
import threading
from typing import Any, Dict, List, Optional
from enum import Enum

class CacheEvictionPolicy(Enum):
    """Cache eviction policies"""
    LRU = "lru"    # least recently used
    LFU = "lfu"    # least frequently used
    FIFO = "fifo"  # first in, first out
    TTL = "ttl"    # time-based

class ClientCacheEntry:
    """A client-side cache entry"""
    def __init__(self, key: str, value: bytes, ttl: float = 300.0):
        self.key = key
        self.value = value
        self.size = len(value)
        self.created_time = time.time()
        self.last_access_time = time.time()
        self.expiry_time = self.created_time + ttl
        self.access_count = 1
        self.hash = hashlib.md5(value).hexdigest()

class ClientCacheManager:
    def __init__(self, max_size_mb: float = 100.0, eviction_policy: CacheEvictionPolicy = CacheEvictionPolicy.LRU):
        self.max_size_bytes = max_size_mb * 1024 * 1024
        self.current_size_bytes = 0
        self.eviction_policy = eviction_policy
        self.cache: Dict[str, ClientCacheEntry] = {}
        self.cache_lock = threading.RLock()
        self.stats = {
            "hits": 0,
            "misses": 0,
            "evictions": 0,
            "writes": 0
        }

    def get(self, key: str) -> Optional[bytes]:
        """Fetch a value from the client-side cache."""
        with self.cache_lock:
            if key in self.cache:
                entry = self.cache[key]
                # Expiry check
                if time.time() > entry.expiry_time:
                    self._evict_entry(key)
                    self.stats["misses"] += 1
                    return None
                # Update access statistics
                entry.last_access_time = time.time()
                entry.access_count += 1
                self.stats["hits"] += 1
                return entry.value
            else:
                self.stats["misses"] += 1
                return None

    def put(self, key: str, value: bytes, ttl: float = 300.0) -> bool:
        """Insert a value into the client-side cache."""
        with self.cache_lock:
            # Replace an existing entry, if any
            if key in self.cache:
                old_entry = self.cache.pop(key)
                self.current_size_bytes -= old_entry.size
            # Build the new entry
            entry = ClientCacheEntry(key, value, ttl)
            # Make room if necessary
            if self.current_size_bytes + entry.size > self.max_size_bytes:
                if not self._evict_for_space(entry.size):
                    return False  # not enough space and nothing left to evict
            # Insert
            self.cache[key] = entry
            self.current_size_bytes += entry.size
            self.stats["writes"] += 1
            return True

    def _evict_for_space(self, required_size: int) -> bool:
        """Free up space for a new entry."""
        # Pick victims according to the configured eviction policy
        entries_to_evict = self._select_entries_for_eviction(required_size)
        if not entries_to_evict:
            return False
        for key in entries_to_evict:
            self._evict_entry(key)
        return True

    def _select_entries_for_eviction(self, required_size: int) -> List[str]:
        """Select victim entries according to the eviction policy."""
        if not self.cache:
            return []
        entries = list(self.cache.items())
        if self.eviction_policy == CacheEvictionPolicy.LRU:
            # Least recently used first
            entries.sort(key=lambda x: x[1].last_access_time)
        elif self.eviction_policy == CacheEvictionPolicy.LFU:
            # Least frequently used first
            entries.sort(key=lambda x: x[1].access_count)
        elif self.eviction_policy == CacheEvictionPolicy.FIFO:
            # Oldest entry first
            entries.sort(key=lambda x: x[1].created_time)
        elif self.eviction_policy == CacheEvictionPolicy.TTL:
            # Earliest expiry first
            entries.sort(key=lambda x: x[1].expiry_time)
        # Take entries until enough space is freed; the eviction counter is
        # updated in _evict_entry, not here, to avoid double counting
        evicted_size = 0
        evicted_keys = []
        for key, entry in entries:
            evicted_size += entry.size
            evicted_keys.append(key)
            if evicted_size >= required_size:
                break
        return evicted_keys

    def _evict_entry(self, key: str):
        """Evict a single entry."""
        if key in self.cache:
            entry = self.cache.pop(key)
            self.current_size_bytes -= entry.size
            self.stats["evictions"] += 1

    def invalidate(self, key: str):
        """Invalidate a cache entry."""
        with self.cache_lock:
            if key in self.cache:
                self._evict_entry(key)

    def get_stats(self) -> Dict[str, Any]:
        """Return cache statistics."""
        with self.cache_lock:
            total_requests = self.stats["hits"] + self.stats["misses"]
            hit_rate = self.stats["hits"] / total_requests if total_requests > 0 else 0
            return {
                "max_size_mb": self.max_size_bytes / (1024 * 1024),
                "current_size_mb": self.current_size_bytes / (1024 * 1024),
                "entry_count": len(self.cache),
                "hits": self.stats["hits"],
                "misses": self.stats["misses"],
                "evictions": self.stats["evictions"],
                "writes": self.stats["writes"],
                "hit_rate": hit_rate,
                "utilization": self.current_size_bytes / self.max_size_bytes if self.max_size_bytes > 0 else 0
            }

    def clear(self):
        """Empty the cache and reset statistics."""
        with self.cache_lock:
            self.cache.clear()
            self.current_size_bytes = 0
            for key in self.stats:
                self.stats[key] = 0

class SmartClientCache:
    """Smart client-side cache with separate caches per data type."""
    def __init__(self):
        # Dedicated caches with sizes and policies suited to each data type
        self.metadata_cache = ClientCacheManager(max_size_mb=10.0, eviction_policy=CacheEvictionPolicy.LRU)
        self.data_cache = ClientCacheManager(max_size_mb=50.0, eviction_policy=CacheEvictionPolicy.LRU)
        self.attribute_cache = ClientCacheManager(max_size_mb=5.0, eviction_policy=CacheEvictionPolicy.LFU)

    def get_file_metadata(self, filepath: str) -> Optional[Dict]:
        """Fetch file metadata."""
        key = f"metadata:{filepath}"
        cached_data = self.metadata_cache.get(key)
        if cached_data:
            return json.loads(cached_data.decode('utf-8'))
        return None

    def put_file_metadata(self, filepath: str, metadata: Dict, ttl: float = 600.0):
        """Cache file metadata."""
        key = f"metadata:{filepath}"
        data = json.dumps(metadata).encode('utf-8')
        return self.metadata_cache.put(key, data, ttl)

    def get_file_data(self, filepath: str, offset: int = 0, length: int = -1) -> Optional[bytes]:
        """Fetch file data. length == -1 means "to end of file"."""
        # Data cache keys are fine-grained: they include offset and length
        if length == -1:
            key = f"data:{filepath}:{offset}:end"
        else:
            key = f"data:{filepath}:{offset}:{length}"
        return self.data_cache.get(key)

    def put_file_data(self, filepath: str, data: bytes, offset: int = 0, ttl: float = 300.0):
        """Cache file data under its explicit offset/length key."""
        # Note: entries are keyed by the actual data length, so a length == -1
        # ("to end") lookup only hits if the caller cached it under that key
        key = f"data:{filepath}:{offset}:{len(data)}"
        return self.data_cache.put(key, data, ttl)

    def get_file_attributes(self, filepath: str) -> Optional[Dict]:
        """Fetch file attributes."""
        key = f"attr:{filepath}"
        cached_data = self.attribute_cache.get(key)
        if cached_data:
            return json.loads(cached_data.decode('utf-8'))
        return None

    def put_file_attributes(self, filepath: str, attributes: Dict, ttl: float = 1200.0):
        """Cache file attributes."""
        key = f"attr:{filepath}"
        data = json.dumps(attributes).encode('utf-8')
        return self.attribute_cache.put(key, data, ttl)

    def invalidate_file_cache(self, filepath: str):
        """Invalidate every cache entry related to a file."""
        self.metadata_cache.invalidate(f"metadata:{filepath}")
        self.attribute_cache.invalidate(f"attr:{filepath}")
        # Data cache entries are keyed by offset/length; a full implementation
        # would enumerate and invalidate all keys prefixed with f"data:{filepath}:"

# Usage example
print("\n=== Client-side caching strategies demo ===")

# Create a smart client-side cache
client_cache = SmartClientCache()

# Cache file metadata
file_metadata = {
    "name": "example.txt",
    "size": 1024,
    "mtime": time.time(),
    "permissions": "rw-r--r--"
}
client_cache.put_file_metadata("example.txt", file_metadata, ttl=600)
print("Cached file metadata: example.txt")

# Cache file attributes
file_attributes = {
    "owner": "user1",
    "group": "group1",
    "created_time": time.time() - 3600,
    "accessed_time": time.time()
}
client_cache.put_file_attributes("example.txt", file_attributes, ttl=1200)
print("Cached file attributes: example.txt")

# Cache file data
file_data = b"This is example file content for caching demonstration."
client_cache.put_file_data("example.txt", file_data, offset=0, ttl=300)
print("Cached file data: example.txt")

# Read everything back
cached_metadata = client_cache.get_file_metadata("example.txt")
print(f"Cached metadata: {cached_metadata}")
cached_attributes = client_cache.get_file_attributes("example.txt")
print(f"Cached attributes: {cached_attributes}")
cached_data = client_cache.get_file_data("example.txt", 0, len(file_data))
print(f"Cached data: {cached_data[:30]}..." if cached_data else "No cached data found")

# Inspect statistics
print(f"Metadata cache stats: {client_cache.metadata_cache.get_stats()}")
print(f"Data cache stats: {client_cache.data_cache.get_stats()}")
print(f"Attribute cache stats: {client_cache.attribute_cache.get_stats()}")
7.3.2.2 Client-Side Cache Optimization
# Client-side cache optimization techniques
import asyncio
import time
import threading
from typing import Any, Callable, Dict, List, Optional
from concurrent.futures import ThreadPoolExecutor

class AsyncClientCache:
    """Asynchronous client-side cache with prefetching and batch operations."""
    def __init__(self, max_size_mb: float = 100.0):
        # Note: the size limit is tracked but not enforced in this simplified example
        self.max_size_bytes = max_size_mb * 1024 * 1024
        self.cache: Dict[str, Any] = {}
        self.cache_lock = threading.RLock()
        self.prefetch_queue: List[str] = []
        self.prefetch_lock = threading.Lock()
        self.prefetch_executor = ThreadPoolExecutor(max_workers=4)

    async def get_async(self, key: str, fetch_func: Optional[Callable] = None) -> Optional[Any]:
        """Fetch from the cache asynchronously, falling back to fetch_func."""
        with self.cache_lock:
            if key in self.cache:
                return self.cache[key]
        # Cache miss: fetch from the source
        if fetch_func:
            try:
                data = await fetch_func(key)
                with self.cache_lock:
                    self.cache[key] = data
                return data
            except Exception as e:
                print(f"Fetch failed: {e}")
                return None
        return None

    def prefetch(self, keys: List[str], fetch_func: Callable):
        """Queue keys for background prefetching. fetch_func must be synchronous here."""
        with self.prefetch_lock:
            self.prefetch_queue.extend(keys)
        # Run the prefetch on a background thread
        self.prefetch_executor.submit(self._execute_prefetch, fetch_func)

    def _execute_prefetch(self, fetch_func: Callable):
        """Drain the prefetch queue."""
        with self.prefetch_lock:
            keys_to_fetch = self.prefetch_queue.copy()
            self.prefetch_queue.clear()
        # Fetch one key at a time (a real implementation would batch these)
        for key in keys_to_fetch:
            try:
                data = fetch_func(key)
                with self.cache_lock:
                    self.cache[key] = data
                print(f"Prefetched: {key}")
            except Exception as e:
                print(f"Prefetch failed for {key}: {e}")

    async def batch_get(self, keys: List[str], fetch_func: Callable) -> Dict[str, Any]:
        """Fetch many keys at once, batching the misses into one fetch."""
        results = {}
        missing_keys = []
        # Serve what we can from the cache
        with self.cache_lock:
            for key in keys:
                if key in self.cache:
                    results[key] = self.cache[key]
                else:
                    missing_keys.append(key)
        # Fetch the misses in one batched call
        if missing_keys:
            try:
                fetched_data = await fetch_func(missing_keys)
                results.update(fetched_data)
                with self.cache_lock:
                    for key, value in fetched_data.items():
                        self.cache[key] = value
            except Exception as e:
                print(f"Batch fetch failed: {e}")
        return results

class AdaptiveCacheManager:
    """Adaptive cache manager that tunes caching policy from observed access patterns."""
    def __init__(self):
        self.access_patterns: Dict[str, List[float]] = {}
        self.cache_performance: Dict[str, Dict[str, float]] = {}
        self.pattern_lock = threading.Lock()

    def record_access(self, key: str, access_time: float = None):
        """Record one cache access."""
        if access_time is None:
            access_time = time.time()
        with self.pattern_lock:
            if key not in self.access_patterns:
                self.access_patterns[key] = []
            self.access_patterns[key].append(access_time)
            # Keep only the 100 most recent accesses
            if len(self.access_patterns[key]) > 100:
                self.access_patterns[key] = self.access_patterns[key][-100:]

    def analyze_access_pattern(self, key: str) -> Dict[str, Any]:
        """Classify the access pattern for a key."""
        with self.pattern_lock:
            if key not in self.access_patterns or not self.access_patterns[key]:
                return {"pattern": "unknown"}
            access_times = self.access_patterns[key]
            if len(access_times) < 2:
                return {"pattern": "sparse", "frequency": 0}
            # Mean interval between accesses
            intervals = [access_times[i] - access_times[i - 1] for i in range(1, len(access_times))]
            avg_interval = sum(intervals) / len(intervals)
            # Access frequency in accesses per second
            frequency = 1.0 / avg_interval if avg_interval > 0 else 0
            # Classify
            if frequency > 1.0:    # more than once per second
                pattern = "hot"
            elif frequency > 0.1:  # more than once per 10 seconds
                pattern = "warm"
            else:
                pattern = "cold"
            return {
                "pattern": pattern,
                "frequency": frequency,
                "avg_interval": avg_interval,
                "access_count": len(access_times)
            }

    def recommend_cache_strategy(self, key: str) -> Dict[str, Any]:
        """Recommend caching parameters for a key."""
        pattern = self.analyze_access_pattern(key)
        if pattern["pattern"] == "hot":
            return {
                "ttl": 600.0,  # 10 minutes
                "priority": "high",
                "eviction_policy": "lru"
            }
        elif pattern["pattern"] == "warm":
            return {
                "ttl": 1800.0,  # 30 minutes
                "priority": "medium",
                "eviction_policy": "lru"
            }
        else:  # cold
            return {
                "ttl": 60.0,  # 1 minute
                "priority": "low",
                "eviction_policy": "fifo"
            }

    def record_performance(self, key: str, hit: bool, response_time: float):
        """Record cache performance data."""
        with self.pattern_lock:
            if key not in self.cache_performance:
                self.cache_performance[key] = {
                    "hits": 0,
                    "misses": 0,
                    "total_response_time": 0.0,
                    "access_count": 0
                }
            perf = self.cache_performance[key]
            perf["access_count"] += 1
            if hit:
                perf["hits"] += 1
            else:
                perf["misses"] += 1
            perf["total_response_time"] += response_time

# Mock asynchronous fetch functions
async def mock_fetch_data(key: str) -> Any:
    """Simulate fetching one item over the network."""
    await asyncio.sleep(0.01)  # simulate network latency
    return f"Data for {key}"

async def mock_batch_fetch_data(keys: List[str]) -> Dict[str, Any]:
    """Simulate fetching a batch of items over the network."""
    await asyncio.sleep(0.05)  # simulate network latency
    return {key: f"Batch data for {key}" for key in keys}

# Usage example
print("\n=== Client-side cache optimization demo ===")

async def demonstrate_async_cache():
    # Create the async cache and the adaptive manager
    async_cache = AsyncClientCache()
    adaptive_manager = AdaptiveCacheManager()

    # Asynchronous single fetch
    print("Fetching asynchronously...")
    data1 = await async_cache.get_async("key1", mock_fetch_data)
    print(f"Fetched: {data1}")

    # Fetch again (served from cache this time)
    data2 = await async_cache.get_async("key1", mock_fetch_data)
    print(f"Fetched again: {data2}")

    # Batch fetch
    print("\nBatch fetching...")
    keys = ["key2", "key3", "key4"]
    batch_results = await async_cache.batch_get(keys, mock_batch_fetch_data)
    print(f"Batch results: {batch_results}")

    # Adaptive cache management
    print("\nAdaptive cache management demo...")
    # Record accesses to build up distinguishable access patterns
    for i in range(10):
        adaptive_manager.record_access("hot_file")
        time.sleep(0.1)  # frequent accesses
    for i in range(5):
        adaptive_manager.record_access("warm_file")
        time.sleep(1)  # moderate-frequency accesses
    adaptive_manager.record_access("cold_file")

    # Analyze the patterns
    hot_pattern = adaptive_manager.analyze_access_pattern("hot_file")
    warm_pattern = adaptive_manager.analyze_access_pattern("warm_file")
    cold_pattern = adaptive_manager.analyze_access_pattern("cold_file")
    print(f"Hot file pattern: {hot_pattern}")
    print(f"Warm file pattern: {warm_pattern}")
    print(f"Cold file pattern: {cold_pattern}")

    # Get strategy recommendations
    hot_strategy = adaptive_manager.recommend_cache_strategy("hot_file")
    warm_strategy = adaptive_manager.recommend_cache_strategy("warm_file")
    cold_strategy = adaptive_manager.recommend_cache_strategy("cold_file")
    print(f"Recommended strategy for hot file: {hot_strategy}")
    print(f"Recommended strategy for warm file: {warm_strategy}")
    print(f"Recommended strategy for cold file: {cold_strategy}")

# Run the async demo
asyncio.run(demonstrate_async_cache())
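The demo above never exercises the prefetch path. A minimal usage sketch follows; note that prefetch runs its fetch function on a worker thread, so it must be a synchronous callable (mock_fetch_sync here is invented for the illustration).

# Sketch: exercising AsyncClientCache.prefetch (mock_fetch_sync is illustrative)
def mock_fetch_sync(key: str) -> str:
    time.sleep(0.01)  # simulate network latency
    return f"Prefetched data for {key}"

async def demonstrate_prefetch():
    cache = AsyncClientCache()
    cache.prefetch(["p1", "p2", "p3"], mock_fetch_sync)  # warm the cache in the background
    await asyncio.sleep(0.2)  # give the worker thread time to finish
    # No fetch function passed: a value can only come from the prefetched cache
    print(f"After prefetch, p2 = {await cache.get_async('p2')}")

asyncio.run(demonstrate_prefetch())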
7.3.3 Metadata Cache Design
The metadata cache is a key component of a distributed file storage system: it directly determines the performance of directory traversal, file-attribute queries, and similar operations.
7.3.3.1 Metadata Cache Architecture
# Metadata cache architecture
import time
import threading
from typing import Any, Dict, List, Optional, Set
from dataclasses import dataclass
from enum import Enum

class MetadataType(Enum):
    """Metadata types"""
    FILE = "file"
    DIRECTORY = "directory"
    SYMLINK = "symlink"
    ATTRIBUTE = "attribute"

@dataclass
class FileMetadata:
    """File metadata"""
    name: str
    size: int
    mtime: float
    ctime: float
    atime: float
    mode: int
    uid: int
    gid: int
    nlink: int
    checksum: Optional[str] = None

@dataclass
class DirectoryMetadata:
    """Directory metadata"""
    name: str
    mtime: float
    ctime: float
    atime: float
    mode: int
    uid: int
    gid: int
    file_count: int
    subdirs: List[str]

class MetadataCacheEntry:
    """A metadata cache entry"""
    def __init__(self, path: str, metadata: Any, metadata_type: MetadataType, ttl: float = 300.0):
        self.path = path
        self.metadata = metadata
        self.type = metadata_type
        self.created_time = time.time()
        self.expiry_time = self.created_time + ttl
        self.last_access_time = self.created_time
        self.access_count = 1
        self.version = int(time.time() * 1_000_000)

class HierarchicalMetadataCache:
    """Hierarchical metadata cache that mirrors the directory tree."""
    def __init__(self, max_entries: int = 10000):
        self.max_entries = max_entries
        self.cache: Dict[str, MetadataCacheEntry] = {}
        self.cache_lock = threading.RLock()
        self.directory_contents: Dict[str, Set[str]] = {}  # directory content index
        self.stats = {
            "hits": 0,
            "misses": 0,
            "evictions": 0,
            "inserts": 0
        }

    def get_metadata(self, path: str) -> Optional[Any]:
        """Fetch metadata for a path."""
        with self.cache_lock:
            if path in self.cache:
                entry = self.cache[path]
                # Expiry check
                if time.time() > entry.expiry_time:
                    self._evict_entry(path)
                    self.stats["misses"] += 1
                    return None
                # Update access statistics
                entry.last_access_time = time.time()
                entry.access_count += 1
                self.stats["hits"] += 1
                return entry.metadata
            else:
                self.stats["misses"] += 1
                return None

    def put_metadata(self, path: str, metadata: Any, metadata_type: MetadataType, ttl: float = 300.0) -> bool:
        """Store metadata for a path."""
        with self.cache_lock:
            # Evict if the cache is full
            if len(self.cache) >= self.max_entries:
                self._evict_lru_entry()
            # Insert the entry
            entry = MetadataCacheEntry(path, metadata, metadata_type, ttl)
            self.cache[path] = entry
            self.stats["inserts"] += 1
            # Maintain the directory content index
            if metadata_type == MetadataType.DIRECTORY:
                # Directories get their own (initially empty) content index
                if path not in self.directory_contents:
                    self.directory_contents[path] = set()
            else:
                # Files are registered in their parent directory's index
                parent_dir = self._get_parent_directory(path)
                if parent_dir:
                    if parent_dir not in self.directory_contents:
                        self.directory_contents[parent_dir] = set()
                    self.directory_contents[parent_dir].add(path)
            return True

    def invalidate_path(self, path: str, recursive: bool = False):
        """
        Invalidate the metadata for a path.
        :param path: the path to invalidate
        :param recursive: also invalidate everything underneath it
        """
        with self.cache_lock:
            if path in self.cache:
                self._evict_entry(path)
            if recursive:
                # Invalidate all descendants
                paths_to_invalidate = [
                    p for p in self.cache.keys()
                    if p.startswith(path + "/")
                ]
                for p in paths_to_invalidate:
                    self._evict_entry(p)
            # Remove the path from its parent's content index
            parent_dir = self._get_parent_directory(path)
            if parent_dir and parent_dir in self.directory_contents:
                self.directory_contents[parent_dir].discard(path)

    def get_directory_contents(self, dir_path: str) -> Optional[List[str]]:
        """List the cached contents of a directory."""
        with self.cache_lock:
            if dir_path in self.directory_contents:
                return list(self.directory_contents[dir_path])
            return None

    def _get_parent_directory(self, path: str) -> Optional[str]:
        """Return the parent directory of a path."""
        if path == "/":
            return None
        # Strip a trailing slash
        if path.endswith("/"):
            path = path[:-1]
        # Find the last slash
        last_slash = path.rfind("/")
        if last_slash <= 0:
            return "/"
        return path[:last_slash]

    def _evict_entry(self, path: str):
        """Evict a single entry."""
        if path in self.cache:
            # Keep the directory content index consistent
            entry = self.cache[path]
            if entry.type != MetadataType.DIRECTORY:
                parent_dir = self._get_parent_directory(path)
                if parent_dir and parent_dir in self.directory_contents:
                    self.directory_contents[parent_dir].discard(path)
            # Remove the cache entry
            del self.cache[path]
            self.stats["evictions"] += 1

    def _evict_lru_entry(self):
        """Evict the least recently used entry."""
        if not self.cache:
            return
        lru_path = min(self.cache.keys(), key=lambda k: self.cache[k].last_access_time)
        self._evict_entry(lru_path)

    def get_stats(self) -> Dict[str, Any]:
        """Return cache statistics."""
        with self.cache_lock:
            total_requests = self.stats["hits"] + self.stats["misses"]
            hit_rate = self.stats["hits"] / total_requests if total_requests > 0 else 0
            return {
                "entries": len(self.cache),
                "max_entries": self.max_entries,
                "directory_indexes": len(self.directory_contents),
                "hits": self.stats["hits"],
                "misses": self.stats["misses"],
                "evictions": self.stats["evictions"],
                "inserts": self.stats["inserts"],
                "hit_rate": hit_rate
            }

class DistributedMetadataCache:
    """Distributed metadata cache with multi-node coordination."""
    def __init__(self, node_id: str, peer_nodes: List[str]):
        self.node_id = node_id
        self.peer_nodes = peer_nodes
        self.local_cache = HierarchicalMetadataCache()
        self.cache_versions: Dict[str, int] = {}   # metadata versions
        self.invalidations: Dict[str, float] = {}  # invalidation timestamps

    def get_metadata(self, path: str) -> Optional[Any]:
        """Fetch metadata with a distributed-consistency check."""
        # Check the local cache first
        metadata = self.local_cache.get_metadata(path)
        if metadata:
            # Verify consistency if the path was invalidated recently
            if self._needs_consistency_check(path):
                # A real implementation would re-validate against the metadata service
                pass
            return metadata
        return None

    def put_metadata(self, path: str, metadata: Any, metadata_type: MetadataType, ttl: float = 300.0) -> bool:
        """Store metadata and notify the peer nodes."""
        success = self.local_cache.put_metadata(path, metadata, metadata_type, ttl)
        if success:
            # Generate a new version number
            version = int(time.time() * 1_000_000)
            self.cache_versions[path] = version
            # Notify the peers (simplified)
            self._notify_peers_of_update(path, version)
        return success

    def invalidate_metadata(self, path: str, recursive: bool = False):
        """Invalidate metadata and notify the peer nodes."""
        self.local_cache.invalidate_path(path, recursive)
        # Record the invalidation time
        self.invalidations[path] = time.time()
        # Notify the peers (simplified)
        self._notify_peers_of_invalidation(path, recursive)

    def _needs_consistency_check(self, path: str) -> bool:
        """Decide whether the path needs a consistency check."""
        # Simplified: require a check within 60 s of an invalidation
        return path in self.invalidations and time.time() - self.invalidations[path] < 60

    def _notify_peers_of_update(self, path: str, version: int):
        """Notify peers of a metadata update."""
        print(f"Node {self.node_id} notifying peers of metadata update: {path} (version {version})")
        # A real implementation would send update messages over the network

    def _notify_peers_of_invalidation(self, path: str, recursive: bool):
        """Notify peers of a metadata invalidation."""
        print(f"Node {self.node_id} notifying peers of metadata invalidation: {path} (recursive: {recursive})")
        # A real implementation would send invalidation messages over the network

# Usage example
print("\n=== Metadata cache architecture demo ===")

# Create a hierarchical metadata cache
metadata_cache = HierarchicalMetadataCache(max_entries=1000)

# Build file metadata
file_metadata = FileMetadata(
    name="example.txt",
    size=1024,
    mtime=time.time(),
    ctime=time.time(),
    atime=time.time(),
    mode=0o644,
    uid=1000,
    gid=1000,
    nlink=1
)

# Build directory metadata
dir_metadata = DirectoryMetadata(
    name="documents",
    mtime=time.time(),
    ctime=time.time(),
    atime=time.time(),
    mode=0o755,
    uid=1000,
    gid=1000,
    file_count=5,
    subdirs=["images", "videos"]
)

# Store the metadata
metadata_cache.put_metadata("/home/user/example.txt", file_metadata, MetadataType.FILE, ttl=600)
metadata_cache.put_metadata("/home/user/documents", dir_metadata, MetadataType.DIRECTORY, ttl=600)
metadata_cache.put_metadata("/home/user/documents/readme.md",
                            FileMetadata("readme.md", 2048, time.time(), time.time(), time.time(), 0o644, 1000, 1000, 1),
                            MetadataType.FILE, ttl=300)
print("Metadata stored")

# Fetch the metadata back
retrieved_file = metadata_cache.get_metadata("/home/user/example.txt")
print(f"File metadata: {retrieved_file.name if retrieved_file else 'not found'}")
retrieved_dir = metadata_cache.get_metadata("/home/user/documents")
print(f"Directory metadata: {retrieved_dir.name if retrieved_dir else 'not found'}")

# List directory contents
dir_contents = metadata_cache.get_directory_contents("/home/user/documents")
print(f"Directory contents: {dir_contents}")

# Inspect statistics
stats = metadata_cache.get_stats()
print(f"Cache stats: {stats}")

# Distributed metadata cache demo
print("\nDistributed metadata cache demo:")
peer_nodes = ["node2", "node3", "node4"]
dist_cache = DistributedMetadataCache("node1", peer_nodes)

# Store metadata
dist_cache.put_metadata("/shared/project/file1.txt", file_metadata, MetadataType.FILE)
print("Stored distributed metadata")

# Fetch metadata
retrieved_dist = dist_cache.get_metadata("/shared/project/file1.txt")
print(f"Distributed metadata: {retrieved_dist.name if retrieved_dist else 'not found'}")

# Invalidate metadata
dist_cache.invalidate_metadata("/shared/project/file1.txt")
print("Invalidated distributed metadata")
7.3.3.2 Metadata Cache Optimization Strategies
# Metadata cache optimization strategies
import time
import threading
from typing import Any, Dict, List, Optional

class MetadataCacheOptimizer:
    """Metadata cache optimizer implementing adaptive policies."""
    def __init__(self, cache_manager):
        self.cache_manager = cache_manager
        self.access_frequency: Dict[str, int] = {}
        self.access_patterns: Dict[str, List[float]] = {}
        self.performance_metrics: Dict[str, Dict[str, float]] = {}
        self.optimizer_lock = threading.Lock()

    def record_access(self, path: str, access_time: float = None):
        """Record one metadata access."""
        if access_time is None:
            access_time = time.time()
        with self.optimizer_lock:
            # Access counter
            self.access_frequency[path] = self.access_frequency.get(path, 0) + 1
            # Access timing history
            if path not in self.access_patterns:
                self.access_patterns[path] = []
            self.access_patterns[path].append(access_time)
            # Keep only the 100 most recent accesses
            if len(self.access_patterns[path]) > 100:
                self.access_patterns[path] = self.access_patterns[path][-100:]

    def analyze_access_patterns(self) -> Dict[str, List[str]]:
        """Analyze access patterns and classify paths by temperature."""
        with self.optimizer_lock:
            hot_paths = []
            warm_paths = []
            cold_paths = []
            current_time = time.time()
            for path, access_times in self.access_patterns.items():
                if len(access_times) < 2:
                    cold_paths.append(path)
                    continue
                # Recent access frequency (last 5 minutes)
                recent_accesses = [t for t in access_times if current_time - t < 300]
                recent_frequency = len(recent_accesses) / 300.0  # accesses per second
                # Overall access frequency
                total_time_span = max(access_times) - min(access_times)
                overall_frequency = len(access_times) / (total_time_span if total_time_span > 0 else 1)
                # Classify
                if recent_frequency > 0.1 or overall_frequency > 0.01:      # high frequency
                    hot_paths.append(path)
                elif recent_frequency > 0.01 or overall_frequency > 0.001:  # medium frequency
                    warm_paths.append(path)
                else:                                                       # low frequency
                    cold_paths.append(path)
            return {
                "hot": hot_paths,
                "warm": warm_paths,
                "cold": cold_paths
            }

    def recommend_ttl(self, path: str) -> float:
        """Recommend a TTL for a path based on its access count."""
        with self.optimizer_lock:
            frequency = self.access_frequency.get(path, 0)
            if frequency > 100:   # very frequently accessed
                return 1800.0     # 30 minutes
            elif frequency > 50:  # frequently accessed
                return 900.0      # 15 minutes
            elif frequency > 10:  # moderately accessed
                return 300.0      # 5 minutes
            else:                 # rarely accessed
                return 60.0       # 1 minute

    def optimize_cache(self):
        """Run one optimization pass."""
        patterns = self.analyze_access_patterns()
        # Lengthen the TTL of hot paths
        for path in patterns["hot"]:
            recommended_ttl = self.recommend_ttl(path)
            # A real implementation would adjust the TTL of the live cache entry
            print(f"Optimizing hot path {path}: recommended TTL = {recommended_ttl}s")
        # Consider early eviction for cold paths
        for path in patterns["cold"]:
            # A real implementation might evict early or lower the priority
            print(f"Identified cold path {path}: consider lowering its cache priority")

class MetadataPrefetcher:
    """Metadata prefetcher that predicts and prefetches likely-needed metadata."""
    def __init__(self, cache_manager):
        self.cache_manager = cache_manager
        self.access_sequences: Dict[str, List[str]] = {}  # observed access sequences
        self.sequence_lock = threading.Lock()

    def record_access_sequence(self, previous_path: str, current_path: str):
        """Record that current_path was accessed right after previous_path."""
        with self.sequence_lock:
            if previous_path not in self.access_sequences:
                self.access_sequences[previous_path] = []
            self.access_sequences[previous_path].append(current_path)
            # Keep only the 10 most recent successors
            if len(self.access_sequences[previous_path]) > 10:
                self.access_sequences[previous_path] = self.access_sequences[previous_path][-10:]

    def predict_next_access(self, current_path: str) -> Optional[List[str]]:
        """Predict which paths are likely to be accessed next."""
        with self.sequence_lock:
            if current_path not in self.access_sequences:
                return None
            # Count the observed successors
            next_paths = self.access_sequences[current_path]
            path_counts = {}
            for path in next_paths:
                path_counts[path] = path_counts.get(path, 0) + 1
            # Return the successors sorted by frequency
            sorted_paths = sorted(path_counts.items(), key=lambda x: x[1], reverse=True)
            return [path for path, count in sorted_paths[:3]]  # top 3

    def prefetch_metadata(self, paths: List[str], metadata_provider):
        """Prefetch metadata for the given paths."""
        # A real implementation would run this on a background thread
        for path in paths:
            try:
                metadata = metadata_provider.get_metadata_from_storage(path)
                if metadata:
                    # Store it in the cache
                    self.cache_manager.put_metadata(path, metadata, metadata_provider.get_metadata_type(path))
                    print(f"Prefetched metadata: {path}")
            except Exception as e:
                print(f"Metadata prefetch failed for {path}: {e}")

class AdaptiveMetadataCache:
    """Adaptive metadata cache combining the optimizer and the prefetcher."""
    def __init__(self, max_entries: int = 10000):
        self.hierarchical_cache = HierarchicalMetadataCache(max_entries)
        self.optimizer = MetadataCacheOptimizer(self.hierarchical_cache)
        self.prefetcher = MetadataPrefetcher(self.hierarchical_cache)
        self.last_access_path = None

    def get_metadata(self, path: str) -> Optional[Any]:
        """Fetch metadata with adaptive optimization."""
        # Record the access
        self.optimizer.record_access(path)
        # Record the access sequence (used for prefetching)
        if self.last_access_path:
            self.prefetcher.record_access_sequence(self.last_access_path, path)
        self.last_access_path = path
        # Predict (and, in a full implementation, prefetch) the next accesses
        predicted_paths = self.prefetcher.predict_next_access(path)
        if predicted_paths:
            # A real implementation would kick off a background prefetch here
            print(f"Predicted next accesses: {predicted_paths}")
        # Fetch the metadata
        return self.hierarchical_cache.get_metadata(path)

    def put_metadata(self, path: str, metadata: Any, metadata_type: MetadataType, ttl: float = 300.0) -> bool:
        """Store metadata with an access-pattern-aware TTL."""
        optimized_ttl = self.optimizer.recommend_ttl(path)
        if optimized_ttl != ttl:
            ttl = optimized_ttl
            print(f"Optimized TTL for {path}: {ttl}s")
        return self.hierarchical_cache.put_metadata(path, metadata, metadata_type, ttl)

    def run_optimization_cycle(self):
        """Run one optimization cycle."""
        print("Running cache optimization cycle...")
        self.optimizer.optimize_cache()

# Mock metadata provider
class MockMetadataProvider:
    def __init__(self):
        self.mock_metadata = {
            "/home/user/documents": DirectoryMetadata("documents", time.time(), time.time(), time.time(), 0o755, 1000, 1000, 3, ["images", "videos"]),
            "/home/user/documents/file1.txt": FileMetadata("file1.txt", 1024, time.time(), time.time(), time.time(), 0o644, 1000, 1000, 1),
            "/home/user/documents/file2.txt": FileMetadata("file2.txt", 2048, time.time(), time.time(), time.time(), 0o644, 1000, 1000, 1),
            "/home/user/documents/images": DirectoryMetadata("images", time.time(), time.time(), time.time(), 0o755, 1000, 1000, 2, []),
        }

    def get_metadata_from_storage(self, path: str) -> Optional[Any]:
        """Simulate fetching metadata from storage."""
        time.sleep(0.01)  # simulate I/O latency
        return self.mock_metadata.get(path)

    def get_metadata_type(self, path: str) -> MetadataType:
        """Return the metadata type for a path."""
        if path in self.mock_metadata:
            if isinstance(self.mock_metadata[path], DirectoryMetadata):
                return MetadataType.DIRECTORY
            else:
                return MetadataType.FILE
        return MetadataType.FILE

# Usage example
print("\n=== Metadata cache optimization demo ===")

# Create the adaptive metadata cache
adaptive_cache = AdaptiveMetadataCache(max_entries=1000)
metadata_provider = MockMetadataProvider()

# Replay a sequence of accesses
print("Simulating an access pattern...")
access_patterns = [
    "/home/user/documents",
    "/home/user/documents/file1.txt",
    "/home/user/documents/file2.txt",
    "/home/user/documents/images",
    "/home/user/documents/file1.txt",  # repeated access
    "/home/user/documents/file1.txt",  # frequent access
]
for path in access_patterns:
    # Store the metadata
    metadata = metadata_provider.get_metadata_from_storage(path)
    if metadata:
        metadata_type = metadata_provider.get_metadata_type(path)
        adaptive_cache.put_metadata(path, metadata, metadata_type)
        print(f"Stored metadata: {path}")
    # Fetch it back
    retrieved = adaptive_cache.get_metadata(path)
    print(f"Access {path}: {'hit' if retrieved else 'miss'}")
    # Simulate a gap between accesses
    time.sleep(0.1)

# Run an optimization cycle
adaptive_cache.run_optimization_cycle()

# Inspect statistics
stats = adaptive_cache.hierarchical_cache.get_stats()
print(f"Cache stats: {stats}")
7.3.4 Data Cache Design
The data cache is one of the most important cache layers in a distributed file storage system, since it directly determines read performance.
7.3.4.1 Data Cache Architecture
# Data cache architecture
import hashlib
import os
import time
import threading
from typing import Any, Dict, List, Optional
from dataclasses import dataclass

@dataclass
class DataBlock:
    """A data block"""
    block_id: str
    data: bytes
    size: int
    checksum: str
    created_time: float
    last_access_time: float
    access_count: int

class DataCacheEntry:
    """A data cache entry"""
    def __init__(self, file_path: str, offset: int, data: bytes, block_size: int, ttl: float = 300.0):
        self.file_path = file_path
        self.offset = offset
        self.data = data
        self.size = len(data)
        self.block_size = block_size
        self.block_id = f"{file_path}:{offset}:{block_size}"
        self.checksum = hashlib.md5(data).hexdigest()
        self.created_time = time.time()
        self.expiry_time = self.created_time + ttl
        self.last_access_time = self.created_time
        self.access_count = 1
        self.version = int(time.time() * 1_000_000)

class BlockBasedDataCache:
    """A block-based data cache."""
    def __init__(self, max_size_mb: float = 1024.0, default_block_size: int = 1024 * 1024):  # 1 MB default block size
        self.max_size_bytes = max_size_mb * 1024 * 1024
        self.current_size_bytes = 0
        self.default_block_size = default_block_size
        self.cache: Dict[str, DataCacheEntry] = {}
        self.file_blocks: Dict[str, List[str]] = {}  # file path -> block IDs
        self.cache_lock = threading.RLock()
        self.stats = {
            "hits": 0,
            "misses": 0,
            "evictions": 0,
            "writes": 0,
            "bytes_read": 0,
            "bytes_written": 0
        }

    def read_data(self, file_path: str, offset: int, length: int) -> Optional[bytes]:
        """Read a byte range, assembling it from cached blocks."""
        result = bytearray()
        bytes_read = 0
        # Work out which blocks the range touches
        start_block = offset // self.default_block_size
        end_block = (offset + length - 1) // self.default_block_size
        for block_index in range(start_block, end_block + 1):
            block_offset = block_index * self.default_block_size
            block_id = f"{file_path}:{block_offset}:{self.default_block_size}"
            # Try the cache first
            block_data = self._read_block(block_id)
            if block_data is None:
                # Block not cached: fetch it from storage
                block_data = self._fetch_block_from_storage(file_path, block_offset, self.default_block_size)
                if block_data:
                    # Cache the freshly fetched block
                    self._cache_block(file_path, block_offset, block_data)
            if block_data:
                # Intersect the requested range with this block
                local_offset = max(0, offset - block_offset)
                local_end = min(len(block_data), offset + length - block_offset)
                local_length = local_end - local_offset
                if local_length > 0:
                    result.extend(block_data[local_offset:local_offset + local_length])
                    bytes_read += local_length
        if bytes_read > 0:
            self.stats["bytes_read"] += bytes_read
            return bytes(result)
        else:
            return None

    def _read_block(self, block_id: str) -> Optional[bytes]:
        """Read a block from the cache."""
        with self.cache_lock:
            if block_id in self.cache:
                entry = self.cache[block_id]
                # Expiry check
                if time.time() > entry.expiry_time:
                    self._evict_block(block_id)
                    self.stats["misses"] += 1
                    return None
                # Update access statistics
                entry.last_access_time = time.time()
                entry.access_count += 1
                self.stats["hits"] += 1
                return entry.data
            else:
                self.stats["misses"] += 1
                return None

    def _fetch_block_from_storage(self, file_path: str, offset: int, length: int) -> Optional[bytes]:
        """Fetch a block from the storage layer (mock implementation)."""
        print(f"Fetching block from storage: {file_path} offset={offset} length={length}")
        time.sleep(0.02)  # simulate I/O latency
        # Return simulated data
        data_size = min(length, 1024 * 1024)  # at most 1 MB
        return b"x" * data_size

    def _cache_block(self, file_path: str, offset: int, data: bytes, ttl: float = 300.0) -> bool:
        """Cache a data block."""
        with self.cache_lock:
            block_id = f"{file_path}:{offset}:{self.default_block_size}"
            # Replace an existing entry, if any
            if block_id in self.cache:
                old_entry = self.cache.pop(block_id)
                self.current_size_bytes -= old_entry.size
                # Remove it from the file->blocks index
                if file_path in self.file_blocks and block_id in self.file_blocks[file_path]:
                    self.file_blocks[file_path].remove(block_id)
            # Make room if necessary
            if self.current_size_bytes + len(data) > self.max_size_bytes:
                if not self._evict_for_space(len(data)):
                    return False  # not enough space and nothing left to evict
            # Insert the new entry
            entry = DataCacheEntry(file_path, offset, data, self.default_block_size, ttl)
            self.cache[block_id] = entry
            self.current_size_bytes += entry.size
            self.stats["writes"] += 1
            self.stats["bytes_written"] += len(data)
            # Update the file->blocks index
            if file_path not in self.file_blocks:
                self.file_blocks[file_path] = []
            self.file_blocks[file_path].append(block_id)
            return True

    def _evict_for_space(self, required_size: int) -> bool:
        """Free up space for new data."""
        if not self.cache:
            return False
        # Sort by last access time (LRU)
        sorted_entries = sorted(self.cache.items(), key=lambda x: x[1].last_access_time)
        # Evict the least recently used entries
        evicted_size = 0
        for block_id, entry in sorted_entries:
            evicted_size += entry.size
            self._evict_block(block_id)
            self.stats["evictions"] += 1
            if evicted_size >= required_size:
                break
        return evicted_size >= required_size

    def _evict_block(self, block_id: str):
        """Evict one block."""
        if block_id in self.cache:
            entry = self.cache[block_id]
            self.current_size_bytes -= entry.size
            # Remove it from the file->blocks index
            file_path = entry.file_path
            if file_path in self.file_blocks:
                if block_id in self.file_blocks[file_path]:
                    self.file_blocks[file_path].remove(block_id)
                if not self.file_blocks[file_path]:
                    del self.file_blocks[file_path]
            # Remove the cache entry
            del self.cache[block_id]

    def invalidate_file_cache(self, file_path: str):
        """Invalidate every cached block of a file."""
        with self.cache_lock:
            if file_path in self.file_blocks:
                block_ids = self.file_blocks[file_path].copy()
                for block_id in block_ids:
                    self._evict_block(block_id)

    def get_stats(self) -> Dict[str, Any]:
        """Return cache statistics."""
        with self.cache_lock:
            total_requests = self.stats["hits"] + self.stats["misses"]
            hit_rate = self.stats["hits"] / total_requests if total_requests > 0 else 0
            return {
                "max_size_mb": self.max_size_bytes / (1024 * 1024),
                "current_size_mb": self.current_size_bytes / (1024 * 1024),
                "blocks": len(self.cache),
                "files": len(self.file_blocks),
                "hits": self.stats["hits"],
                "misses": self.stats["misses"],
                "evictions": self.stats["evictions"],
                "writes": self.stats["writes"],
                "hit_rate": hit_rate,
                "utilization": self.current_size_bytes / self.max_size_bytes if self.max_size_bytes > 0 else 0,
                "bytes_read": self.stats["bytes_read"],
                "bytes_written": self.stats["bytes_written"]
            }

class TieredDataCache:
    """Tiered data cache combining a memory tier and a disk tier."""
    def __init__(self, memory_cache_mb: float = 512.0, disk_cache_mb: float = 2048.0,
                 disk_cache_path: str = "/tmp/dfs_cache"):
        self.memory_cache = BlockBasedDataCache(memory_cache_mb)
        # Note: disk_cache_mb is accepted but not enforced in this simplified example
        self.disk_cache_path = disk_cache_path
        self.disk_cache_lock = threading.Lock()
        # Create the on-disk cache directory
        os.makedirs(disk_cache_path, exist_ok=True)

    def read_data(self, file_path: str, offset: int, length: int) -> Optional[bytes]:
        """Read data, checking the memory tier, then the disk tier."""
        # Try the memory tier first. Note that BlockBasedDataCache falls back to
        # its own storage fetch internally, so in this simplified example the
        # disk tier is only reached for data written through write_data.
        data = self.memory_cache.read_data(file_path, offset, length)
        if data:
            return data
        # Memory miss: try the disk tier
        disk_data = self._read_from_disk_cache(file_path, offset, length)
        if disk_data:
            # Promote the data into the memory tier
            self._cache_to_memory(file_path, offset, disk_data)
            return disk_data
        # Both tiers missed: read from the storage layer
        return self._read_from_storage(file_path, offset, length)

    def _read_from_disk_cache(self, file_path: str, offset: int, length: int) -> Optional[bytes]:
        """Read from the on-disk cache."""
        try:
            # Derive the cache file name from the file path
            safe_filename = hashlib.md5(file_path.encode()).hexdigest()
            cache_file_path = os.path.join(self.disk_cache_path, safe_filename)
            if not os.path.exists(cache_file_path):
                return None
            with self.disk_cache_lock:
                with open(cache_file_path, 'rb') as f:
                    f.seek(offset)
                    data = f.read(length)
                    return data if data else None
        except Exception as e:
            print(f"Disk cache read failed: {e}")
            return None

    def _cache_to_memory(self, file_path: str, offset: int, data: bytes):
        """Promote data into the memory tier."""
        # Align to the block boundary; note this simplification caches the data
        # under the block-aligned key even if it does not cover the whole block
        block_start = (offset // self.memory_cache.default_block_size) * self.memory_cache.default_block_size
        self.memory_cache._cache_block(file_path, block_start, data)

    def _read_from_storage(self, file_path: str, offset: int, length: int) -> Optional[bytes]:
        """Read from the storage layer (mock implementation)."""
        print(f"Reading from storage: {file_path} offset={offset} length={length}")
        time.sleep(0.05)  # simulate the higher latency of the storage layer
        # Return simulated data
        data_size = min(length, 1024 * 1024)  # at most 1 MB
        return b"s" * data_size

    def write_data(self, file_path: str, offset: int, data: bytes):
        """Write data, keeping the cache tiers in step."""
        # Invalidate the affected memory-tier blocks
        self.memory_cache.invalidate_file_cache(file_path)
        # Update the disk tier
        self._update_disk_cache(file_path, offset, data)
        # A real implementation would also write through to the storage layer

    def _update_disk_cache(self, file_path: str, offset: int, data: bytes):
        """Update the on-disk cache."""
        try:
            safe_filename = hashlib.md5(file_path.encode()).hexdigest()
            cache_file_path = os.path.join(self.disk_cache_path, safe_filename)
            with self.disk_cache_lock:
                # Write the data at the requested offset
                with open(cache_file_path, 'r+b' if os.path.exists(cache_file_path) else 'wb') as f:
                    f.seek(offset)
                    f.write(data)
        except Exception as e:
            print(f"Disk cache update failed: {e}")

    def get_stats(self) -> Dict[str, Any]:
        """Return cache statistics."""
        memory_stats = self.memory_cache.get_stats()
        return {
            "memory_cache": memory_stats,
            "disk_cache_path": self.disk_cache_path
        }

# Usage example
print("\n=== Data cache architecture demo ===")

# Create a tiered data cache
tiered_cache = TieredDataCache(memory_cache_mb=100.0, disk_cache_mb=500.0)

# First read: blocks are not cached yet
print("First read...")
data1 = tiered_cache.read_data("/data/large_file.dat", 0, 1024)
print(f"Read {len(data1) if data1 else 0} bytes")

# Read the same range again (served from the memory tier)
print("\nSecond read of the same range...")
data2 = tiered_cache.read_data("/data/large_file.dat", 0, 1024)
print(f"Read {len(data2) if data2 else 0} bytes")

# Read an adjacent range (served from the same cached block)
print("\nReading an adjacent range...")
data3 = tiered_cache.read_data("/data/large_file.dat", 512, 512)
print(f"Read {len(data3) if data3 else 0} bytes")

# Inspect statistics
stats = tiered_cache.get_stats()
print(f"\nCache stats:")
print(f"  Memory tier:")
for key, value in stats["memory_cache"].items():
    print(f"    {key}: {value}")

# Show the effect of a write on the cache
print("\nWriting data and observing the cache...")
tiered_cache.write_data("/data/large_file.dat", 0, b"Updated data")
print("Write complete")

# Read again (the cached blocks were invalidated by the write)
print("Reading after the write...")
data4 = tiered_cache.read_data("/data/large_file.dat", 0, 1024)
print(f"Read {len(data4) if data4 else 0} bytes")
7.3.4.2 Data Cache Consistency Guarantees
# Data cache consistency mechanisms
import hashlib
import time
import threading
from typing import Dict, List, Optional
from dataclasses import dataclass

@dataclass
class DataVersion:
    """Version information for a file's data"""
    version: int
    checksum: str
    timestamp: float

class DataConsistencyManager:
    """Manages data versions and invalidations for consistency."""
    def __init__(self):
        self.file_versions: Dict[str, DataVersion] = {}
        self.cache_invalidation: Dict[str, float] = {}
        self.consistency_lock = threading.RLock()

    def update_file_version(self, file_path: str, data: bytes) -> int:
        """Record a new version for a file."""
        with self.consistency_lock:
            version = int(time.time() * 1_000_000)  # microsecond-resolution version number
            checksum = hashlib.md5(data).hexdigest()
            self.file_versions[file_path] = DataVersion(
                version=version,
                checksum=checksum,
                timestamp=time.time()
            )
            return version

    def validate_cache_data(self, file_path: str, cached_version: int, cached_checksum: str) -> bool:
        """Validate a cached copy against the current version."""
        with self.consistency_lock:
            # Version check
            if file_path in self.file_versions:
                current_version = self.file_versions[file_path]
                if cached_version < current_version.version:
                    return False  # cached version is stale
                # Checksum check
                if cached_checksum != current_version.checksum:
                    return False  # data mismatch
            # Invalidation-timestamp check
            if file_path in self.cache_invalidation:
                invalidation_time = self.cache_invalidation[file_path]
                cached_version_time = cached_version / 1_000_000.0  # convert to seconds
                if cached_version_time < invalidation_time:
                    return False  # cached copy predates the invalidation
            return True

    def invalidate_file_cache(self, file_path: str):
        """Invalidate the cached copies of a file."""
        with self.consistency_lock:
            self.cache_invalidation[file_path] = time.time()
            # Notify the other nodes in the cluster
            self._notify_peers_of_invalidation(file_path)

    def _notify_peers_of_invalidation(self, file_path: str):
        """Notify peer nodes of an invalidation (simplified implementation)."""
        print(f"Notifying peers to invalidate file cache: {file_path}")

class ConsistentDataCache:
    """A data cache with consistency management."""
    def __init__(self, max_size_mb: float = 1024.0):
        self.block_cache = BlockBasedDataCache(max_size_mb)
        self.consistency_manager = DataConsistencyManager()
        self.cache_lock = threading.RLock()

    def read_data(self, file_path: str, offset: int, length: int) -> Optional[bytes]:
        """Read data (version validation is left to the write path in this simplified design)."""
        return self.block_cache.read_data(file_path, offset, length)

    def write_data(self, file_path: str, offset: int, data: bytes) -> bool:
        """Write data while preserving consistency."""
        with self.cache_lock:
            # Record the new file version
            version = self.consistency_manager.update_file_version(file_path, data)
            # Invalidate the affected cache entries
            self.consistency_manager.invalidate_file_cache(file_path)
            self.block_cache.invalidate_file_cache(file_path)
            # Write through to the storage layer (simplified)
            success = self._write_to_storage(file_path, offset, data)
            if success:
                print(f"Write succeeded: {file_path} (version {version})")
            else:
                print(f"Write failed: {file_path}")
            return success

    def _write_to_storage(self, file_path: str, offset: int, data: bytes) -> bool:
        """Write to the storage layer (mock implementation)."""
        print(f"Writing to storage: {file_path} offset={offset} size={len(data)}")
        time.sleep(0.03)  # simulate I/O latency
        return True  # simulate a successful write

    def get_consistency_info(self, file_path: str) -> Optional[DataVersion]:
        """Return the consistency information for a file."""
        with self.cache_lock:
            return self.consistency_manager.file_versions.get(file_path)

class DistributedDataCache:
    """Distributed data cache with multi-node consistency."""
    def __init__(self, node_id: str, peer_nodes: List[str]):
        self.node_id = node_id
        self.peer_nodes = peer_nodes
        self.local_cache = ConsistentDataCache()
        self.version_vector: Dict[str, int] = {}              # version vector
        self.invalidation_timestamps: Dict[str, float] = {}   # invalidation timestamps

    def read_data(self, file_path: str, offset: int, length: int) -> Optional[bytes]:
        """Read data with distributed consistency."""
        # Read from the local cache first
        data = self.local_cache.read_data(file_path, offset, length)
        if data:
            # Verify consistency if the file was invalidated recently
            if self._needs_consistency_verification(file_path):
                # A real implementation would re-validate against storage or peers
                print(f"Verifying consistency of {file_path}")
            return data
        return None

    def write_data(self, file_path: str, offset: int, data: bytes) -> bool:
        """Write data with distributed consistency."""
        # Write to the local cache
        success = self.local_cache.write_data(file_path, offset, data)
        if success:
            # Pick up the new version number
            consistency_info = self.local_cache.get_consistency_info(file_path)
            if consistency_info:
                version = consistency_info.version
                self.version_vector[file_path] = version
                # Notify the peers
                self._notify_peers_of_write(file_path, version)
        return success

    def _needs_consistency_verification(self, file_path: str) -> bool:
        """Decide whether a consistency check is required."""
        # Simplified: require verification within 60 s of an invalidation
        if file_path in self.invalidation_timestamps:
            return time.time() - self.invalidation_timestamps[file_path] < 60
        return False

    def _notify_peers_of_write(self, file_path: str, version: int):
        """Notify peer nodes of a write."""
        print(f"Node {self.node_id} notifying peers of write: {file_path} (version {version})")
        # A real implementation would send write notifications over the network

    def handle_peer_write_notification(self, file_path: str, version: int, peer_id: str):
        """Handle a write notification from a peer node."""
        print(f"Node {self.node_id} received write notification from {peer_id}: {file_path} (version {version})")
        # Update the version vector
        self.version_vector[file_path] = version
        # Invalidate the local cached copies
        self.local_cache.consistency_manager.invalidate_file_cache(file_path)
        self.local_cache.block_cache.invalidate_file_cache(file_path)
        # Record the invalidation timestamp
        self.invalidation_timestamps[file_path] = time.time()

# Usage example
print("\n=== Data cache consistency demo ===")

# Create a distributed data cache
peer_nodes = ["node2", "node3", "node4"]
dist_cache = DistributedDataCache("node1", peer_nodes)

# Write
print("Writing data...")
write_success = dist_cache.write_data("/shared/data/file1.dat", 0, b"Initial data content")
print(f"Write result: {'success' if write_success else 'failure'}")

# Read
print("\nReading data...")
data = dist_cache.read_data("/shared/data/file1.dat", 0, 1024)
print(f"Read data: {data[:20] if data else 'no data'}")

# Read again (served from the cached block this time)
print("\nReading again...")
data2 = dist_cache.read_data("/shared/data/file1.dat", 0, 1024)
print(f"Read data again: {data2[:20] if data2 else 'no data'}")

# Simulate a write notification from a peer
print("\nHandling a peer write notification...")
dist_cache.handle_peer_write_notification("/shared/data/file1.dat", 1234567890, "node2")

# Read again (the local cache was invalidated)
print("\nReading after the invalidation...")
data3 = dist_cache.read_data("/shared/data/file1.dat", 0, 1024)
print(f"Read after invalidation: {data3[:20] if data3 else 'no data'}")

# Inspect the consistency information
consistency_info = dist_cache.local_cache.get_consistency_info("/shared/data/file1.dat")
if consistency_info:
    print(f"\nConsistency info: version={consistency_info.version}, checksum={consistency_info.checksum[:10]}...")

# Inspect cache statistics
stats = dist_cache.local_cache.block_cache.get_stats()
print(f"\nCache stats:")
for key, value in stats.items():
    print(f"  {key}: {value}")
Summary
High-performance cache design is a key technique for improving the performance of a distributed file storage platform. This chapter covered the following core topics:
- Cache architecture overview: distributed file storage systems use a multi-layer cache architecture spanning client-side, metadata, and data caches, which together form a complete caching hierarchy.
- Client-side cache design: the client-side cache sits closest to the application; sensible eviction policies (LRU, LFU, and so on) and optimizations such as prefetching and batched operations noticeably improve the user experience.
- Metadata cache design: the metadata cache is tuned for directory structures and file attributes, supports hierarchical storage and distributed coordination, and substantially reduces metadata query latency.
- Data cache design: the data cache stores block-aligned chunks across memory and disk tiers, with a consistency-management mechanism to keep cached data correct.
In engineering practice, the following points deserve particular attention:
- Policy selection: choose caching policies and parameters that match each workload's access pattern
- Consistency guarantees: implement effective cache-consistency mechanisms for the distributed environment
- Performance monitoring: build thorough cache-performance monitoring and keep tuning based on what it shows
- Capacity planning: size each cache layer deliberately, balancing cost against performance
With these caching mechanisms designed and implemented well, a distributed file storage platform can deliver significantly better performance and user experience while preserving data consistency.