Benchmark Testing Practice and Performance Verification
Benchmarking is the key means of verifying the effect of performance optimizations in a distributed file storage platform. Through scientific, systematic benchmarking practice, we can not only quantify the system's performance but also validate that optimization measures actually work, providing the data needed for continuous improvement.
12.1.4 Benchmark Framework Design
A sound benchmark framework needs to be extensible, repeatable, and accurate.
12.1.4.1 Benchmark Framework Implementation
# Benchmark framework
import random
import statistics
import threading
import time
from datetime import datetime
from typing import Any, Callable, Dict, List, Optional
class BenchmarkTest:
    """Base class for a single benchmark test."""

    def __init__(self, name: str, description: str):
        self.name = name
        self.description = description
        self.setup_func: Optional[Callable] = None
        self.teardown_func: Optional[Callable] = None
        self.test_func: Optional[Callable] = None
        self.iterations = 1
        self.concurrent_threads = 1
        self.warmup_iterations = 0
        self.results = []
        self.metrics = {}

    def setup(self, func: Callable):
        """Register the setup function."""
        self.setup_func = func
        return self

    def teardown(self, func: Callable):
        """Register the teardown function."""
        self.teardown_func = func
        return self

    def test(self, func: Callable):
        """Register the function under test."""
        self.test_func = func
        return self

    def config(self, iterations: int = 1, concurrent_threads: int = 1,
               warmup_iterations: int = 0):
        """Configure test parameters."""
        self.iterations = iterations
        self.concurrent_threads = concurrent_threads
        self.warmup_iterations = warmup_iterations
        return self
    def run(self) -> Dict[str, Any]:
        """Run the benchmark."""
        print(f"Starting benchmark: {self.name}")
        # Reset state so the same test instance can be run more than once
        self.results = []
        self.metrics = {}
        # Setup phase
        if self.setup_func:
            try:
                self.setup_func()
                print("Setup phase complete")
            except Exception as e:
                return {"error": f"Setup failed: {e}"}
        try:
            # Warmup
            if self.warmup_iterations > 0:
                print(f"Running {self.warmup_iterations} warmup iterations...")
                self._run_warmup()
            # Measured run
            print(f"Running {self.iterations} iterations with {self.concurrent_threads} concurrent thread(s)...")
            self._run_benchmark()
            # Compute metrics
            self._calculate_metrics()
        except Exception as e:
            return {"error": f"Benchmark execution failed: {e}"}
        finally:
            # Teardown phase
            if self.teardown_func:
                try:
                    self.teardown_func()
                    print("Teardown phase complete")
                except Exception as e:
                    print(f"Teardown failed: {e}")
        return self._generate_report()
    def _run_warmup(self):
        """Run warmup iterations (results are discarded)."""
        for i in range(self.warmup_iterations):
            try:
                if self.test_func:
                    self.test_func()
            except Exception as e:
                print(f"Warmup iteration {i + 1} failed: {e}")

    def _run_benchmark(self):
        """Dispatch to sequential or concurrent execution."""
        if self.concurrent_threads > 1:
            self._run_concurrent_benchmark()
        else:
            self._run_sequential_benchmark()

    def _run_sequential_benchmark(self):
        """Run the iterations one after another on the calling thread."""
        for i in range(self.iterations):
            try:
                start_time = time.time()
                result = self.test_func() if self.test_func else None
                end_time = time.time()
                self.results.append({
                    "iteration": i + 1,
                    "duration": end_time - start_time,
                    "success": True,
                    "result": result,
                    "timestamp": datetime.now().isoformat()
                })
            except Exception as e:
                self.results.append({
                    "iteration": i + 1,
                    "duration": 0,
                    "success": False,
                    "error": str(e),
                    "timestamp": datetime.now().isoformat()
                })
    def _run_concurrent_benchmark(self):
        """Split the iterations across worker threads and run them in parallel."""
        def worker(thread_id: int, results: List[Dict[str, Any]]):
            thread_results = []
            # Integer division: when iterations is not evenly divisible by
            # concurrent_threads, the remainder iterations are dropped
            for i in range(self.iterations // self.concurrent_threads):
                try:
                    start_time = time.time()
                    result = self.test_func() if self.test_func else None
                    end_time = time.time()
                    thread_results.append({
                        "thread_id": thread_id,
                        "iteration": i + 1,
                        "duration": end_time - start_time,
                        "success": True,
                        "result": result,
                        "timestamp": datetime.now().isoformat()
                    })
                except Exception as e:
                    thread_results.append({
                        "thread_id": thread_id,
                        "iteration": i + 1,
                        "duration": 0,
                        "success": False,
                        "error": str(e),
                        "timestamp": datetime.now().isoformat()
                    })
            # list.extend is atomic under CPython's GIL, so no lock is needed
            results.extend(thread_results)
        # Create and start the threads
        threads = []
        thread_results = []
        for i in range(self.concurrent_threads):
            thread = threading.Thread(target=worker, args=(i, thread_results))
            threads.append(thread)
            thread.start()
        # Wait for all threads to finish
        for thread in threads:
            thread.join()
        self.results = thread_results
    def _calculate_metrics(self):
        """Compute performance metrics from the raw results."""
        if not self.results:
            return
        # Keep only the successful iterations
        successful_results = [r for r in self.results if r["success"]]
        durations = [r["duration"] for r in successful_results]
        if not durations:
            self.metrics = {"error": "All iterations failed"}
            return
        # Basic statistics
        self.metrics = {
            "total_iterations": len(self.results),
            "successful_iterations": len(successful_results),
            "success_rate": len(successful_results) / len(self.results),
            "avg_duration": statistics.mean(durations),
            "min_duration": min(durations),
            "max_duration": max(durations),
            "duration_stddev": statistics.stdev(durations) if len(durations) > 1 else 0,
            "percentiles": self._calculate_percentiles(durations)
        }
        # Throughput: successful operations over the summed busy time
        total_duration = sum(durations)
        if total_duration > 0:
            self.metrics["throughput_ops_per_sec"] = len(successful_results) / total_duration
        # Operations per second implied by the mean latency
        if self.metrics["avg_duration"] > 0:
            self.metrics["ops_per_sec"] = 1.0 / self.metrics["avg_duration"]
    def _calculate_percentiles(self, durations: List[float]) -> Dict[str, float]:
        """Compute latency percentiles using the nearest-rank method."""
        if not durations:
            return {}
        sorted_durations = sorted(durations)
        percentiles = {}
        for p in [50, 90, 95, 99]:
            # Clamp the index so p100-style overflow cannot occur
            index = min(int(len(sorted_durations) * p / 100), len(sorted_durations) - 1)
            percentiles[f"p{p}"] = sorted_durations[index]
        return percentiles
    def _generate_report(self) -> Dict[str, Any]:
        """Assemble the test report."""
        return {
            "test_name": self.name,
            "description": self.description,
            "configuration": {
                "iterations": self.iterations,
                "concurrent_threads": self.concurrent_threads,
                "warmup_iterations": self.warmup_iterations
            },
            "results": self.results,
            "metrics": self.metrics,
            "generated_at": datetime.now().isoformat()
        }
class BenchmarkSuite:
    """A collection of benchmark tests run as a unit."""

    def __init__(self, name: str):
        self.name = name
        self.tests: List[BenchmarkTest] = []
        self.suite_results = []

    def add_test(self, test: BenchmarkTest):
        """Add a test case to the suite."""
        self.tests.append(test)

    def run_suite(self) -> Dict[str, Any]:
        """Run every test in the suite and collect the results."""
        print(f"Starting test suite: {self.name}")
        print(f"Suite contains {len(self.tests)} test case(s)")
        suite_start_time = time.time()
        for i, test in enumerate(self.tests, 1):
            print(f"\n[{i}/{len(self.tests)}] Running test: {test.name}")
            result = test.run()
            self.suite_results.append(result)
            # Print a short summary for each test
            if "error" in result:
                print(f"  Test failed: {result['error']}")
            elif "metrics" in result and "error" in result["metrics"]:
                print(f"  Test failed: {result['metrics']['error']}")
            else:
                metrics = result.get("metrics", {})
                print(f"  Success rate: {metrics.get('success_rate', 0):.2%}")
                print(f"  Average duration: {metrics.get('avg_duration', 0) * 1000:.2f}ms")
                print(f"  Throughput: {metrics.get('ops_per_sec', 0):.2f} ops/sec")
        suite_end_time = time.time()
        return {
            "suite_name": self.name,
            "total_tests": len(self.tests),
            "completed_tests": len([r for r in self.suite_results if "error" not in r]),
            "suite_duration": suite_end_time - suite_start_time,
            "test_results": self.suite_results,
            "generated_at": datetime.now().isoformat()
        }
# Usage example
def sample_test_operation():
    """Sample operation under test."""
    # Simulate some work with a 1-3 ms delay
    time.sleep(0.001 + random.random() * 0.002)
    return {"result": "success"}

def sample_setup():
    """Sample setup function."""
    print("Running test setup...")

def sample_teardown():
    """Sample teardown function."""
    print("Running test teardown...")

def demonstrate_benchmark_framework():
    """Demonstrate the benchmark framework."""
    # Build a single test with the fluent interface
    test1 = (BenchmarkTest("Sample Test 1", "Sample test case 1")
             .setup(sample_setup)
             .test(sample_test_operation)
             .teardown(sample_teardown)
             .config(iterations=100, concurrent_threads=5, warmup_iterations=10))
    result1 = test1.run()
    print("Test 1 results:")
    if "error" not in result1:
        metrics = result1.get("metrics", {})
        print(f"  Success rate: {metrics.get('success_rate', 0):.2%}")
        print(f"  Average duration: {metrics.get('avg_duration', 0) * 1000:.2f}ms")
    # Build a test suite
    suite = BenchmarkSuite("Performance Test Suite")
    test2 = (BenchmarkTest("Sample Test 2", "Sample test case 2")
             .test(sample_test_operation)
             .config(iterations=50, concurrent_threads=3))
    test3 = (BenchmarkTest("Sample Test 3", "Sample test case 3")
             .test(sample_test_operation)
             .config(iterations=200, concurrent_threads=10, warmup_iterations=20))
    suite.add_test(test1)
    suite.add_test(test2)
    suite.add_test(test3)
    suite_result = suite.run_suite()
    print("\nSuite results:")
    print(f"  Suite name: {suite_result['suite_name']}")
    print(f"  Total tests: {suite_result['total_tests']}")
    print(f"  Completed tests: {suite_result['completed_tests']}")
    print(f"  Total duration: {suite_result['suite_duration']:.2f}s")

# Run the demo
# demonstrate_benchmark_framework()
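One caveat about _run_concurrent_benchmark above: the integer division silently drops remainder iterations whenever iterations is not evenly divisible by concurrent_threads, and hand-rolled thread management is easy to get wrong. As a minimal alternative sketch (our own addition, not part of the framework above), the standard library's concurrent.futures.ThreadPoolExecutor can run the exact iteration count while keeping per-operation timing; timed_call and run_concurrent are hypothetical helper names:

# Alternative sketch: concurrency via ThreadPoolExecutor (standard library)
import time
from concurrent.futures import ThreadPoolExecutor
from typing import Any, Callable, Dict, List

def timed_call(test_func: Callable) -> Dict[str, Any]:
    """Run one operation and record its wall-clock duration."""
    start = time.time()
    try:
        result = test_func()
        return {"duration": time.time() - start, "success": True, "result": result}
    except Exception as e:
        return {"duration": 0, "success": False, "error": str(e)}

def run_concurrent(test_func: Callable, iterations: int, workers: int) -> List[Dict[str, Any]]:
    """Run exactly `iterations` operations across a pool of `workers` threads."""
    with ThreadPoolExecutor(max_workers=workers) as pool:
        # map() preserves the full iteration count, unlike integer division
        return list(pool.map(lambda _: timed_call(test_func), range(iterations)))

Using pool.map also keeps the result order deterministic, which simplifies per-iteration analysis afterwards.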
12.1.4.2 Storage-Specific Benchmark Tests
# Storage-specific benchmark tests
import os
import random
import tempfile
import threading
import time
from datetime import datetime
from typing import Any, Dict, List, Optional

class StorageBenchmark:
    """Benchmark tests for a storage system."""

    def __init__(self, test_directory: Optional[str] = None):
        self.test_directory = test_directory or tempfile.mkdtemp()
        self.test_files = []
        self.benchmark_results = {}
    def prepare_test_data(self, file_sizes: List[int], file_count: int = 10) -> List[str]:
        """Generate test files filled with random data."""
        print(f"Preparing test data: {file_count} files, sizes from {min(file_sizes)} to {max(file_sizes)} bytes")
        prepared_files = []
        for i in range(file_count):
            # Pick a file size at random
            file_size = random.choice(file_sizes)
            # Build the test file path
            file_path = os.path.join(self.test_directory, f"test_file_{i:04d}_{file_size}.dat")
            # Fill the file with random bytes
            with open(file_path, 'wb') as f:
                f.write(os.urandom(file_size))
            prepared_files.append(file_path)
            self.test_files.append(file_path)
        print(f"Test data ready: {len(prepared_files)} files")
        return prepared_files
    def benchmark_sequential_read(self, files: List[str]) -> Dict[str, Any]:
        """Sequential read benchmark."""
        print("Running sequential read benchmark...")
        durations = []
        bytes_read = 0
        for file_path in files:
            try:
                start_time = time.time()
                with open(file_path, 'rb') as f:
                    data = f.read()
                    bytes_read += len(data)
                end_time = time.time()
                durations.append(end_time - start_time)
            except Exception as e:
                print(f"Failed to read file {file_path}: {e}")
                durations.append(0)
        if not durations or sum(durations) == 0:
            return {"error": "Sequential read test failed"}
        total_duration = sum(durations)
        avg_duration = total_duration / len(durations)
        return {
            "test_type": "sequential_read",
            "file_count": len(files),
            "total_bytes": bytes_read,
            "total_duration": total_duration,
            "avg_duration": avg_duration,
            "throughput_bytes_per_sec": bytes_read / total_duration if total_duration > 0 else 0,
            "throughput_mb_per_sec": (bytes_read / total_duration / 1024 / 1024) if total_duration > 0 else 0
        }
    def benchmark_sequential_write(self, file_sizes: List[int], file_count: int = 10) -> Dict[str, Any]:
        """Sequential write benchmark."""
        print("Running sequential write benchmark...")
        durations = []
        bytes_written = 0
        for i in range(file_count):
            file_size = random.choice(file_sizes)
            file_path = os.path.join(self.test_directory, f"write_test_{i:04d}_{file_size}.dat")
            try:
                # Generate the payload outside the timed region so the cost of
                # os.urandom does not distort the write measurement
                data = os.urandom(file_size)
                start_time = time.time()
                with open(file_path, 'wb') as f:
                    f.write(data)
                end_time = time.time()
                # Note: without flush/fsync these timings largely reflect the
                # OS page cache rather than the underlying device
                bytes_written += file_size
                durations.append(end_time - start_time)
                self.test_files.append(file_path)
            except Exception as e:
                print(f"Failed to write file {file_path}: {e}")
                durations.append(0)
        if not durations or sum(durations) == 0:
            return {"error": "Sequential write test failed"}
        total_duration = sum(durations)
        avg_duration = total_duration / len(durations)
        return {
            "test_type": "sequential_write",
            "file_count": file_count,
            "total_bytes": bytes_written,
            "total_duration": total_duration,
            "avg_duration": avg_duration,
            "throughput_bytes_per_sec": bytes_written / total_duration if total_duration > 0 else 0,
            "throughput_mb_per_sec": (bytes_written / total_duration / 1024 / 1024) if total_duration > 0 else 0
        }
    def benchmark_random_read(self, files: List[str], read_size: int = 4096,
                              read_count: int = 100) -> Dict[str, Any]:
        """Random read benchmark."""
        print("Running random read benchmark...")
        durations = []
        successful_reads = 0
        for _ in range(read_count):
            # Pick a file at random
            file_path = random.choice(files)
            try:
                file_size = os.path.getsize(file_path)
                if file_size <= read_size:
                    offset = 0
                else:
                    offset = random.randint(0, file_size - read_size)
                start_time = time.time()
                with open(file_path, 'rb') as f:
                    f.seek(offset)
                    data = f.read(read_size)
                end_time = time.time()
                # Only count reads that returned the full requested size
                if len(data) == read_size:
                    durations.append(end_time - start_time)
                    successful_reads += 1
            except Exception as e:
                print(f"Random read failed: {e}")
        if not durations:
            return {"error": "Random read test failed"}
        avg_duration = sum(durations) / len(durations)
        return {
            "test_type": "random_read",
            "read_operations": read_count,
            "successful_reads": successful_reads,
            "success_rate": successful_reads / read_count,
            "read_size": read_size,
            "avg_duration": avg_duration,
            "iops": len(durations) / sum(durations) if sum(durations) > 0 else 0
        }
    def benchmark_concurrent_access(self, files: List[str],
                                    concurrent_threads: int = 10) -> Dict[str, Any]:
        """Concurrent access benchmark."""
        print(f"Running concurrent access benchmark ({concurrent_threads} threads)...")
        def worker(thread_id: int, results: List[float]):
            thread_durations = []
            for _ in range(5):  # each thread performs 5 operations
                file_path = random.choice(files)
                try:
                    start_time = time.time()
                    with open(file_path, 'rb') as f:
                        f.read(1024)  # read 1 KB
                    end_time = time.time()
                    thread_durations.append(end_time - start_time)
                except Exception as e:
                    print(f"Thread {thread_id} operation failed: {e}")
            results.extend(thread_durations)
        # Create and start the threads; measure wall-clock time across the
        # whole run so throughput reflects actual concurrency
        threads = []
        thread_results = []
        wall_start = time.time()
        for i in range(concurrent_threads):
            thread = threading.Thread(target=worker, args=(i, thread_results))
            threads.append(thread)
            thread.start()
        # Wait for all threads to finish
        for thread in threads:
            thread.join()
        wall_duration = time.time() - wall_start
        if not thread_results:
            return {"error": "Concurrent access test failed"}
        total_duration = sum(thread_results)
        avg_duration = total_duration / len(thread_results)
        return {
            "test_type": "concurrent_access",
            "concurrent_threads": concurrent_threads,
            "total_operations": len(thread_results),
            "total_duration": total_duration,
            "avg_duration": avg_duration,
            "throughput_ops_per_sec": len(thread_results) / wall_duration if wall_duration > 0 else 0
        }
    def run_comprehensive_benchmark(self, file_sizes: Optional[List[int]] = None) -> Dict[str, Any]:
        """Run the full set of storage benchmarks."""
        if file_sizes is None:
            file_sizes = [1024, 10240, 102400, 1048576]  # 1 KB, 10 KB, 100 KB, 1 MB
        print("Starting comprehensive storage benchmark...")
        # Prepare test data
        test_files = self.prepare_test_data(file_sizes, 20)
        # Run each benchmark
        results = {}
        # Sequential read
        results["sequential_read"] = self.benchmark_sequential_read(test_files)
        # Sequential write
        results["sequential_write"] = self.benchmark_sequential_write(file_sizes, 10)
        # Random read
        results["random_read"] = self.benchmark_random_read(test_files, 4096, 100)
        # Concurrent access
        results["concurrent_access"] = self.benchmark_concurrent_access(test_files, 10)
        # Clean up test files
        self.cleanup_test_files()
        return {
            "benchmark_type": "comprehensive_storage",
            "results": results,
            "generated_at": datetime.now().isoformat()
        }
    def cleanup_test_files(self):
        """Delete the generated test files."""
        print("Cleaning up test files...")
        for file_path in self.test_files:
            try:
                if os.path.exists(file_path):
                    os.remove(file_path)
            except Exception as e:
                print(f"Failed to delete file {file_path}: {e}")
        self.test_files.clear()
# Usage example
def demonstrate_storage_benchmark():
    """Demonstrate the storage benchmark."""
    # Create a storage benchmark instance
    storage_bench = StorageBenchmark()
    # Run the comprehensive benchmark
    comprehensive_result = storage_bench.run_comprehensive_benchmark()
    print("\nComprehensive storage benchmark results:")
    results = comprehensive_result.get("results", {})
    for test_type, result in results.items():
        if "error" in result:
            print(f"  {test_type}: {result['error']}")
        else:
            print(f"  {test_type}:")
            if "throughput_mb_per_sec" in result:
                print(f"    Throughput: {result['throughput_mb_per_sec']:.2f} MB/s")
            if "iops" in result:
                print(f"    IOPS: {result['iops']:.2f}")
            if "avg_duration" in result:
                print(f"    Average latency: {result['avg_duration'] * 1000:.2f} ms")
            if "success_rate" in result:
                print(f"    Success rate: {result['success_rate']:.2%}")

# Run the demo
# demonstrate_storage_benchmark()
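One caveat when interpreting these local-filesystem numbers: files read immediately after being written are usually served from the OS page cache, so sequential-read throughput can reflect memory bandwidth rather than the storage device. A best-effort, Unix-only sketch for evicting one file's cached pages before re-reading it (it assumes os.posix_fadvise is available, which it is not on Windows):

# Sketch: best-effort page-cache eviction before read benchmarks (Unix only)
import os

def drop_page_cache(file_path: str):
    """Advise the kernel to discard cached pages for one file."""
    fd = os.open(file_path, os.O_RDONLY)
    try:
        # Length 0 means "from offset to end of file"; dirty pages that have
        # not yet been written back may stay cached despite the advice
        os.posix_fadvise(fd, 0, 0, os.POSIX_FADV_DONTNEED)
    finally:
        os.close(fd)

The advice is exactly that, advisory, so for rigorous device-level numbers a dedicated tool such as fio is the usual choice.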
12.1.5 Performance Verification and Continuous Monitoring
Performance verification is not a one-off testing activity; it calls for a continuous monitoring mechanism.
12.1.5.1 Performance Regression Detection
# Performance regression detection system
import json
import random
import threading
import time
from datetime import datetime
from typing import Any, Dict, Optional, Set

class PerformanceRegressionDetector:
    """Detects performance regressions against a stored baseline."""

    def __init__(self, baseline_data: Optional[Dict[str, Any]] = None,
                 lower_is_better: Optional[Set[str]] = None):
        self.baseline_data = baseline_data or {}
        self.current_performance = {}
        # Metrics where a decrease is an improvement (e.g. latency);
        # for every other metric a decrease counts as a regression
        self.lower_is_better = set(lower_is_better or [])
        self.regression_threshold = 0.1  # flag changes worse than 10%

    def set_baseline(self, baseline_data: Dict[str, Any]):
        """Set the performance baseline."""
        self.baseline_data = baseline_data
        print("Performance baseline set")
    def load_baseline_from_file(self, file_path: str) -> bool:
        """Load the performance baseline from a file."""
        try:
            with open(file_path, 'r', encoding='utf-8') as f:
                self.baseline_data = json.load(f)
            print(f"Loaded performance baseline from {file_path}")
            return True
        except Exception as e:
            print(f"Failed to load performance baseline: {e}")
            return False

    def save_baseline_to_file(self, file_path: str) -> bool:
        """Save the performance baseline to a file."""
        try:
            with open(file_path, 'w', encoding='utf-8') as f:
                json.dump(self.baseline_data, f, indent=2, ensure_ascii=False)
            print(f"Performance baseline saved to {file_path}")
            return True
        except Exception as e:
            print(f"Failed to save performance baseline: {e}")
            return False
    def compare_performance(self, current_data: Dict[str, Any]) -> Dict[str, Any]:
        """Compare current metrics against the baseline."""
        self.current_performance = current_data
        regressions = []
        improvements = []
        for metric_name, current_value in current_data.items():
            if metric_name in self.baseline_data:
                baseline_value = self.baseline_data[metric_name]
                # Relative change versus the baseline
                if baseline_value != 0:
                    change_rate = (current_value - baseline_value) / baseline_value
                else:
                    change_rate = float('inf') if current_value > 0 else 0
                comparison = {
                    "metric": metric_name,
                    "baseline": baseline_value,
                    "current": current_value,
                    "change_rate": change_rate,
                    "absolute_change": current_value - baseline_value
                }
                # A drop is a regression for throughput-style metrics,
                # while a rise is a regression for latency-style metrics
                if metric_name in self.lower_is_better:
                    got_worse = change_rate > self.regression_threshold
                    got_better = change_rate < -self.regression_threshold
                else:
                    got_worse = change_rate < -self.regression_threshold
                    got_better = change_rate > self.regression_threshold
                if got_worse:
                    regressions.append(comparison)
                elif got_better:
                    improvements.append(comparison)
        return {
            "regressions": regressions,
            "improvements": improvements,
            "total_metrics": len(current_data),
            "regression_count": len(regressions),
            "improvement_count": len(improvements),
            "comparison_timestamp": datetime.now().isoformat()
        }
    def generate_regression_report(self, comparison_result: Dict[str, Any]) -> str:
        """Render a human-readable regression report."""
        report = []
        report.append("=== Performance Regression Report ===")
        report.append(f"Checked at: {comparison_result['comparison_timestamp']}")
        report.append(f"Metrics compared: {comparison_result['total_metrics']}")
        report.append(f"Regressions: {comparison_result['regression_count']}")
        report.append(f"Improvements: {comparison_result['improvement_count']}")
        report.append("")
        if comparison_result["regressions"]:
            report.append("Regressed metrics:")
            for regression in comparison_result["regressions"]:
                report.append(f"  {regression['metric']}: "
                              f"{regression['baseline']:.4f} -> {regression['current']:.4f} "
                              f"({regression['change_rate']:.2%})")
            report.append("")
        if comparison_result["improvements"]:
            report.append("Improved metrics:")
            for improvement in comparison_result["improvements"]:
                report.append(f"  {improvement['metric']}: "
                              f"{improvement['baseline']:.4f} -> {improvement['current']:.4f} "
                              f"({improvement['change_rate']:.2%})")
            report.append("")
        return "\n".join(report)
class ContinuousPerformanceMonitor:
    """Periodically samples performance and checks for regressions."""

    def __init__(self, detector: PerformanceRegressionDetector):
        self.detector = detector
        self.monitoring = False
        self.monitoring_interval = 3600  # default interval: 1 hour
        self.performance_history = []

    def start_monitoring(self, interval: int = 3600):
        """Start continuous monitoring in a background thread."""
        self.monitoring_interval = interval
        self.monitoring = True
        monitor_thread = threading.Thread(target=self._monitoring_loop)
        monitor_thread.daemon = True
        monitor_thread.start()
        print(f"Continuous performance monitoring started, interval: {interval}s")

    def stop_monitoring(self):
        """Stop continuous monitoring."""
        self.monitoring = False
        print("Continuous performance monitoring stopped")
    def _monitoring_loop(self):
        """Monitoring loop run by the background thread."""
        while self.monitoring:
            try:
                # Collect current performance data (simplified here)
                current_performance = self._collect_current_performance()
                # Compare against the baseline
                comparison_result = self.detector.compare_performance(current_performance)
                # Record history
                self.performance_history.append({
                    "timestamp": datetime.now().isoformat(),
                    "performance": current_performance,
                    "comparison": comparison_result
                })
                # Render the report
                report = self.detector.generate_regression_report(comparison_result)
                print(report)
                # Alert if any regression was detected
                if comparison_result["regression_count"] > 0:
                    self._send_regression_alert(comparison_result)
            except Exception as e:
                print(f"Performance monitoring error: {e}")
            # Sleep outside the try block so an error cannot turn the
            # loop into a busy spin
            time.sleep(self.monitoring_interval)
    def _collect_current_performance(self) -> Dict[str, Any]:
        """Collect current performance data (simplified implementation)."""
        # A real implementation would pull live data from the monitoring system
        return {
            "read_latency_ms": random.uniform(5, 15),
            "write_latency_ms": random.uniform(10, 25),
            "throughput_mb_per_sec": random.uniform(50, 150),
            "iops": random.uniform(1000, 5000),
            "cpu_utilization": random.uniform(20, 80),
            "memory_utilization": random.uniform(30, 70)
        }

    def _send_regression_alert(self, comparison_result: Dict[str, Any]):
        """Emit a performance regression alert."""
        print("=== Performance Regression Alert ===")
        for regression in comparison_result["regressions"]:
            print(f"Warning: {regression['metric']} degraded by {regression['change_rate']:.2%}")
# Usage example
def demonstrate_regression_detection():
    """Demonstrate performance regression detection."""
    # Create a detector; for these metrics, lower latency/utilization is better
    detector = PerformanceRegressionDetector(lower_is_better={
        "read_latency_ms", "write_latency_ms",
        "cpu_utilization", "memory_utilization"
    })
    # Set the baseline data
    baseline_data = {
        "read_latency_ms": 10.0,
        "write_latency_ms": 20.0,
        "throughput_mb_per_sec": 100.0,
        "iops": 3000.0,
        "cpu_utilization": 50.0,
        "memory_utilization": 60.0
    }
    detector.set_baseline(baseline_data)
    # Save the baseline to a file
    detector.save_baseline_to_file("performance_baseline.json")
    # Simulated current performance data (with some degradation)
    current_performance = {
        "read_latency_ms": 15.0,        # latency up 50% (regression)
        "write_latency_ms": 22.0,       # latency up 10% (borderline, at the threshold)
        "throughput_mb_per_sec": 80.0,  # throughput down 20% (regression)
        "iops": 2500.0,                 # IOPS down 16.7% (regression)
        "cpu_utilization": 55.0,        # CPU utilization up 10% (borderline, at the threshold)
        "memory_utilization": 58.0      # memory utilization down 3.3% (improvement, below threshold)
    }
    # Compare against the baseline
    comparison_result = detector.compare_performance(current_performance)
    # Render the report
    report = detector.generate_regression_report(comparison_result)
    print(report)
    # Continuous monitoring demo
    print("\nStarting continuous monitoring demo...")
    monitor = ContinuousPerformanceMonitor(detector)
    monitor.start_monitoring(interval=10)  # 10s interval for the demo
    # Let it run for 30 seconds
    time.sleep(30)
    monitor.stop_monitoring()

# Run the demo
# demonstrate_regression_detection()
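Regression detection pays off most when it gates the delivery pipeline. The sketch below is an illustrative assumption rather than a fixed convention: it presumes BenchmarkTest and sample_test_operation from section 12.1.4.1 are in scope, ci_regression_gate is our own name, and the baseline file name is arbitrary. It runs a small benchmark, compares two of its metrics against a saved baseline, and returns a non-zero exit code on any regression:

# Sketch: a CI regression gate built from the components above
def ci_regression_gate(baseline_file: str = "performance_baseline.json") -> int:
    """Return a process exit code: 0 if no regression, 1 otherwise."""
    test = (BenchmarkTest("CI Smoke Benchmark", "Latency smoke test for CI")
            .test(sample_test_operation)
            .config(iterations=200, warmup_iterations=20))
    result = test.run()
    if "error" in result:
        return 1
    metrics = result.get("metrics", {})
    if "error" in metrics or "avg_duration" not in metrics:
        return 1
    # Lower average duration is better; higher ops/sec is better
    detector = PerformanceRegressionDetector(lower_is_better={"avg_duration"})
    if not detector.load_baseline_from_file(baseline_file):
        # No baseline yet: record one and let this run pass
        detector.set_baseline({"avg_duration": metrics["avg_duration"],
                               "ops_per_sec": metrics["ops_per_sec"]})
        detector.save_baseline_to_file(baseline_file)
        return 0
    comparison = detector.compare_performance({
        "avg_duration": metrics["avg_duration"],
        "ops_per_sec": metrics["ops_per_sec"]})
    print(detector.generate_regression_report(comparison))
    return 1 if comparison["regression_count"] > 0 else 0

# In a CI job:
# raise SystemExit(ci_regression_gate())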
By establishing a sound benchmarking practice and performance verification system, we can scientifically assess the performance of a distributed file storage platform, catch performance problems early, and verify that optimization measures are effective, ensuring the system continues to deliver a high quality of service.