<!-- Fluentd配置示例 -->
<source>
  @type tail
  path /var/log/test-executor/*.log
  pos_file /var/log/td-agent/test-executor.log.pos
  tag test.executor
  format json
  time_key timestamp
</source>

<match test.executor>
  @type elasticsearch
  host elasticsearch-host
  port 9200
  logstash_format true
</match>

Logstash

Logstash是Elastic Stack的重要组成部分：

强大的处理能力：支持复杂的数据处理和转换
丰富的插件：提供大量的输入、过滤和输出插件
易于集成：与Elasticsearch和Kibana无缝集成
可扩展性：支持水平扩展

Filebeat

Filebeat是轻量级的日志收集器：

轻量级：资源占用少，适合边缘节点部署
可靠性：保证日志数据不丢失
简单易用：配置简单，易于部署
模块化：提供预构建的模块简化配置

实时日志推送机制

实时日志推送能够为用户提供即时的反馈信息。

WebSocket推送

WebSocket是实现实时推送的常用技术：

@Component
public class LogPushService {
    private final SimpMessagingTemplate messagingTemplate;
    
    public void pushLog(String taskId, LogEntry logEntry) {
        messagingTemplate.convertAndSend("/topic/task/" + taskId + "/logs", logEntry);
    }
    
    @MessageMapping("/task/{taskId}/logs")
    @SendTo("/topic/task/{taskId}/logs")
    public LogEntry subscribeToLogs(@DestinationVariable String taskId) {
        // 订阅日志推送
        return new LogEntry("Connected to log stream for task: " + taskId);
    }
}

Server-Sent Events (SSE)

SSE是另一种实现实时推送的技术：

@RestController
public class LogStreamController {
    
    @GetMapping(value = "/tasks/{taskId}/logs/stream", produces = MediaType.TEXT_EVENT_STREAM_VALUE)
    public SseEmitter streamLogs(@PathVariable String taskId) {
        SseEmitter emitter = new SseEmitter(Long.MAX_VALUE);
        
        // 启动日志推送线程
        logStreamingService.startStreaming(taskId, emitter);
        
        return emitter;
    }
}

消息队列推送

使用消息队列实现日志推送：

@Component
public class LogMessageProducer {
    private final RabbitTemplate rabbitTemplate;
    
    public void sendLog(String taskId, LogEntry logEntry) {
        rabbitTemplate.convertAndSend("log.exchange", "task." + taskId, logEntry);
    }
}

@Component
public class LogMessageConsumer {
    
    @RabbitListener(queues = "log.queue")
    public void receiveLog(LogEntry logEntry) {
        // 处理接收到的日志消息
        logPushService.pushLog(logEntry.getTaskId(), logEntry);
    }
}

日志格式标准化

统一的日志格式有助于日志的处理和分析。

结构化日志

采用结构化日志格式，便于机器处理：

{
  "timestamp": "2025-09-07T10:30:45.123Z",
  "level": "INFO",
  "service": "test-executor",
  "taskId": "task-12345",
  "thread": "pool-1-thread-1",
  "class": "com.test.platform.executor.TestExecutor",
  "method": "executeTest",
  "message": "开始执行测试任务",
  "context": {
    "testCaseId": "tc-001",
    "testSuiteId": "ts-001",
    "userId": "user-001"
  },
  "metrics": {
    "duration": 0,
    "memoryUsage": "256MB"
  }
}

日志级别定义

合理定义日志级别，便于过滤和处理：

public enum LogLevel {
    TRACE(1, "跟踪"),
    DEBUG(2, "调试"),
    INFO(3, "信息"),
    WARN(4, "警告"),
    ERROR(5, "错误"),
    FATAL(6, "致命");
    
    private int level;
    private String description;
    
    LogLevel(int level, String description) {
        this.level = level;
        this.description = description;
    }
    
    public int getLevel() {
        return level;
    }
    
    public String getDescription() {
        return description;
    }
}

日志存储与索引

高效的日志存储和索引是日志系统的核心。

Elasticsearch

Elasticsearch是日志存储和搜索的首选方案：

全文搜索：支持复杂的全文搜索功能
实时分析：支持实时数据分析
水平扩展：支持集群部署和水平扩展
REST API：提供丰富的REST API接口

存储策略

制定合理的日志存储策略：

# Elasticsearch索引生命周期管理策略
index.lifecycle.rollover_alias: "test-logs"
index.lifecycle.policy:
  phases:
    hot:
      actions:
        rollover:
          max_age: "7d"
          max_size: "50gb"
    warm:
      min_age: "7d"
      actions:
        forcemerge:
          max_num_segments: 1
    cold:
      min_age: "30d"
      actions:
        freeze: {}
    delete:
      min_age: "90d"
      actions:
        delete: {}

索引优化

优化索引配置提高查询性能：

{
  "settings": {
    "number_of_shards": 5,
    "number_of_replicas": 1,
    "refresh_interval": "30s",
    "translog": {
      "durability": "async"
    }
  },
  "mappings": {
    "properties": {
      "timestamp": {
        "type": "date"
      },
      "level": {
        "type": "keyword"
      },
      "service": {
        "type": "keyword"
      },
      "taskId": {
        "type": "keyword"
      },
      "message": {
        "type": "text",
        "analyzer": "ik_max_word"
      }
    }
  }
}

日志分析与可视化

通过分析和可视化日志数据，提取有价值的信息。

Kibana仪表盘

使用Kibana创建日志分析仪表盘：

实时监控面板：展示系统实时状态
趋势分析图表：展示日志数据的变化趋势
异常检测面板：识别异常日志模式
性能分析视图：分析系统性能指标

自定义分析

开发自定义的日志分析功能：

@Service
public class LogAnalysisService {
    
    public LogAnalysisReport analyzeTaskLogs(String taskId) {
        // 查询任务相关日志
        List<LogEntry> logs = logRepository.findByTaskId(taskId);
        
        // 分析日志数据
        LogAnalysisReport report = new LogAnalysisReport();
        report.setTaskId(taskId);
        report.setErrorCount(countErrors(logs));
        report.setWarningCount(countWarnings(logs));
        report.setExecutionTime(calculateExecutionTime(logs));
        report.setResourceUsage(analyzeResourceUsage(logs));
        
        // 识别异常模式
        report.setAnomalies(detectAnomalies(logs));
        
        return report;
    }
    
    private List<Anomaly> detectAnomalies(List<LogEntry> logs) {
        // 实现异常检测算法
        return anomalyDetectionService.detect(logs);
    }
}

性能优化

优化日志收集和推送系统的性能。

批量处理

采用批量处理提高处理效率：

@Component
public class BatchLogProcessor {
    private final BlockingQueue<LogEntry> logQueue = new LinkedBlockingQueue<>();
    private final ScheduledExecutorService scheduler = Executors.newScheduledThreadPool(1);
    
    @PostConstruct
    public void init() {
        // 定时批量处理日志
        scheduler.scheduleWithFixedDelay(this::processBatch, 0, 1, TimeUnit.SECONDS);
    }
    
    public void addLog(LogEntry logEntry) {
        logQueue.offer(logEntry);
    }
    
    private void processBatch() {
        List<LogEntry> batch = new ArrayList<>();
        logQueue.drainTo(batch, 100); // 批量处理最多100条日志
        
        if (!batch.isEmpty()) {
            // 批量存储日志
            logStorageService.storeLogs(batch);
        }
    }
}

异步处理

采用异步处理避免阻塞主线程：

@Component
public class AsyncLogService {
    
    @Async
    public CompletableFuture<Void> processLogAsync(LogEntry logEntry) {
        return CompletableFuture.runAsync(() -> {
            try {
                // 异步处理日志
                logProcessor.process(logEntry);
                
                // 异步推送日志
                logPushService.pushLog(logEntry.getTaskId(), logEntry);
            } catch (Exception e) {
                log.error("处理日志失败", e);
            }
        });
    }
}

安全与权限控制

确保日志系统的安全性和访问控制。

日志访问控制

实现细粒度的日志访问控制：

@Service
public class LogAccessControlService {
    
    public boolean canAccessLogs(String userId, String taskId) {
        // 检查用户是否有权限访问指定任务的日志
        return taskService.isTaskOwner(userId, taskId) || 
               permissionService.hasPermission(userId, "LOG_VIEW_ALL");
    }
    
    public List<LogEntry> getFilteredLogs(String taskId, String userId, LogFilter filter) {
        // 验证访问权限
        if (!canAccessLogs(userId, taskId)) {
            throw new AccessDeniedException("无权访问日志");
        }
        
        // 应用过滤条件
        return logRepository.findByTaskIdAndFilter(taskId, filter);
    }
}

敏感信息脱敏

对日志中的敏感信息进行脱敏处理：

@Component
public class LogSanitizer {
    
    public LogEntry sanitize(LogEntry logEntry) {
        String message = logEntry.getMessage();
        
        // 脱敏手机号
        message = message.replaceAll("(13[0-9]|14[01456879]|15[0-35-9]|16[2567]|17[0-8]|18[0-9]|19[0-35-9])\\d{4}(\\d{4})", "$1****$2");
        
        // 脱敏邮箱
        message = message.replaceAll("([a-zA-Z0-9._%+-]+)@([a-zA-Z0-9.-]+\\.[a-zA-Z]{2,})", "$1****@$2");
        
        // 脱敏身份证号
        message = message.replaceAll("(\\d{4})\\d{10}(\\d{4})", "$1****$2");
        
        logEntry.setMessage(message);
        return logEntry;
    }
}

监控与告警

建立完善的日志系统监控和告警机制。

系统健康监控

监控日志系统的健康状态：

# 日志系统监控指标
metrics:
  - name: "log_collection_rate"
    description: "日志收集速率"
    type: "gauge"
  
  - name: "log_processing_latency"
    description: "日志处理延迟"
    type: "histogram"
  
  - name: "log_storage_usage"
    description: "日志存储使用率"
    type: "gauge"
  
  - name: "log_push_success_rate"
    description: "日志推送成功率"
    type: "gauge"

异常告警

设置日志异常告警规则：

# 日志异常告警规则
alerts:
  - name: "high_error_rate"
    condition: "rate(log_errors[5m]) > 0.05"
    severity: "warning"
    description: "错误日志比例过高"
  
  - name: "log_collection_failure"
    condition: "rate(log_collection_failures[1m]) > 0"
    severity: "critical"
    description: "日志收集失败"
  
  - name: "log_push_failure"
    condition: "rate(log_push_failures[1m]) > 0"
    severity: "warning"
    description: "日志推送失败"

总结

实时日志收集与推送是现代测试平台不可或缺的重要功能。通过构建完善的日志收集架构，选择合适的技术栈，实现高效的日志推送机制，我们能够为测试平台用户提供实时的反馈信息，为系统运维人员提供强大的问题诊断能力。在实际应用中，我们需要根据具体的业务需求和技术架构，不断优化日志收集和推送方案，确保日志系统能够稳定、高效地运行，为测试平台的可靠性和用户体验提供有力保障。