Initial commit
Dieser Commit ist enthalten in:
412
utils/performance_monitor.py
Normale Datei
412
utils/performance_monitor.py
Normale Datei
@ -0,0 +1,412 @@
|
||||
"""
|
||||
Performance Monitor - Non-intrusive monitoring for race condition detection
|
||||
Debug-only monitoring without production performance impact
|
||||
"""
|
||||
|
||||
import time
|
||||
import threading
|
||||
import functools
|
||||
import traceback
|
||||
from typing import Dict, Any, Optional, Callable, List
|
||||
from collections import defaultdict, deque
|
||||
from datetime import datetime, timedelta
|
||||
from dataclasses import dataclass, field
|
||||
import logging
|
||||
import json
|
||||
import os
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
|
||||
@dataclass
class OperationMetrics:
    """Metrics captured for a single monitored operation."""

    operation_name: str
    thread_id: int
    thread_name: str
    start_time: float
    end_time: Optional[float] = None
    duration: Optional[float] = None
    success: bool = True
    error_message: Optional[str] = None
    metadata: Dict[str, Any] = field(default_factory=dict)
    stack_trace: Optional[str] = None

    def complete(self, success: bool = True, error_message: Optional[str] = None):
        """Mark the operation as finished and record outcome and duration."""
        finished_at = time.time()
        self.end_time = finished_at
        self.duration = finished_at - self.start_time
        self.success = success
        self.error_message = error_message

    def to_dict(self) -> Dict[str, Any]:
        """Serialize the metrics into a plain dictionary (for JSON export)."""
        payload = {
            'operation_name': self.operation_name,
            'thread_id': self.thread_id,
            'thread_name': self.thread_name,
            'start_time': self.start_time,
            'end_time': self.end_time,
            'duration': self.duration,
            'success': self.success,
            'error_message': self.error_message,
            'metadata': self.metadata,
        }
        # The stack trace itself is omitted; only its presence is reported.
        payload['has_stack_trace'] = self.stack_trace is not None
        return payload
|
||||
|
||||
|
||||
class PerformanceMonitor:
    """
    Performance monitor with race condition detection.

    Monitoring is opt-in (constructor flag or environment variables), so
    production code pays no overhead when it is disabled: decorators return
    the original function untouched.
    """

    def __init__(self, enabled: bool = None, max_history: int = 1000):
        """
        Args:
            enabled: Explicit on/off switch. When None, monitoring is
                auto-enabled if DEBUG_RACE_CONDITIONS or
                PERFORMANCE_MONITORING is set to a truthy value.
            max_history: Maximum number of completed operations to retain.
        """
        # Auto-detect based on debug settings or environment
        if enabled is None:
            enabled = (
                os.getenv('DEBUG_RACE_CONDITIONS', '').lower() in ['true', '1', 'yes'] or
                os.getenv('PERFORMANCE_MONITORING', '').lower() in ['true', '1', 'yes']
            )

        self.enabled = enabled
        self.max_history = max_history

        # Monitoring data
        self._operation_history: deque = deque(maxlen=max_history)
        self._active_operations: Dict[str, OperationMetrics] = {}
        self._operation_stats: Dict[str, Dict[str, Any]] = defaultdict(lambda: {
            'total_calls': 0,
            'successful_calls': 0,
            'failed_calls': 0,
            'total_duration': 0.0,
            'min_duration': float('inf'),
            'max_duration': 0.0,
            'concurrent_executions': 0,
            'max_concurrent': 0
        })

        # Thread safety. RLock because monitored code may nest monitored calls
        # on the same thread.
        self._lock = threading.RLock()

        # Race condition detection
        self._potential_races: List[Dict[str, Any]] = []
        self._long_operations: List[Dict[str, Any]] = []

        # Thresholds
        self.long_operation_threshold = 2.0  # seconds
        self.race_detection_window = 0.1  # seconds

        if self.enabled:
            logger.info("Performance monitoring enabled")

    def monitor_operation(self, operation_name: str, capture_stack: bool = False):
        """
        Decorator factory for operation monitoring.

        Args:
            operation_name: Name used to group statistics. Falls back to the
                decorated function's __name__ when falsy.
            capture_stack: When True, record the call stack at operation start.
        """
        def decorator(func: Callable) -> Callable:
            if not self.enabled:
                return func  # No overhead when disabled

            @functools.wraps(func)
            def wrapper(*args, **kwargs):
                return self._execute_monitored(
                    operation_name or func.__name__,
                    func,
                    capture_stack,
                    *args,
                    **kwargs
                )

            # Expose the unwrapped function and mark the wrapper so callers
            # can detect/bypass monitoring.
            wrapper.original = func
            wrapper.is_monitored = True
            return wrapper

        return decorator

    def _execute_monitored(self, operation_name: str, func: Callable,
                           capture_stack: bool, *args, **kwargs) -> Any:
        """Execute a monitored operation, recording metrics and exceptions."""
        if not self.enabled:
            return func(*args, **kwargs)

        thread_id = threading.current_thread().ident
        thread_name = threading.current_thread().name
        operation_key = f"{operation_name}_{thread_id}_{time.time()}"

        # Create the metrics object.
        # BUGFIX: traceback.format_stack() returns a list of lines; join it so
        # stack_trace matches its Optional[str] annotation.
        metrics = OperationMetrics(
            operation_name=operation_name,
            thread_id=thread_id,
            thread_name=thread_name,
            start_time=time.time(),
            stack_trace=''.join(traceback.format_stack()) if capture_stack else None
        )

        # Race condition detection
        self._detect_potential_race(operation_name, metrics.start_time)

        with self._lock:
            # Concurrent execution tracking
            concurrent_count = sum(
                1 for op in self._active_operations.values()
                if op.operation_name == operation_name
            )

            stats = self._operation_stats[operation_name]
            stats['concurrent_executions'] = concurrent_count
            stats['max_concurrent'] = max(stats['max_concurrent'], concurrent_count)

            # Register as an active operation
            self._active_operations[operation_key] = metrics

        try:
            # Run the wrapped operation
            result = func(*args, **kwargs)

            # Mark success
            metrics.complete(success=True)

            return result

        except Exception as e:
            # Mark failure, then re-raise so callers see the original error
            metrics.complete(success=False, error_message=str(e))
            raise

        finally:
            # Cleanup and statistics update (runs on success and failure)
            with self._lock:
                self._active_operations.pop(operation_key, None)
                self._update_statistics(metrics)
                self._operation_history.append(metrics)

            # Long operation detection
            if metrics.duration and metrics.duration > self.long_operation_threshold:
                self._record_long_operation(metrics)

    def _detect_potential_race(self, operation_name: str, start_time: float):
        """Detect same-named operations starting within the race window."""
        if not self.enabled:
            return

        # Check whether similar operations are running at (nearly) the same time.
        with self._lock:
            concurrent_ops = [
                op for op in self._active_operations.values()
                if (op.operation_name == operation_name and
                    abs(op.start_time - start_time) < self.race_detection_window)
            ]

            if len(concurrent_ops) > 0:
                race_info = {
                    'operation_name': operation_name,
                    'detected_at': start_time,
                    'concurrent_threads': [op.thread_id for op in concurrent_ops],
                    'time_window': self.race_detection_window,
                    'severity': 'high' if len(concurrent_ops) > 2 else 'medium'
                }
                # BUGFIX: append under the lock — the race detector itself
                # must not race on its own list.
                self._potential_races.append(race_info)

        # Log outside the lock to avoid holding it during I/O.
        if concurrent_ops:
            logger.warning(f"Potential race condition detected: {operation_name} "
                           f"running on {len(concurrent_ops)} threads simultaneously")

    def _record_long_operation(self, metrics: OperationMetrics):
        """Record an operation that exceeded the long-operation threshold."""
        long_op_info = {
            'operation_name': metrics.operation_name,
            'duration': metrics.duration,
            'thread_id': metrics.thread_id,
            'start_time': metrics.start_time,
            'success': metrics.success,
            'metadata': metrics.metadata
        }

        self._long_operations.append(long_op_info)

        logger.warning(f"Long operation detected: {metrics.operation_name} "
                       f"took {metrics.duration:.3f}s (threshold: {self.long_operation_threshold}s)")

    def _update_statistics(self, metrics: OperationMetrics):
        """Fold a completed operation into the per-operation statistics.

        Caller must hold self._lock.
        """
        stats = self._operation_stats[metrics.operation_name]

        stats['total_calls'] += 1
        if metrics.success:
            stats['successful_calls'] += 1
        else:
            stats['failed_calls'] += 1

        if metrics.duration:
            stats['total_duration'] += metrics.duration
            stats['min_duration'] = min(stats['min_duration'], metrics.duration)
            stats['max_duration'] = max(stats['max_duration'], metrics.duration)

    def get_statistics(self) -> Dict[str, Any]:
        """Return the complete monitoring statistics as a dictionary."""
        if not self.enabled:
            return {'monitoring_enabled': False}

        with self._lock:
            # Post-process raw counters into derived metrics
            processed_stats = {}
            for op_name, stats in self._operation_stats.items():
                processed_stats[op_name] = {
                    **stats,
                    'average_duration': (
                        stats['total_duration'] / stats['total_calls']
                        if stats['total_calls'] > 0 else 0
                    ),
                    'success_rate': (
                        stats['successful_calls'] / stats['total_calls']
                        if stats['total_calls'] > 0 else 0
                    ),
                    # Report 0 instead of the inf sentinel when nothing ran
                    'min_duration': stats['min_duration'] if stats['min_duration'] != float('inf') else 0
                }

            return {
                'monitoring_enabled': True,
                'operation_statistics': processed_stats,
                'race_conditions': {
                    'detected_count': len(self._potential_races),
                    'recent_races': self._potential_races[-10:],  # Last 10
                },
                'long_operations': {
                    'detected_count': len(self._long_operations),
                    'threshold': self.long_operation_threshold,
                    'recent_long_ops': self._long_operations[-10:],  # Last 10
                },
                'active_operations': len(self._active_operations),
                'history_size': len(self._operation_history),
                'thresholds': {
                    'long_operation_threshold': self.long_operation_threshold,
                    'race_detection_window': self.race_detection_window
                }
            }

    def get_race_condition_report(self) -> Dict[str, Any]:
        """Return a detailed race condition report with per-operation analysis."""
        if not self.enabled:
            return {'monitoring_enabled': False}

        with self._lock:
            # Group race detections by operation name
            races_by_operation = defaultdict(list)
            for race in self._potential_races:
                races_by_operation[race['operation_name']].append(race)

            # Analyze patterns per operation
            analysis = {}
            for op_name, races in races_by_operation.items():
                high_severity = sum(1 for r in races if r['severity'] == 'high')
                analysis[op_name] = {
                    'total_races': len(races),
                    'high_severity_races': high_severity,
                    'affected_threads': len(set(
                        thread_id for race in races
                        for thread_id in race['concurrent_threads']
                    )),
                    'first_detected': min(r['detected_at'] for r in races),
                    'last_detected': max(r['detected_at'] for r in races),
                    'recommendation': self._get_race_recommendation(op_name, races)
                }

            return {
                'monitoring_enabled': True,
                'total_race_conditions': len(self._potential_races),
                'affected_operations': len(races_by_operation),
                'analysis_by_operation': analysis,
                'raw_detections': self._potential_races
            }

    def _get_race_recommendation(self, operation_name: str, races: List[Dict]) -> str:
        """Return a remediation recommendation based on race frequency/severity."""
        race_count = len(races)
        high_severity_count = sum(1 for r in races if r['severity'] == 'high')

        if high_severity_count > 5:
            return f"CRITICAL: {operation_name} has {high_severity_count} high-severity race conditions. Implement ThreadSafetyMixin immediately."
        elif race_count > 10:
            return f"HIGH: {operation_name} frequently encounters race conditions. Consider adding thread synchronization."
        elif race_count > 3:
            return f"MEDIUM: {operation_name} occasionally has race conditions. Monitor and consider thread safety measures."
        else:
            return f"LOW: {operation_name} has minimal race condition risk."

    def export_report(self, filename: Optional[str] = None) -> str:
        """Export the full monitoring report as JSON.

        Returns:
            The filename on success, or an error description string on failure.
        """
        if not self.enabled:
            return "Monitoring not enabled"

        if filename is None:
            timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
            filename = f"performance_report_{timestamp}.json"

        # BUGFIX: snapshot the history under the lock so concurrent
        # completions cannot mutate the deque while it is serialized.
        with self._lock:
            history_snapshot = list(self._operation_history)[-100:]  # Last 100

        report = {
            'timestamp': datetime.now().isoformat(),
            'statistics': self.get_statistics(),
            'race_condition_report': self.get_race_condition_report(),
            'operation_history': [op.to_dict() for op in history_snapshot]
        }

        try:
            with open(filename, 'w', encoding='utf-8') as f:
                json.dump(report, f, indent=2, ensure_ascii=False)

            # BUGFIX: log the actual target path (was a broken placeholder).
            logger.info(f"Performance report exported to: {filename}")
            return filename

        except Exception as e:
            logger.error(f"Failed to export performance report: {e}")
            return f"Export failed: {e}"

    def reset_statistics(self):
        """Reset all collected statistics and detections."""
        with self._lock:
            self._operation_history.clear()
            self._operation_stats.clear()
            self._potential_races.clear()
            self._long_operations.clear()
            # Do not clear active operations - they may still be running

        if self.enabled:
            logger.info("Performance monitoring statistics reset")
|
||||
|
||||
|
||||
# Global Monitor Instance (lazily created singleton)
_global_monitor: Optional[PerformanceMonitor] = None
_monitor_init_lock = threading.RLock()


def get_performance_monitor() -> PerformanceMonitor:
    """Return the global monitor instance (singleton).

    Uses double-checked locking: the unlocked fast path avoids lock
    contention after initialization; the second check inside the lock
    guarantees only one instance is ever created.
    """
    global _global_monitor

    if _global_monitor is None:
        with _monitor_init_lock:
            if _global_monitor is None:
                _global_monitor = PerformanceMonitor()

    return _global_monitor
|
||||
|
||||
|
||||
# Convenience Decorators

def monitor_if_enabled(operation_name: str = None, capture_stack: bool = False):
    """Convenience decorator factory that defers to the global monitor."""
    return get_performance_monitor().monitor_operation(operation_name, capture_stack)
|
||||
|
||||
|
||||
def monitor_race_conditions(operation_name: str = None):
    """Decorator preset for race condition detection (captures stack traces)."""
    return monitor_if_enabled(operation_name=operation_name, capture_stack=True)
|
||||
|
||||
|
||||
def monitor_fingerprint_operations(operation_name: str = None):
    """Decorator preset for fingerprint operations.

    Prefixes the operation name with "fingerprint_" so these operations are
    grouped together in the statistics.

    BUGFIX: with the default operation_name=None the old code produced the
    literal bucket "fingerprint_None" for every unnamed operation, defeating
    the func.__name__ fallback in monitor_operation. Pass None through
    instead so the decorated function's own name is used.
    """
    prefixed = f"fingerprint_{operation_name}" if operation_name is not None else None
    return monitor_if_enabled(prefixed, capture_stack=False)
|
||||
|
||||
|
||||
def monitor_session_operations(operation_name: str = None):
    """Decorator preset for session operations.

    Prefixes the operation name with "session_" so these operations are
    grouped together in the statistics.

    BUGFIX: with the default operation_name=None the old code produced the
    literal bucket "session_None" for every unnamed operation, defeating the
    func.__name__ fallback in monitor_operation. Pass None through instead
    so the decorated function's own name is used.
    """
    prefixed = f"session_{operation_name}" if operation_name is not None else None
    return monitor_if_enabled(prefixed, capture_stack=False)
|
||||
In neuem Issue referenzieren
Einen Benutzer sperren