File size: 1,640 Bytes
95d8c91
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
"""
Incident scenarios for the demo
"""

# Catalogue of canned incident scenarios, keyed by a human-readable title.
#
# Every entry has the same five top-level fields:
#   description      - one-sentence summary of the incident
#   severity         - severity label ("CRITICAL" or "HIGH" in this table)
#   component        - identifier of the affected component
#   metrics          - technical measurements; keys differ per scenario
#   business_impact  - business-side figures; keys differ per scenario
#
# Only "revenue_loss_per_hour" appears in every business_impact mapping, so
# consumers should not assume any other nested key is present.
INCIDENT_SCENARIOS = {
    "Cache Miss Storm": dict(
        description="Redis cluster experiencing 80% cache miss rate causing database overload",
        severity="CRITICAL",
        component="redis_cache",
        metrics=dict(
            cache_hit_rate=18.5,
            database_load=92,
            response_time_ms=1850,
            affected_users=45000,
        ),
        business_impact=dict(
            revenue_loss_per_hour=8500,
            sla_violation=True,
            customer_sat_change=-40,
        ),
    ),
    "Database Connection Pool Exhaustion": dict(
        description="Database connection pool exhausted causing API timeouts",
        severity="HIGH",
        component="database",
        metrics=dict(
            active_connections=98,
            max_connections=100,
            api_latency_ms=2450,
            error_rate=15.2,
        ),
        business_impact=dict(
            revenue_loss_per_hour=4200,
            affected_services=3,
            sla_violation=True,
        ),
    ),
    "Memory Leak in Production": dict(
        description="Java service memory leak causing gradual degradation",
        severity="HIGH",
        component="java_service",
        metrics=dict(
            memory_usage=96,
            gc_pause_time_ms=4500,
            error_rate=28.5,
            restart_frequency_per_hour=12,
        ),
        business_impact=dict(
            revenue_loss_per_hour=5500,
            session_loss=8500,
            support_tickets_increase=300,
        ),
    ),
}