{
"period": {
"start_date": "2024-01-24T00:00:00Z",
"end_date": "2024-01-30T23:59:59Z"
},
"summary": {
"total_failures": 234,
"failure_rate": 0.013,
"retries_succeeded": 156,
"fallback_succeeded": 67,
"unrecoverable": 11
},
"by_failure_mode": {
"format_violation": {
"count": 89,
"percentage": 0.38,
"affected_models": ["gpt-4o-mini", "claude-haiku-4-5"],
"common_triggers": ["complex JSON structures", "nested arrays"]
},
"refusal": {
"count": 56,
"percentage": 0.24,
"affected_models": ["gpt-4o", "claude-sonnet-4-5"],
"common_triggers": ["policy violations", "ambiguous requests"]
},
"hallucination": {
"count": 34,
"percentage": 0.15,
"affected_models": ["gpt-4o-mini"],
"common_triggers": ["data extraction from noise", "edge cases"]
},
"incomplete": {
"count": 31,
"percentage": 0.13,
"affected_models": ["claude-haiku-4-5"],
"common_triggers": ["max tokens exceeded", "complex outputs"]
},
"reasoning_error": {
"count": 24,
"percentage": 0.10,
"affected_models": ["gpt-4o-mini"],
"common_triggers": ["multi-step logic", "mathematical reasoning"]
}
},
"by_model": {
"gpt-4o-mini": {
"total_calls": 8234,
"failures": 123,
"failure_rate": 0.015,
"top_failure_modes": ["hallucination", "format_violation"]
},
"claude-sonnet-4-5": {
"total_calls": 5678,
"failures": 67,
"failure_rate": 0.012,
"top_failure_modes": ["refusal", "format_violation"]
}
},
"mitigation_recommendations": [
{
"issue": "High format_violation rate for complex JSON",
"recommendation": "Add schema validation to prompts",
"expected_improvement": "40% reduction in format_violation failures"
},
{
"issue": "Hallucinations in data extraction",
"recommendation": "Use claude-haiku-4-5 for structured extraction",
"expected_improvement": "60% reduction in hallucinations"
}
]
}