Spaces:
Sleeping
Sleeping
| { | |
| "report_metadata": { | |
| "generated_at": "2025-06-14T11:34:25.370128", | |
| "total_questions": 20, | |
| "session_directory": "logs/session_20250614_112312", | |
| "report_version": "1.0" | |
| }, | |
| "executive_summary": { | |
| "overall_performance": { | |
| "accuracy": 0.9, | |
| "partial_accuracy": 0.05, | |
| "error_rate": 0.0, | |
| "total_questions": 20 | |
| }, | |
| "classification_performance": { | |
| "best": { | |
| "classification": "general", | |
| "accuracy": 0.9 | |
| }, | |
| "worst": { | |
| "classification": "general", | |
| "accuracy": 0.9 | |
| } | |
| }, | |
| "production_readiness": { | |
| "ready": true, | |
| "accuracy_target": 0.7, | |
| "current_accuracy": 0.9, | |
| "gap_to_target": 0 | |
| }, | |
| "key_findings": [ | |
| "Best performing agent: general (90.0% accuracy)" | |
| ] | |
| }, | |
| "detailed_metrics": { | |
| "by_classification": { | |
| "general": { | |
| "total_questions": 20, | |
| "accuracy": 0.9, | |
| "partial_accuracy": 0.05, | |
| "error_rate": 0.0, | |
| "counts": { | |
| "correct": 18, | |
| "partial": 1, | |
| "incorrect": 1, | |
| "timeout": 0, | |
| "error": 0 | |
| }, | |
| "execution_time": { | |
| "mean": 85.51647197008133, | |
| "median": 47.42774319648743, | |
| "max": 464.02518820762634, | |
| "min": 23.65158772468567 | |
| }, | |
| "complexity": { | |
| "mean": 3, | |
| "distribution": { | |
| "3": 20 | |
| } | |
| }, | |
| "classification_confidence": { | |
| "mean": 0, | |
| "min": 0 | |
| } | |
| } | |
| }, | |
| "processing_time_analysis": { | |
| "mean": 85.51647197008133, | |
| "median": 47.42774319648743, | |
| "max": 464.02518820762634, | |
| "min": 23.65158772468567, | |
| "total_processing_time": 1710.3294394016266 | |
| }, | |
| "tool_effectiveness_ranking": [], | |
| "error_analysis": { | |
| "timeout_count": 0, | |
| "error_count": 0, | |
| "timeout_questions": [], | |
| "error_questions": [], | |
| "error_types": {} | |
| } | |
| }, | |
| "improvement_roadmap": { | |
| "high_priority": [], | |
| "medium_priority": [], | |
| "low_priority": [], | |
| "recommended_sequence": [], | |
| "effort_estimates": { | |
| "high_priority_items": 0, | |
| "estimated_effort": { | |
| "agent_redesign": "0 weeks", | |
| "stability_fixes": "0 days", | |
| "tool_improvements": "0 days", | |
| "performance_optimization": "0 days" | |
| }, | |
| "total_estimated_effort": "0 person-days" | |
| } | |
| }, | |
| "technical_insights": { | |
| "complexity_analysis": { | |
| "3": { | |
| "success_rate": 0.9, | |
| "total_questions": 20 | |
| } | |
| }, | |
| "classification_patterns": { | |
| "high_performers": [ | |
| { | |
| "classification": "general", | |
| "accuracy": 0.9, | |
| "questions": 20 | |
| } | |
| ], | |
| "low_performers": [], | |
| "inconsistent_performers": [] | |
| }, | |
| "tool_patterns": { | |
| "highly_effective_tools": [], | |
| "moderately_effective_tools": [], | |
| "ineffective_tools": [] | |
| }, | |
| "system_limitations": [] | |
| } | |
| } |