{ "model": "qwen35-dpo", "api_base": "http://localhost:8001/v1", "timestamp": "2026-05-07T22:09:21.072639", "total_evaluated": 60, "avg_latency_seconds": 54.79, "api_errors": 0, "summary": { "total_episodes": 60, "detection_accuracy": 0.38333333333333336, "miss_rate": 0, "false_alarm_rate": 0.6, "precision": 0.0, "recall": 0, "f1_security": 0, "threat_type_accuracy": 0, "parse_failure_rate": 0.06666666666666667, "breakdown": { "TP": { "total": 0, "correct": 0, "accuracy": 0 }, "FP": { "total": 55, "correct": 21, "accuracy": 0.38181818181818183 }, "TN": { "total": 5, "correct": 2, "accuracy": 0.4 } }, "per_sq": { "SQ1": { "total": 60, "accuracy": 0.38333333333333336, "miss_count": 0, "false_alarm_count": 36 } } }, "errors": { "total_errors": 37, "error_distribution": { "FALSE_ALARM": 35, "PARSE_FAIL": 2 }, "error_by_sq": { "SQ1": { "FALSE_ALARM": 35, "PARSE_FAIL": 2 }, "SQ2": {}, "SQ3": {}, "SQ4": {}, "SQ5": {} }, "error_by_category": {} } }