Files
llmiotsafe/results/qwen35_dpo_ultralowmem_ref_free_diag60/summary.json
2026-05-12 17:01:39 +08:00

62 lines
1.2 KiB
JSON

{
"model": "qwen35-dpo",
"api_base": "http://localhost:8001/v1",
"timestamp": "2026-05-07T22:09:21.072639",
"total_evaluated": 60,
"avg_latency_seconds": 54.79,
"api_errors": 0,
"summary": {
"total_episodes": 60,
"detection_accuracy": 0.38333333333333336,
"miss_rate": 0,
"false_alarm_rate": 0.6,
"precision": 0.0,
"recall": 0,
"f1_security": 0,
"threat_type_accuracy": 0,
"parse_failure_rate": 0.06666666666666667,
"breakdown": {
"TP": {
"total": 0,
"correct": 0,
"accuracy": 0
},
"FP": {
"total": 55,
"correct": 21,
"accuracy": 0.38181818181818183
},
"TN": {
"total": 5,
"correct": 2,
"accuracy": 0.4
}
},
"per_sq": {
"SQ1": {
"total": 60,
"accuracy": 0.38333333333333336,
"miss_count": 0,
"false_alarm_count": 36
}
}
},
"errors": {
"total_errors": 37,
"error_distribution": {
"FALSE_ALARM": 35,
"PARSE_FAIL": 2
},
"error_by_sq": {
"SQ1": {
"FALSE_ALARM": 35,
"PARSE_FAIL": 2
},
"SQ2": {},
"SQ3": {},
"SQ4": {},
"SQ5": {}
},
"error_by_category": {}
}
}