Files
llmiotsafe/tmp_dpo/train_pairs_fallback_report.json
2026-05-12 17:01:39 +08:00

17 lines
351 B
JSON

{
"split": "train",
"input_root": "data_dpo_v2\\train_pref_v1",
"total_pairs": 2500,
"assembly_counts": {
"chosen_rule_fallback": 2500,
"rejected_constructed_fallback": 2500
},
"strong_answer_summary": {
"label": "strong_answers",
"count": 0
},
"weak_answer_summary": {
"label": "weak_answers",
"count": 0
}
}