From f8727a45eeebd22029b4ce5f400fbaa0417874cd Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E7=8E=96=E7=83=9B?= Date: Mon, 9 Jun 2025 16:57:41 +0800 Subject: [PATCH] fix white box max length mismatch --- configs/kd_white_box.json | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/configs/kd_white_box.json b/configs/kd_white_box.json index 9cb13c8..ba53df3 100644 --- a/configs/kd_white_box.json +++ b/configs/kd_white_box.json @@ -19,7 +19,7 @@ "top_logits_num": 10 }, "distillation": { - "kd_ratio": 0.5, + "kd_ratio": 0.1, "max_seq_length": 512, "distillation_type": "forward_kld" }, @@ -32,6 +32,7 @@ "num_train_epochs": 3, "per_device_train_batch_size": 1, "gradient_accumulation_steps": 8, + "max_length":512, "save_steps": 1000, "logging_steps": 1, "learning_rate": 2e-5,