This commit is contained in:
玖烛
2025-05-28 11:36:44 +08:00
parent 0d8da53a59
commit d926998c38
2 changed files with 2 additions and 1 deletions

View File

@@ -72,6 +72,7 @@ We have a series of technical articles on the functionalities of EasyDistill.
"per_device_train_batch_size": 1,
"gradient_accumulation_steps": 8,
"save_steps": 1000,
"max_length": 512,
"logging_steps": 1,
"learning_rate": 2e-5,
"weight_decay": 0.05,

View File

@@ -1,4 +1,4 @@
transformers==4.51.0
transformers==4.51.1
transformers-stream-generator==0.0.5
trl==0.17.0
tokenizers==0.21.1