{
  "job_type": "kd_black_box_api",
  "dataset": {
    "labeled_path": "distil_qwen_thoughtX.json",
    "template": "chat_template_kd.jinja",
    "seed": 42
  },
  "models": {
    "student": "model/Qwen/Qwen2.5-1.5B-Instruct/"
  },
  "training": {
    "output_dir": "result/",
    "num_train_epochs": 3,
    "per_device_train_batch_size": 1,
    "gradient_accumulation_steps": 8,
    "max_length": 4096,
    "save_steps": 1000,
    "logging_steps": 1,
    "learning_rate": 2e-5,
    "weight_decay": 0.05,
    "warmup_ratio": 0.1,
    "lr_scheduler_type": "cosine"
  }
}