diff --git a/configs/mmkd_black_box_api.json b/configs/mmkd_black_box_api.json new file mode 100644 index 0000000..ab59577 --- /dev/null +++ b/configs/mmkd_black_box_api.json @@ -0,0 +1,30 @@ +{ + "job_type": "mmkd_black_box_api", + "dataset": { + "instruction_path": "data/mllm_demo.json", + "labeled_path": "data/mllm_demo_distill.json", + "seed": 42 + }, + "inference":{ + "base_url": "ENDPOINT", + "api_key": "TOKEN", + "system_prompt" : "You are a helpful assistant.", + "max_new_tokens": 512 + }, + "models": { + "student": "student/Qwen/Qwen2.5-VL-3B-Instruct/" + }, + "training": { + "output_dir": "./result/", + "num_train_epochs": 3, + "per_device_train_batch_size": 1, + "gradient_accumulation_steps": 8, + "max_length": 512, + "save_steps": 1000, + "logging_steps": 1, + "learning_rate": 2e-5, + "weight_decay": 0.05, + "warmup_ratio": 0.1, + "lr_scheduler_type": "cosine" + } +} \ No newline at end of file