{
  "num_samples_train": 16643,
  "world_size": 1,
  "effective_batch_size": 8,
  "steps_per_epoch": 2081,
  "save_steps": 693,
  "saves_per_epoch": 3,
  "total_steps_est": 6243,
  "approx_ckpts": 10,
  "target_modules": [
    "q_proj",
    "k_proj",
    "v_proj",
    "o_proj"
  ],
  "lora_r": 16,
  "lora_alpha": 32,
  "lora_dropout": 0.05,
  "response_template": "<|start_header_id|>assistant<|end_header_id|>",
  "use_max_len": 2560,
  "label_all_assistant": true,
  "skip_tool_only_assistant": false,
  "assistant_tag": "<|start_header_id|>assistant<|end_header_id|>",
  "tool_use_token": "<|use_tool|>"
}