{ "batch_size": 4, "accum_iter": 4, "epochs": 200, "warmup_epochs": 0.001, "lr": 2e-05, "min_lr": 0.0, "wd": 0.1, "clip_grad": 4.0, "init_from": "output/Lumina-DiMOO-TI2TI-Finetuning/epoch40", "data_config": "../configs/data.yaml", "cache_ann_on_disk": true, "length_clustering": true, "num_workers": 16, "pin_mem": true, "seed": 42, "output_dir": "output/Lumina-DiMOO-TI2TI-Finetuning_mixed3", "save_interval": 1, "save_iteration_interval": 1000, "only_save_trainable": false, "ckpt_max_keep": 2, "auto_resume": true, "resume_path": null, "model_parallel_size": 1, "data_parallel": "fsdp", "precision": "bf16", "grad_precision": "fp32", "checkpointing": true, "max_seq_len": 5120, "dropout": 0.05, "world_size": 8, "rank": 0, "gpu": 0, "local_rank": 0, "dist_url": "env://", "distributed": true, "dist_backend": "nccl" }