ivnle's picture
Upload folder using huggingface_hub
b66dc55 verified
{
"regime": "meanpool",
"data_path": "data/training/splits_510k/train_arrow",
"output_dir": "outputs/production_meanpool_w4_s4_reconstruction_20251115_011352_lm_20251128_123730",
"objective": "lm",
"val_data_path": "data/training/splits_510k/val_arrow",
"max_samples": null,
"vision_mode": "small",
"text_context_tokens": null,
"hybrid_text_tokens": 0,
"vision_prompt": null,
"train_encoder": false,
"encoder_lr": 1e-05,
"compression_window_size": 4,
"compression_stride": 4,
"subsample_strategy": "regular",
"subsample_count": null,
"projection_dim": null,
"train_projection": false,
"compression_target": null,
"conv_kernel": 5,
"timestamp": null,
"batch_size": 12,
"gradient_accumulation_steps": 4,
"learning_rate": 0.0001,
"weight_decay": 0.01,
"num_epochs": 1,
"warmup_ratio": 0.1,
"max_grad_norm": 1.0,
"log_steps": 10,
"save_steps": 0,
"eval_steps": 500,
"initial_validation": true,
"validation_only": false,
"no_checkpoints": false,
"num_qualitative_samples": 5,
"max_generation_tokens": 200,
"use_wandb": true,
"wandb_project": "vision-compression-2",
"wandb_run_name": null,
"resume_from_checkpoint": null,
"resume": null,
"init_from_checkpoint": "./outputs/production_meanpool_w4_s4_reconstruction_20251115_011352/best_checkpoint.pt",
"allow_objective_switch": true,
"aux_loss_weight": 0.5,
"num_workers": 8,
"prefetch_factor": 64,
"seed": null,
"eval_seed": 42,
"debug_log_sample_ids": false,
"device": "cuda",
"compile": false,
"compile_mode": "default",
"use_optimized_model": true,
"use_encoder_checkpointing": true,
"use_decoder_checkpointing": true,
"use_8bit_optimizer": true
}