{
  "architectures": [
    "TabStarModel"
  ],
  "batch_size": 32,
  "bert_lr_factor": 1.0,
  "d_model": 384,
  "downstream_mode": null,
  "e5_model": "intfloat/e5-small-v2",
  "is_pretrain": true,
  "lr": 5e-05,
  "macro_batch_size": 128,
  "model_type": "tabstar",
  "num_layers": 6,
  "numbers_fusion": "attention",
  "p_mask": 0,
  "scheduler": "cycle",
  "tabular_encoder_type": "d1",
  "torch_dtype": "float32",
  "transformers_version": "4.49.0",
  "unfreeze_layers": 6,
  "weight_balance": "uniform",
  "weight_decay": 0.001
}