{
"model_type": "isrm-vae",
"architecture": "distilbert-vae",
"architecture_type": "dual-layer",
"base_model": "distilbert-base-uncased",
"latent_dim": 3,
"hidden_dim": 768,
"num_layers": 6,
"num_unfrozen_layers": 2,
"pad_dimensions": [
"pleasure",
"arousal",
"dominance"
],
"bdi_dimensions": [
"belief",
"goal",
"intention",
"ambiguity",
"social"
],
"pad_layer": 10,
"bdi_layer": 19,
"task": "affective-state-encoding",
"training": {
"dataset_size": 1500,
"epochs": 15,
"optimizer": "AdamW",
"learning_rate": 2e-05,
"loss_fn": "MSE + KL divergence",
"kl_weight": 0.001,
"final_mse": 0.018,
"final_kld": 0.003
}
}