phi-tiny-moe-math-lean-sft / all_results.json
rkumar1999's picture
Model save
eb73939 verified
{
"entropy": 0.4213579764237275,
"epoch": 2.0,
"mean_token_accuracy": 0.8710838395196039,
"num_tokens": 98528536.0,
"total_flos": 2.1561577524323942e+18,
"train_loss": 0.5024350297862086,
"train_runtime": 9862.6956,
"train_samples": 48420,
"train_samples_per_second": 9.819,
"train_steps_per_second": 0.029
}