{ "entropy": 0.4213579764237275, "epoch": 2.0, "mean_token_accuracy": 0.8710838395196039, "num_tokens": 98528536.0, "total_flos": 2.1561577524323942e+18, "train_loss": 0.5024350297862086, "train_runtime": 9862.6956, "train_samples": 48420, "train_samples_per_second": 9.819, "train_steps_per_second": 0.029 }