{ "entropy": 1.2591145833333333, "epoch": 1.0, "eval_entropy": 1.2470703125, "eval_loss": 0.27956658601760864, "eval_mean_token_accuracy": 0.9408915489912033, "eval_num_tokens": 416460333.0, "eval_runtime": 5.1488, "eval_samples": 1000, "eval_samples_per_second": 87.593, "eval_steps_per_second": 1.554, "mean_token_accuracy": 0.9201805492242178, "num_tokens": 416460333.0, "total_flos": 665167385886720.0, "train_loss": 0.7855377271239742, "train_runtime": 16972.5987, "train_samples": 993477, "train_samples_per_second": 24.303, "train_steps_per_second": 0.19, "weight_norm": 258.9971042309161 }