{ "epoch": 1.14, "eval_loss": 2.2956442832946777, "eval_runtime": 3135.1617, "eval_samples_per_second": 159.481, "eval_steps_per_second": 4.984, "perplexity": 9.930832220881081, "train_loss": 2.669982685546875, "train_runtime": 65951.2344, "train_samples_per_second": 97.041, "train_steps_per_second": 0.758 }