{ "epoch": 4.997878659312685, "eval_loss": 1.3836458921432495, "eval_runtime": 52.7263, "eval_samples_per_second": 7.226, "eval_steps_per_second": 0.91, "perplexity": 3.989420140492546, "total_flos": 4951537335926784.0, "train_loss": 1.2631714882389191, "train_runtime": 59759.6565, "train_samples_per_second": 3.155, "train_steps_per_second": 0.099 }