{ "epoch": 0.9999149532682873, "eval_accuracy": 0.5874091441969519, "eval_loss": 1.9824198484420776, "eval_runtime": 86.7224, "eval_samples": 400, "eval_samples_per_second": 4.612, "eval_steps_per_second": 1.153, "perplexity": 7.26029054814878, "total_flos": 6.861219031857234e+18, "train_loss": 2.0199434388696393, "train_runtime": 95478.6823, "train_samples": 1363955, "train_samples_per_second": 14.285, "train_steps_per_second": 0.112 }