{ "epoch": 5.96, "total_flos": 2.0253789729052508e+18, "train_loss": 4.31497132544424, "train_runtime": 1061.9918, "train_samples_per_second": 24.757, "train_steps_per_second": 0.192 }