{ "epoch": 3.0, "total_flos": 5.381051647021056e+17, "train_loss": 1.0441436089967426, "train_runtime": 655.2315, "train_samples_per_second": 111.258, "train_steps_per_second": 0.87 }