{ "epoch": 4.95, "total_flos": 3.4409368031831654e+17, "train_loss": 0.6955731582641601, "train_runtime": 190.8065, "train_samples_per_second": 23.217, "train_steps_per_second": 1.441 }