{ "epoch": 10.0, "eval_loss": 3.4622573852539062, "eval_runtime": 2.2596, "eval_samples": 1945, "eval_samples_per_second": 860.769, "eval_steps_per_second": 53.992, "perplexity": 31.888880815596, "total_flos": 1536221652235776.0, "train_loss": 2.5605053229872228, "train_runtime": 388.3929, "train_samples": 9733, "train_samples_per_second": 250.597, "train_steps_per_second": 15.68 }