{ "epoch": 6.0, "eval_loss": null, "eval_runtime": 26.9467, "eval_samples": 177, "eval_samples_per_second": 6.569, "eval_steps_per_second": 6.569, "perplexity": null, "total_flos": 358029585285120.0, "train_loss": 2.4681696535317337, "train_runtime": 44136.3163, "train_samples": 10717, "train_samples_per_second": 1.457, "train_steps_per_second": 1.457 }