{ "epoch": 6.0, "eval_loss": 1.8202452659606934, "eval_runtime": 245.6979, "eval_samples": 1788, "eval_samples_per_second": 7.277, "eval_steps_per_second": 7.277, "perplexity": 6.173372382325986, "total_flos": 815647319654400.0, "train_loss": 1.8342725714209487, "train_runtime": 100493.137, "train_samples": 24415, "train_samples_per_second": 1.458, "train_steps_per_second": 1.458 }