| { | |
| "epoch": 2.995008319467554, | |
| "eval_accuracy": 0.6477501136495986, | |
| "eval_loss": 2.9963440895080566, | |
| "eval_runtime": 49.7886, | |
| "eval_samples": 921, | |
| "eval_samples_per_second": 18.498, | |
| "eval_steps_per_second": 9.259, | |
| "perplexity": 20.012240063032426, | |
| "total_flos": 2.6245163088714138e+17, | |
| "train_loss": 3.7161494956193146, | |
| "train_runtime": 2214.8433, | |
| "train_samples": 7211, | |
| "train_samples_per_second": 9.767, | |
| "train_steps_per_second": 0.61 | |
| } |