{
  "epoch": 2.995008319467554,
  "eval_accuracy": 0.6457728521567662,
  "eval_loss": 3.2508158683776855,
  "eval_runtime": 31.6071,
  "eval_samples": 921,
  "eval_samples_per_second": 29.139,
  "eval_steps_per_second": 14.585,
  "perplexity": 25.81139002587262,
  "total_flos": 6.970992786879283e+16,
  "train_loss": 3.9628717678564565,
  "train_runtime": 1531.0104,
  "train_samples": 7211,
  "train_samples_per_second": 14.13,
  "train_steps_per_second": 0.882
}