{
    "epoch": 2.995008319467554,
    "eval_accuracy": 0.6798516302478071,
    "eval_loss": 0.9872721433639526,
    "eval_runtime": 33.1054,
    "eval_samples": 921,
    "eval_samples_per_second": 27.82,
    "eval_steps_per_second": 13.925,
    "perplexity": 2.683903174445662,
    "total_flos": 2.324441285315789e+16,
    "train_loss": 0.5607477950608288,
    "train_runtime": 2259.369,
    "train_samples": 7211,
    "train_samples_per_second": 9.575,
    "train_steps_per_second": 0.598
}