{
  "epoch": 1.0,
  "eval_loss": 0.13376566767692566,
  "eval_runtime": 45.0014,
  "eval_samples": 2500,
  "eval_samples_per_second": 55.554,
  "eval_steps_per_second": 6.955,
  "num_input_tokens_seen": 56941616,
  "total_flos": 2.067540416810189e+16,
  "train_loss": 0.19179043090820314,
  "train_runtime": 4730.669,
  "train_samples": 100000,
  "train_samples_per_second": 21.139,
  "train_steps_per_second": 10.569,
  "train_tokens_per_second": 12036.694
}