File size: 2,528 Bytes
9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee 1066c4c 9e57aee |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 1.3908045977011494,
"global_step": 60,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.23,
"learning_rate": 9.418604651162792e-05,
"loss": 1.9238,
"step": 10
},
{
"epoch": 0.23,
"eval_accuracy": 0.1818181872367859,
"eval_loss": 1.9564208984375,
"eval_runtime": 19.1351,
"eval_samples_per_second": 4.599,
"eval_steps_per_second": 1.15,
"step": 10
},
{
"epoch": 0.46,
"learning_rate": 8.837209302325582e-05,
"loss": 1.9589,
"step": 20
},
{
"epoch": 0.46,
"eval_accuracy": 0.15909090638160706,
"eval_loss": 1.9498623609542847,
"eval_runtime": 21.5957,
"eval_samples_per_second": 4.075,
"eval_steps_per_second": 1.019,
"step": 20
},
{
"epoch": 0.69,
"learning_rate": 8.255813953488373e-05,
"loss": 1.9677,
"step": 30
},
{
"epoch": 0.69,
"eval_accuracy": 0.17045454680919647,
"eval_loss": 1.8762873411178589,
"eval_runtime": 19.1489,
"eval_samples_per_second": 4.596,
"eval_steps_per_second": 1.149,
"step": 30
},
{
"epoch": 0.92,
"learning_rate": 7.674418604651163e-05,
"loss": 1.9357,
"step": 40
},
{
"epoch": 0.92,
"eval_accuracy": 0.21590909361839294,
"eval_loss": 1.8796330690383911,
"eval_runtime": 21.6027,
"eval_samples_per_second": 4.074,
"eval_steps_per_second": 1.018,
"step": 40
},
{
"epoch": 1.16,
"learning_rate": 7.093023255813955e-05,
"loss": 1.9529,
"step": 50
},
{
"epoch": 1.16,
"eval_accuracy": 0.22727273404598236,
"eval_loss": 1.841020107269287,
"eval_runtime": 22.0824,
"eval_samples_per_second": 3.985,
"eval_steps_per_second": 0.996,
"step": 50
},
{
"epoch": 1.39,
"learning_rate": 6.511627906976745e-05,
"loss": 1.8197,
"step": 60
},
{
"epoch": 1.39,
"eval_accuracy": 0.35227271914482117,
"eval_loss": 1.6947021484375,
"eval_runtime": 21.8177,
"eval_samples_per_second": 4.033,
"eval_steps_per_second": 1.008,
"step": 60
}
],
"max_steps": 172,
"num_train_epochs": 4,
"total_flos": 1.7581701250290854e+17,
"trial_name": null,
"trial_params": null
}
|