File size: 2,528 Bytes
9e57aee
 
 
1066c4c
 
9e57aee
 
 
 
 
1066c4c
 
 
9e57aee
 
 
1066c4c
 
 
 
 
 
9e57aee
 
 
1066c4c
 
 
9e57aee
 
 
1066c4c
 
 
 
 
 
9e57aee
 
 
1066c4c
 
 
9e57aee
 
 
1066c4c
 
 
 
 
 
9e57aee
 
 
1066c4c
 
 
9e57aee
 
 
1066c4c
 
 
 
 
 
9e57aee
 
 
1066c4c
 
 
9e57aee
 
 
1066c4c
 
 
 
 
 
9e57aee
 
 
1066c4c
 
 
9e57aee
 
 
1066c4c
 
 
 
 
 
9e57aee
 
 
1066c4c
 
 
9e57aee
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 1.3908045977011494,
  "global_step": 60,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.23,
      "learning_rate": 9.418604651162792e-05,
      "loss": 1.9238,
      "step": 10
    },
    {
      "epoch": 0.23,
      "eval_accuracy": 0.1818181872367859,
      "eval_loss": 1.9564208984375,
      "eval_runtime": 19.1351,
      "eval_samples_per_second": 4.599,
      "eval_steps_per_second": 1.15,
      "step": 10
    },
    {
      "epoch": 0.46,
      "learning_rate": 8.837209302325582e-05,
      "loss": 1.9589,
      "step": 20
    },
    {
      "epoch": 0.46,
      "eval_accuracy": 0.15909090638160706,
      "eval_loss": 1.9498623609542847,
      "eval_runtime": 21.5957,
      "eval_samples_per_second": 4.075,
      "eval_steps_per_second": 1.019,
      "step": 20
    },
    {
      "epoch": 0.69,
      "learning_rate": 8.255813953488373e-05,
      "loss": 1.9677,
      "step": 30
    },
    {
      "epoch": 0.69,
      "eval_accuracy": 0.17045454680919647,
      "eval_loss": 1.8762873411178589,
      "eval_runtime": 19.1489,
      "eval_samples_per_second": 4.596,
      "eval_steps_per_second": 1.149,
      "step": 30
    },
    {
      "epoch": 0.92,
      "learning_rate": 7.674418604651163e-05,
      "loss": 1.9357,
      "step": 40
    },
    {
      "epoch": 0.92,
      "eval_accuracy": 0.21590909361839294,
      "eval_loss": 1.8796330690383911,
      "eval_runtime": 21.6027,
      "eval_samples_per_second": 4.074,
      "eval_steps_per_second": 1.018,
      "step": 40
    },
    {
      "epoch": 1.16,
      "learning_rate": 7.093023255813955e-05,
      "loss": 1.9529,
      "step": 50
    },
    {
      "epoch": 1.16,
      "eval_accuracy": 0.22727273404598236,
      "eval_loss": 1.841020107269287,
      "eval_runtime": 22.0824,
      "eval_samples_per_second": 3.985,
      "eval_steps_per_second": 0.996,
      "step": 50
    },
    {
      "epoch": 1.39,
      "learning_rate": 6.511627906976745e-05,
      "loss": 1.8197,
      "step": 60
    },
    {
      "epoch": 1.39,
      "eval_accuracy": 0.35227271914482117,
      "eval_loss": 1.6947021484375,
      "eval_runtime": 21.8177,
      "eval_samples_per_second": 4.033,
      "eval_steps_per_second": 1.008,
      "step": 60
    }
  ],
  "max_steps": 172,
  "num_train_epochs": 4,
  "total_flos": 1.7581701250290854e+17,
  "trial_name": null,
  "trial_params": null
}