Training in progress, step 2280, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d2b4eb6ede7bd8c2e85cb9ea4c87d64a24d61b9f82ee9dfeae0b3261cfc9de2b
 size 389074464

 version https://git-lfs.github.com/spec/v1
+oid sha256:d130ac47ed7ae141798c2d67da12d00f8f7b9ea7cf027d56de55b3b8590b2850
 size 389074464

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:90e30c4c34c5a744f7c50eb890eb88d5238a3d95f2d028ce06e1b000482edf08
 size 198011700

 version https://git-lfs.github.com/spec/v1
+oid sha256:c6252331758a1f9b1131927a72d62a3faf0c8dc2d5aab8bd8ebeb638a0536413
 size 198011700

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e8b606578427f8c7c5a0703c9ea80297d5709e9484a7eb99f421fd211c612d5
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:5b26bb65679d1fbe119ff115522738907e642e45677820751547812f1ce25739
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.8966725043782837,
   "eval_steps": 500,
-  "global_step": 2166,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -140,6 +140,13 @@
       "learning_rate": 4.06948109058927e-05,
       "loss": 0.7776,
       "step": 2166
     }
   ],
   "logging_steps": 114,
@@ -159,7 +166,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 1.2350737508775322e+17,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.9964973730297724,
   "eval_steps": 500,
+  "global_step": 2280,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 4.06948109058927e-05,
       "loss": 0.7776,
       "step": 2166
+    },
+    {
+      "epoch": 1.9964973730297724,
+      "grad_norm": 0.636738657951355,
+      "learning_rate": 4.019349164467898e-05,
+      "loss": 0.8015,
+      "step": 2280
     }
   ],
   "logging_steps": 114,
       "attributes": {}
     }
   },
+  "total_flos": 1.2959469426231091e+17,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null