Training in progress, step 77, checkpoint

Files changed (4) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fba76b36e590e7e13470a157729235b7d34fd5f65cd77648e42ec57c79892a5d
 size 100198584

 version https://git-lfs.github.com/spec/v1
+oid sha256:0cb0496349c7b965d5745b83667dddba6d9df375bcaa24821f880398882683c0
 size 100198584

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c48dc9c8c4cf094cfe9ca510b0ee6256aee9062c39b4df8bc829e031d6c096d6
 size 50675156

 version https://git-lfs.github.com/spec/v1
+oid sha256:a0888da8e641e6eaedf98307dcd8e2a8af3dfb612ef7f810d4e6ca8bcadf0e4e
 size 50675156

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:46a86174539a86c9c10ef9b72608d49039cdad58e77dd25141a021b27f07e927
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:725ee499aaa0bc04b490ac3af0c734c514c976dd8cd2f204b00fdb43d2a90bf8
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.2030178326474623,
   "eval_steps": 500,
-  "global_step": 74,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -525,6 +525,27 @@
       "learning_rate": 0.000148,
       "loss": 1.1915,
       "step": 74
     }
   ],
   "logging_steps": 1,
@@ -544,7 +565,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 2.1144350488087757e+17,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.2112482853223594,
   "eval_steps": 500,
+  "global_step": 77,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.000148,
       "loss": 1.1915,
       "step": 74
+    },
+    {
+      "epoch": 0.205761316872428,
+      "grad_norm": 0.0682872086763382,
+      "learning_rate": 0.00015000000000000001,
+      "loss": 1.2017,
+      "step": 75
+    },
+    {
+      "epoch": 0.2085048010973937,
+      "grad_norm": 0.07075867056846619,
+      "learning_rate": 0.000152,
+      "loss": 1.1562,
+      "step": 76
+    },
+    {
+      "epoch": 0.2112482853223594,
+      "grad_norm": 0.06364033371210098,
+      "learning_rate": 0.000154,
+      "loss": 1.1936,
+      "step": 77
     }
   ],
   "logging_steps": 1,
       "attributes": {}
     }
   },
+  "total_flos": 2.202346458742948e+17,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null