Training in progress, epoch 4, checkpoint

Files changed (8) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:33ea8293e2ebba1645119b756f24536e47fd3cd2d5ed6d00bbe4dc202448e3fd
 size 97307544

 version https://git-lfs.github.com/spec/v1
+oid sha256:ac3627d6de3069b3e0fdf02b18c77895820c6d900ae7ed20c1d2a0cbf44ecb79
 size 97307544

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:29d04aad36858bf9988b7b2d49a78263db6ef1c2f4c13d8e97709961f0105fa4
 size 49846260

 version https://git-lfs.github.com/spec/v1
+oid sha256:642d842b2bfad90c8e6a93509ba68c4a3c169ceede9ef766f57f6452307e02c1
 size 49846260

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4911704193622166ee1ec426e2f5fd91f07b22078787c2fef6eb75e76ecfcebd
 size 14960

 version https://git-lfs.github.com/spec/v1
+oid sha256:bb8ce3b246ac7b214e8511f0933702c8eef2a192e03552fbd70bb29a15b06b11
 size 14960

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7888e2cd4eccd4158073069db68c90b5a2a705a76d137387387b1327ab01b450
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:9973d48d9bbe51ec0d66d6ad554d481faa409d2b1fb44e0ca5d08c274d21dc20
 size 15024

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d95b812422568710ba718fb8a8d9f5eefb569a379b0b351686aa876aa4e735fd
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:328ffded67cfa6abf4c93f77182952d6956017dd426f6d8589aecffd3c33a7a1
 size 15024

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7b97f3eeaebec80884f44979aea2187cef9f94a36e6bca59ee17aa729de5af80
 size 15024

 version https://git-lfs.github.com/spec/v1
+oid sha256:c29b2f22a894575acde8eee9b3345021e389b523d4b883ec19eaf701b9fb5369
 size 15024

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5797a1f8ad35c151f6fb72a157c600abf1c5b502880ee9b620a878a10eb438e4
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:aea67b5da66f242c315a67190bee42ac01d2c7b5f9d79262964d41c22411bb70
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.6363636363636362,
   "eval_steps": 500,
-  "global_step": 4,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -35,6 +35,13 @@
       "learning_rate": 1.8594235253127375e-05,
       "loss": 0.8338,
       "step": 4
     }
   ],
   "logging_steps": 1,
@@ -49,12 +56,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 3.689192720275866e+16,
   "train_batch_size": 6,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 4.545454545454545,
   "eval_steps": 500,
+  "global_step": 5,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.8594235253127375e-05,
       "loss": 0.8338,
       "step": 4
+    },
+    {
+      "epoch": 4.545454545454545,
+      "grad_norm": 0.25607359409332275,
+      "learning_rate": 1e-05,
+      "loss": 0.8635,
+      "step": 5
     }
   ],
   "logging_steps": 1,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 4.192264440827085e+16,
   "train_batch_size": 6,
   "trial_name": null,
   "trial_params": null