Training in progress, step 35, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a4f0c0d8d86cef26a072d97f98acadf4578aa0e3357fb39100083acb3e947626
 size 156926880

 version https://git-lfs.github.com/spec/v1
+oid sha256:e100428d4bb7c8b68c8857b4a2310cedb615bd51efa607db4eabb665305889fa
 size 156926880

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3822dcf377fc922f395e85094def75a146277d0f294be9f5d4b05f8fc85d4e95
 size 79968772

 version https://git-lfs.github.com/spec/v1
+oid sha256:759ebfcb6e187fa3ed1d13101a046e93beb51a1eb594e8772ba3f223a922ecf3
 size 79968772

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:15c0eeda3a62034479ea787479fb6c3516b246ee5930ba976a4814c1c12227b2
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:4ca7e8c3dab8c4e7f141e13a8b59074feffd5b4b261d839d2913a26ec3f9e0b1
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d37b0dad6b9c48822da5c83a071d50252502799ad22c4c4907147ad4e4f8e2f4
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:88f387d8c434535a84694e469cebc18f2e722ba31b0dc0372632798b59011377
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.05639097744360902,
   "eval_steps": 5,
-  "global_step": 30,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -133,6 +133,21 @@
       "eval_samples_per_second": 27.908,
       "eval_steps_per_second": 6.977,
       "step": 30
     }
   ],
   "logging_steps": 3,
@@ -152,7 +167,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 5960489175613440.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.06578947368421052,
   "eval_steps": 5,
+  "global_step": 35,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 27.908,
       "eval_steps_per_second": 6.977,
       "step": 30
+    },
+    {
+      "epoch": 0.06203007518796992,
+      "grad_norm": 1.566185712814331,
+      "learning_rate": 3.832773180720475e-05,
+      "loss": 1.5506,
+      "step": 33
+    },
+    {
+      "epoch": 0.06578947368421052,
+      "eval_loss": 1.5798027515411377,
+      "eval_runtime": 16.0818,
+      "eval_samples_per_second": 27.858,
+      "eval_steps_per_second": 6.964,
+      "step": 35
     }
   ],
   "logging_steps": 3,
       "attributes": {}
     }
   },
+  "total_flos": 6953904038215680.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null