Training in progress, step 25000

Browse files

Files changed (11) hide show

config.json +1 -1
last-checkpoint/config.json +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +71 -3
last-checkpoint/training_args.bin +1 -1
pytorch_model.bin +1 -1
training_args.bin +1 -1

config.json CHANGED Viewed

@@ -18,7 +18,7 @@
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "layer_norm_eps": 1e-12,
-  "mask_ratio": 0.25,
   "model_type": "pixel",
   "norm_pix_loss": true,
   "num_attention_heads": 12,

   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "layer_norm_eps": 1e-12,
+  "mask_ratio": 0.29,
   "model_type": "pixel",
   "norm_pix_loss": true,
   "num_attention_heads": 12,

last-checkpoint/config.json CHANGED Viewed

@@ -18,7 +18,7 @@
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "layer_norm_eps": 1e-12,
-  "mask_ratio": 0.25,
   "model_type": "pixel",
   "norm_pix_loss": true,
   "num_attention_heads": 12,

   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "layer_norm_eps": 1e-12,
+  "mask_ratio": 0.29,
   "model_type": "pixel",
   "norm_pix_loss": true,
   "num_attention_heads": 12,

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:227bb459455ca9395e8701d0b76fa538ae5551af488261f8a6c040d98a6dded3
 size 893438545

 version https://git-lfs.github.com/spec/v1
+oid sha256:54511fdc5c5a7b0e9e913352b7c70eeb4be98b664939b4420d74be15aa007937
 size 893438545

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9ee7451dd5ec81a01259d5968e23ec645d0c3962b135c90aa707004f25bc4403
 size 449471589

 version https://git-lfs.github.com/spec/v1
+oid sha256:ef06c37b1b2de2e7bc399a7b91f0e41a8e27ec304f4ab7843f18254e5ab425e3
 size 449471589

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cc90007b132e8f26a3d447fb1e8dee59d5ce3dfd07c853ec26d9c159e851307d
 size 15459

 version https://git-lfs.github.com/spec/v1
+oid sha256:7c7b0cc71c51ef5f7a78f816541ca99e7efff8df2315723a0c94e1b16e8f0771
 size 15459

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:56d7925c4d371c4e7cd499e68da31588c0a08bf1a905f213b26db017a95291f6
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:cb6982c29cd162f49aeb531674acf574eccd46a8f556bec596040d7c3b95200a
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a6464ca3b88e496d5d945a7955ac6cabd3c94f9611fe337e2e8a9af945aa679a
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:66cad2ac81d79f6484466213369fcababfbacc00f3cf3a8946126f6ba258bade
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.8705493166187864,
-  "global_step": 20000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -278,11 +278,79 @@
       "eval_samples_per_second": 52.619,
       "eval_steps_per_second": 0.831,
       "step": 20000
     }
   ],
   "max_steps": 100000,
   "num_train_epochs": 9,
-  "total_flos": 9.419722694590464e+20,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.4352746583093932,
+  "global_step": 25000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 52.619,
       "eval_steps_per_second": 0.831,
       "step": 20000
+    },
+    {
+      "epoch": 1.04,
+      "learning_rate": 9.169394796092694e-05,
+      "loss": 0.4465,
+      "step": 20500
+    },
+    {
+      "epoch": 1.09,
+      "learning_rate": 9.126149821203012e-05,
+      "loss": 0.444,
+      "step": 21000
+    },
+    {
+      "epoch": 1.13,
+      "learning_rate": 9.082019786191564e-05,
+      "loss": 0.4435,
+      "step": 21500
+    },
+    {
+      "epoch": 1.17,
+      "learning_rate": 9.037106452976014e-05,
+      "loss": 0.4422,
+      "step": 22000
+    },
+    {
+      "epoch": 1.22,
+      "learning_rate": 8.991240893598493e-05,
+      "loss": 0.4446,
+      "step": 22500
+    },
+    {
+      "epoch": 1.26,
+      "learning_rate": 8.944523560858406e-05,
+      "loss": 0.4418,
+      "step": 23000
+    },
+    {
+      "epoch": 1.3,
+      "learning_rate": 8.89696598155856e-05,
+      "loss": 0.4412,
+      "step": 23500
+    },
+    {
+      "epoch": 1.35,
+      "learning_rate": 8.848579889820028e-05,
+      "loss": 0.4414,
+      "step": 24000
+    },
+    {
+      "epoch": 1.39,
+      "learning_rate": 8.799377224186928e-05,
+      "loss": 0.4407,
+      "step": 24500
+    },
+    {
+      "epoch": 1.44,
+      "learning_rate": 8.749470933536528e-05,
+      "loss": 0.4402,
+      "step": 25000
+    },
+    {
+      "epoch": 1.44,
+      "eval_loss": 0.42174017429351807,
+      "eval_runtime": 91.5901,
+      "eval_samples_per_second": 54.591,
+      "eval_steps_per_second": 0.863,
+      "step": 25000
     }
   ],
   "max_steps": 100000,
   "num_train_epochs": 9,
+  "total_flos": 1.177465336823808e+21,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fb90956c2fc47703463b50fd267631dda0878fd140ff91c80ab2b7c4fc6e5708
 size 5615

 version https://git-lfs.github.com/spec/v1
+oid sha256:da26d9c8c1c726588ec3b1e697e00057dd4bc580fad19e58afb508d1a16ec382
 size 5615

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9ee7451dd5ec81a01259d5968e23ec645d0c3962b135c90aa707004f25bc4403
 size 449471589

 version https://git-lfs.github.com/spec/v1
+oid sha256:ef06c37b1b2de2e7bc399a7b91f0e41a8e27ec304f4ab7843f18254e5ab425e3
 size 449471589

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fb90956c2fc47703463b50fd267631dda0878fd140ff91c80ab2b7c4fc6e5708
 size 5615

 version https://git-lfs.github.com/spec/v1
+oid sha256:da26d9c8c1c726588ec3b1e697e00057dd4bc580fad19e58afb508d1a16ec382
 size 5615