Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/mp_rank_00_model_states.pt +3 -0
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/latest +3 -0
- checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/zero_to_fp32.py +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/mp_rank_00_model_states.pt +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/latest +3 -0
- checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/zero_to_fp32.py +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/mp_rank_00_model_states.pt +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/latest +3 -0
- checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/zero_to_fp32.py +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/mp_rank_00_model_states.pt +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/latest +3 -0
- checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/zero_to_fp32.py +3 -0
- checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bcd5d1be4eef090f25107320bdc3fa45b0b49de4aa932c10101ecbf8e909fc2
|
3 |
+
size 10570070620
|
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f6bf8328543f213865d2e8e3e1bb3fdd8a265a04a1481281f124ec81bfe479a
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f75f4fb108ec829abf2bfaaf794e1fbcc46e4d81dcd73d6a6410e51c3e46788
|
3 |
+
size 10570070620
|
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9482ed426a1450f27282964cb0f01100a576d247113b61b3e97f86e1e2d8fcf5
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e982fd709bf79f0a9cf2e8b31920d55684fca9cd2e51c27190fbde533de19a22
|
3 |
+
size 10570070748
|
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2809a7ddac3b3ce9e29dbf5c255fc50f36f674438b50f400158ff1a4b8cf07a2
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1c23c9d0ec7fb7f407d540ce769597c583952c41efe961406f061919d63c475
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d88b079ca7d9ddf65b649b7d3a9a7c02a4401f76af13f2a1b7543cac1531448
|
3 |
+
size 10570070428
|
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/checkpoint/mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e8265ce197916dfa690de7b0cd270c18914ee9baadf3cc000bd992ee88c47f8
|
3 |
+
size 15142167290
|
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/latest
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47320987f9a49d5b00119b960f247a956773f57543982b8bfcb6da5bb3afd9ef
|
3 |
+
size 10
|
checkpoints/epoch=1-step=38-train_total_step=0.35786.ckpt/zero_to_fp32.py
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92dcd9cc03d6010b4d060b73c8826d71ff9e29a030154e9f192e34ad80457f3a
|
3 |
+
size 29219
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b8500b3023771afba20a264cb6ca23e731137a167c45707b7a7202b47fd33e4
|
3 |
+
size 10570070620
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7760e744ac17ea940dc47bd1664669b391bbb480967b1c135c92ca129e133462
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c72ce2b43aef6723e0a87d44d4c2175d3d9cf4356c9dcf48dbe9b736a8b420a5
|
3 |
+
size 10570070620
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7f2590fee04f9f3349b7fd3dfb76abbe4087e1a724c541f3651fbe5e3ffc45e
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:109bd401bd3a5909cdd8a1aaa09621d65f689464789eeb38fced8e42eb43bd6f
|
3 |
+
size 10570070748
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae23f5a7c636e9db5b90b20bb65d4c21336079d971642217223d8239d07c30cd
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bd01377da6314c1d67534034bcfdcaa39e395353637fe262ec24f534179c1ff
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bc66859f10acba5ae0f2a2d138cd6b9926265842607f7ac0859297e63ee4324
|
3 |
+
size 10570070428
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/checkpoint/mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df64ca27b1ddf7146e7e1e8c1c7084985e87f1b6da001a0ad95ad33c617b1cb4
|
3 |
+
size 15142167290
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/latest
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47320987f9a49d5b00119b960f247a956773f57543982b8bfcb6da5bb3afd9ef
|
3 |
+
size 10
|
checkpoints/epoch=1-step=43-train_total_step=0.31789.ckpt/zero_to_fp32.py
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92dcd9cc03d6010b4d060b73c8826d71ff9e29a030154e9f192e34ad80457f3a
|
3 |
+
size 29219
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:501577397d945219e1308d30038d42b8de0a677b25ac25e5e2e403b80fe19c7b
|
3 |
+
size 10570070620
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd629c05478f096223d9fa65b5ca358d230b40e84818645d9231605453d55ec4
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66a07adc1c481e072830051041682643afc6d64cfb57f0b7a8e59fdf0f6ee29b
|
3 |
+
size 10570070620
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:829a1e30c609431936aabc3d924132109499b0b8624e15241c0ae54bf9cbd125
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f349ebd3da49e26f9cddfb2a10f67e115875e74424d991fc903e65db50ebf955
|
3 |
+
size 10570070748
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e3ce540ab06e73ba7e08adc57a0fe9064114696c273645eadc4cfa900281419
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67710470cb06bdf52eaff528107a0b1fa6a07ce00bd818bb98bb4a558849532a
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7a98d767a177caa7903e2c349d993e9f751312173f8b20c9be8685ad4622b1c
|
3 |
+
size 10570070428
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/checkpoint/mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:846d6636b7e849b04851bd30ce6708acd989c347200746e78780b824dda4e4a4
|
3 |
+
size 15142167290
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/latest
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47320987f9a49d5b00119b960f247a956773f57543982b8bfcb6da5bb3afd9ef
|
3 |
+
size 10
|
checkpoints/epoch=1-step=48-train_total_step=0.19104.ckpt/zero_to_fp32.py
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92dcd9cc03d6010b4d060b73c8826d71ff9e29a030154e9f192e34ad80457f3a
|
3 |
+
size 29219
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:046a98a6fce1f8dc7713d8c0cea09ea0fcf17b1cf0a814e78f0c94e1aad9f732
|
3 |
+
size 10570070620
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a01d81d560c5d9080abe2bc5106d5f17f6f84f08418859f9899d2671865b177d
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb888db1d15c96b30ebe1d6c54613ff409f987b24150ad5e91bd8d1b65f78572
|
3 |
+
size 10570070620
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:562213605019906235631ccf47fdcc10b76237b580854ec3f6b73abbbf9b8d73
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d2d9c62d7c11941aa1d0de0e4e5df96871599ac8247e4221f45f8299ef489ac
|
3 |
+
size 10570070748
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f87e0d58c2406bbc72e7434ae0735cf687eb1e34fdf5b02d90f7594a809ebb5
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc0c8ba476ce7cb1b14afb7affb789b853827585d433ba216cae1a2ce58e32ff
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48490d0473c39dfcd4e9f0dbefafabf2724691089ea97a2996469fa0e8b2d60d
|
3 |
+
size 10570070428
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/checkpoint/mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47251f8ae80b3ece6e5959d6b8d6067e23aebcf3c13e4461a5bb886e1be7c599
|
3 |
+
size 15142167290
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/latest
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47320987f9a49d5b00119b960f247a956773f57543982b8bfcb6da5bb3afd9ef
|
3 |
+
size 10
|
checkpoints/epoch=1-step=53-train_total_step=0.12526.ckpt/zero_to_fp32.py
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92dcd9cc03d6010b4d060b73c8826d71ff9e29a030154e9f192e34ad80457f3a
|
3 |
+
size 29219
|
checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf9eef68dd8f571e506f6b65061898a762158980bcb0957d06b54dfc95b18e65
|
3 |
+
size 10570070620
|
checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8a26e307e8ffbfaf759e7f2c02a960cac8012dc5431802fa54ca5814394a659
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63e9b005d6ef3f42160bc89f2b57e8519163679f14d3175be80c3d67652d2f41
|
3 |
+
size 10570070620
|
checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe3275e4902e1df091d59fc5bb8ef15acf6c77f2e306f31d82953aadf2ae3b64
|
3 |
+
size 10570070556
|
checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e65e49e1d422c8dbb1c4a3bbb5918750b828907467a5571c7360d483fb2f08d8
|
3 |
+
size 10570070748
|
checkpoints/epoch=1-step=56-val_total_epoch=0.13236.ckpt/checkpoint/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe77a514da26ceb4317cae3146482181c1ed292148a0ea387c2666a924e727c3
|
3 |
+
size 10570070556
|