VictorSanh
committed on
Commit
•
c604e0f
1
Parent(s):
fd643bd
End of training
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +9 -5
- adapter_config.json +12 -1
- adapter_model.safetensors +2 -2
- global_step1851/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt +3 -0
- global_step1851/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt +3 -0
- global_step1851/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
- global_step1851/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
README.md
CHANGED
@@ -33,14 +33,18 @@ More information needed
|
|
33 |
### Training hyperparameters
|
34 |
|
35 |
The following hyperparameters were used during training:
|
36 |
-
- learning_rate: 0.
|
37 |
- train_batch_size: 2
|
38 |
- eval_batch_size: 8
|
39 |
- seed: 42
|
|
|
|
|
|
|
|
|
40 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
41 |
- lr_scheduler_type: linear
|
42 |
-
- lr_scheduler_warmup_steps:
|
43 |
-
- num_epochs:
|
44 |
|
45 |
### Training results
|
46 |
|
@@ -48,8 +52,8 @@ The following hyperparameters were used during training:
|
|
48 |
|
49 |
### Framework versions
|
50 |
|
51 |
-
- PEFT 0.
|
52 |
- Transformers 4.41.0.dev0
|
53 |
-
- Pytorch 2.1
|
54 |
- Datasets 2.14.7
|
55 |
- Tokenizers 0.19.1
|
|
|
33 |
### Training hyperparameters
|
34 |
|
35 |
The following hyperparameters were used during training:
|
36 |
+
- learning_rate: 0.0001
|
37 |
- train_batch_size: 2
|
38 |
- eval_batch_size: 8
|
39 |
- seed: 42
|
40 |
+
- distributed_type: multi-GPU
|
41 |
+
- num_devices: 32
|
42 |
+
- total_train_batch_size: 64
|
43 |
+
- total_eval_batch_size: 256
|
44 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
45 |
- lr_scheduler_type: linear
|
46 |
+
- lr_scheduler_warmup_steps: 150
|
47 |
+
- num_epochs: 3
|
48 |
|
49 |
### Training results
|
50 |
|
|
|
52 |
|
53 |
### Framework versions
|
54 |
|
55 |
+
- PEFT 0.8.2
|
56 |
- Transformers 4.41.0.dev0
|
57 |
+
- Pytorch 2.0.1+cu118
|
58 |
- Datasets 2.14.7
|
59 |
- Tokenizers 0.19.1
|
adapter_config.json
CHANGED
@@ -21,7 +21,18 @@
|
|
21 |
"r": 8,
|
22 |
"rank_pattern": {},
|
23 |
"revision": null,
|
24 |
-
"target_modules":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
25 |
"task_type": null,
|
26 |
"use_dora": true,
|
27 |
"use_rslora": false
|
|
|
21 |
"r": 8,
|
22 |
"rank_pattern": {},
|
23 |
"revision": null,
|
24 |
+
"target_modules": [
|
25 |
+
"fc1",
|
26 |
+
"down_proj",
|
27 |
+
"v_proj",
|
28 |
+
"fc2",
|
29 |
+
"q_proj",
|
30 |
+
"gate_proj",
|
31 |
+
"up_proj",
|
32 |
+
"k_proj",
|
33 |
+
"out_proj",
|
34 |
+
"o_proj"
|
35 |
+
],
|
36 |
"task_type": null,
|
37 |
"use_dora": true,
|
38 |
"use_rslora": false
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e44ce263e6fd885f50d82ca515b9325375b43ee36ededb75acf161ce88bc2e41
|
3 |
+
size 48
|
global_step1851/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:025b1cd5afbca8d38f5c47b3cfa0228d14de98d80bf3d7dd5e7eb3792c25f2bd
|
3 |
+
size 11065655
|
global_step1851/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d952918d209940accbb6b6760be3aeaff64ea5f48b9013ce3b02dc088eae41f
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b48e6c001144fecc9cf24d6c0234aaa8f57cbb6546fb301452e3183a44c3641
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f41afe7b754464fa6f66f38795a12471f2e8797aec0226deb2f58be8b5bf83d2
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f19db86359349ad86ed7bc9fa2ac6785d527c213c5060d30573aa725a60f3c08
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5270cb7c4b931ba77e4ae3179412d47b28d319b4c9e3007368bc63919eed4f02
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2986af12f9b1e5b1635139fbf4a19c5fe7eb2d34650d78879a887af731ae0edc
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffb257e34930ba938b49a5890a8454cb3267493523c68badfb3e8caa3afa0984
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30b14cc55558232a05c86540694a3306d830228bfb73ada754159eab17530ccb
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bc88792755a9da0da4e14d653531861fdd73db813b681f5782ec1d1a4b4fbbb
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1ccfee04a1de5af9afc9bf807e491ae6fa445afc90d08f2478c5c23668ada51
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ac4aae4488ba4c5323e8d76bb0d80f94103fc7d1d4fb43f3518976865b3ee76
|
3 |
+
size 11065655
|
global_step1851/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d21f3d8ca5a232578f84f269ec2411b9eb2b49f87d60a6c5e3b753c832df4afb
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f07f1c42880fa800c5c5014d57bad92bb104337262d4be0048f9945442bf9df3
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99cac8d7f6437d6a2ae851c0404ba1f45b672ba92302b71c6c4a5534f7e3c9eb
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e12cd939152eac3931f1d1718ffc59378cbdf8173831e63d4c30d338b5560ca
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b214204ac9205421e0da3948f11bd9fe3c7fd39f91ec1be34d37701802444dc4
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3c3f9a89d26fa299bcf0f43ebc82958ce6b1bbae886b10a167d41c8edbe3e3d
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d557f242ecefbd95d1e660b8f5657abbbdb80ff8187f641c64780e1ae387841
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebb17752213250f062cab0d3a0668fc2c267071bfa8ff63947dfa3bb19e5953c
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6555304629e1a3d37cefe0b2220e0d2f2d780e1a96ea1f280f0f2b13396f4e33
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc525ebc87c1f7aa58d60a510d2aa0ab9518d5c8bf6233caa3d14555e78417e5
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:920f2e69684990176b3380c873136767031d3c5b72ca3f2daee75ad1875fecc0
|
3 |
+
size 11065655
|
global_step1851/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4baed8cbc04198e4e73835a48a65a53f4edc654b3a24b1c73b3f5d8624e4174a
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a23982b6bc7a206a97855ce54f5d6ad0c568f6a055d2663d88687228bda7d6bd
|
3 |
+
size 11065661
|
global_step1851/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90b5f73da5763d8bd618db0dbad365aad25216bc27f8afae03ee4660096112dd
|
3 |
+
size 11065655
|
global_step1851/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16bcf9ac0b62036551b8acbc9db9b3c1eb0358b58319bc6b976223b0c6243457
|
3 |
+
size 11065655
|
global_step1851/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80c3f3b0535b060821b883c728f18955902716d2718d5e741ffd223bf002d8a6
|
3 |
+
size 11065655
|
global_step1851/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bf8b9e5f6e87e3f78eb6202c28bb3c559e66a83f3f51b1b57242c738e7e3282
|
3 |
+
size 11065655
|
global_step1851/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6838931b32868aae01141d6f194e8302bf8d9a84ca685302d59280ab58466e4f
|
3 |
+
size 11065655
|
global_step1851/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a56344a10b279fadb8d0d141b60209e77c02449e61f154b329f29716691c32d2
|
3 |
+
size 11065655
|
global_step1851/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76827fa3b7dad13afd552e09d03fe62c1aa41a48f7d55e9b170a50cafa6b4ec4
|
3 |
+
size 11065655
|
global_step1851/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c93b3877dd23615af54355e8c7c39550729cec91b78fde54ea0ef6a4a3fee65b
|
3 |
+
size 526932687
|
global_step1851/zero_pp_rank_10_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d51aa79247167cab6c12bc19d50868cf6e463b2777ce76651c461044e0bc46b
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_11_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce906b0d6b350a48c983d1ce236c363ae0823a4c8d71f9cfaee7883b191be4d4
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_12_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bec42fd58898de452f3986ca86f2f05eacb3ed429e8e4b48b79f59626707180d
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_13_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9521594521b888df18bc98094ae9d6d12e620f63587ca9ad94141b25b0e2f80
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_14_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db95b3cc74d30eb5fa45d5e7e6b8b02d64719fa34afe27b597ff84a3becd9be8
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_15_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eab529ea20ced93e80dca7ecab4c69a05e748341f0259daaf863895a288f1e83
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_16_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f7f1a538fdd8f7665cc455c03bdd8f6c1b8bb15062048f748ceba7f3e99dd53
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_17_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc00c0885cdddde76db513e739f58456e95a255fe0a9d4f009463079ed0b102e
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_18_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d73143ba31897864028bc99357fb7b6432573df23106a13f343bb971ee88ff9
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_19_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d05a6d71b9bb4d67a0941daf6834d79d8f7ad7d77cdd0fa9f5c58aec902f9d01
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abd26f545bbaf53db05106c2d762f978c218701550b8742c63fd6569097fca55
|
3 |
+
size 526932687
|
global_step1851/zero_pp_rank_20_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f69acd690339f4e607dc2ed0be2f448a55cd6b14f0ec223d7fcb37bc2e8edcfd
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_21_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48a5abec20e07c4989d51c3b011a577aea82c3d56a50ac65eb1f534e40350060
|
3 |
+
size 526935445
|
global_step1851/zero_pp_rank_22_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d09274d1752934484470667d48d5b5738b7ca64408882b1550526fcbfc9daa5
|
3 |
+
size 526935445
|