jasmeeetsingh commited on
Commit
c99c202
1 Parent(s): f96ce9d

Training in progress, step 3000, checkpoint

Browse files
last-checkpoint/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90c26c9d06a857c490bef2859c8d9f1a0df37d5078b3e76552e968745a76cdbb
3
  size 8970189
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da1cbe447f27f1838e8a3a4ba8302e4d8d976346b15ee6f1136786e98b394d93
3
  size 8970189
last-checkpoint/global_step3000/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65d2c17ea78ecdbdd84dcb5f4a124f13cf024c24d7a6240f894f9819a0533fc5
3
+ size 7759329147
last-checkpoint/global_step3000/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b69a387a9b8d458508c6ace3e508c8297d1fe155d5107569a40e1a5c3ce41ac3
3
+ size 13335934
last-checkpoint/global_step3000/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41525d9f268025a34b25f008223b081e3ffa2a05c7598f72aa95b3f4f01ae2a5
3
+ size 7759329083
last-checkpoint/global_step3000/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:917832de0a4a336a973ef97e8c51977da1b954b9d3357322eb0cc2579a8796cc
3
+ size 13335934
last-checkpoint/global_step3000/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9f915bbc3e211cc307a3f6e74be947895da6a115b2dd65f99a7c5b520acf964
3
+ size 7759329083
last-checkpoint/global_step3000/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f33e2c55894e94abd96ff61f174f9fd7ea02e9772bb1c6a476a40ae5b8a3459
3
+ size 13335934
last-checkpoint/global_step3000/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa63ff62eca3690ecc5b6d93cdf9ccd2a3d4fbc974350a056af880d4f46ae1ea
3
+ size 7759329083
last-checkpoint/global_step3000/zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9b200211cc8db0a98d1dee6a4ac63c3638e224e1e4e33e1887f8fcdaf0e28f2
3
+ size 13335934
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step2000
 
1
+ global_step3000
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f36f3108739132271885035e5faf177e77e529c599274b592066cfd46847f09
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ad5c18e0204ef6122ea3f403ea10fd74e71251302fb20ee72972df1617b8b41
3
  size 17655
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52c562c02b52d9091784791fd63a8de14c04f388fc95bf7cfc96a06c0d535229
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e839a832de9abea85f961777181743f876cb830aba916358b29bec0afd58bed
3
  size 17655
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:854590c01dfe34d93f0fa12d48d05e5d5bcb7605ecd3692ab90d1341b4528c3b
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57219858a72145c49bcfe75287fcacf1a98cb31ab42e9b504c552f4c3d2e517f
3
  size 17655
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f023641060de0ce868c668d29989cc44bffe8e1bb9aea8330ec656170354cf64
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3776db9e505779d6fc4f1b27ffc245809ec06fd0bdf7ccb144630a66b1e545ab
3
  size 17655
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.7818608287724785,
5
  "eval_steps": 500,
6
- "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -19,13 +19,19 @@
19
  "learning_rate": 1e-05,
20
  "loss": 0.7436,
21
  "step": 2000
 
 
 
 
 
 
22
  }
23
  ],
24
  "logging_steps": 1000,
25
  "max_steps": 7674,
26
  "num_train_epochs": 3,
27
  "save_steps": 1000,
28
- "total_flos": 27337888366592.0,
29
  "trial_name": null,
30
  "trial_params": null
31
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.1727912431587177,
5
  "eval_steps": 500,
6
+ "global_step": 3000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
19
  "learning_rate": 1e-05,
20
  "loss": 0.7436,
21
  "step": 2000
22
+ },
23
+ {
24
+ "epoch": 1.17,
25
+ "learning_rate": 1e-05,
26
+ "loss": 0.7002,
27
+ "step": 3000
28
  }
29
  ],
30
  "logging_steps": 1000,
31
  "max_steps": 7674,
32
  "num_train_epochs": 3,
33
  "save_steps": 1000,
34
+ "total_flos": 41011800702976.0,
35
  "trial_name": null,
36
  "trial_params": null
37
  }