Training in progress, step 300, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/optimizer.pt +2 -2
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/rng_state_4.pth +1 -1
- last-checkpoint/rng_state_5.pth +1 -1
- last-checkpoint/rng_state_6.pth +1 -1
- last-checkpoint/rng_state_7.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +13 -5
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 157308096
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af13b68fa43378eeb1d9477887e1f4b280a05be96737b5750839609cdd90a6d8
|
3 |
size 157308096
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ab7c0f5a4a81699b122c49904d07e780819ce82f6ed8f06b2193f1320c4453f
|
3 |
+
size 314671226
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15920
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9afbf9b2cc7ffb82e39603ea3e9793624776e974898f71cddb75c50b95a8ff20
|
3 |
size 15920
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15920
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca4fa167ac420fbc12a0b1225ad375db648a55f16b7e4866651104ea0cc00a49
|
3 |
size 15920
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15920
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e799329eb62e1eb372f5e1a106e0710d002dddfe0cb96b7478769d095e752b5f
|
3 |
size 15920
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15920
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:148ecc351dae84aea8cdc86447e26d57a1165551634773232252cd35029fec44
|
3 |
size 15920
|
last-checkpoint/rng_state_4.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15920
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6c737fa9218e50ea3ce9320b640c05dff0f18b8b0409fe5e3f6340fa144ae6f
|
3 |
size 15920
|
last-checkpoint/rng_state_5.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15920
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40fdcad7ba51bcc458150b1d4b2c87d4dee4fcbb7619ccd347b91ff0f61763b2
|
3 |
size 15920
|
last-checkpoint/rng_state_6.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15920
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3d21b509f3e70f8a0fe13164c8b6d889c6ab04755a1218812e3a6427ea94537
|
3 |
size 15920
|
last-checkpoint/rng_state_7.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15920
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1304350d7f8258aaa5c749bd82f5c7ddf08eafecb5eb5f18652eb3f7d1198b19
|
3 |
size 15920
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d0bcc3306c506981564a07ff3b261b32731741ed53940e879827feb4c6814eb
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "evgmaslov/Mistral-Nemo-Instruct-2407-cars/checkpoint-
|
4 |
-
"epoch": 0.
|
5 |
"eval_steps": 100,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -23,6 +23,14 @@
|
|
23 |
"eval_samples_per_second": 6.015,
|
24 |
"eval_steps_per_second": 0.376,
|
25 |
"step": 200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
26 |
}
|
27 |
],
|
28 |
"logging_steps": 500,
|
@@ -42,7 +50,7 @@
|
|
42 |
"attributes": {}
|
43 |
}
|
44 |
},
|
45 |
-
"total_flos":
|
46 |
"train_batch_size": 2,
|
47 |
"trial_name": null,
|
48 |
"trial_params": null
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.05055840685963631,
|
3 |
+
"best_model_checkpoint": "evgmaslov/Mistral-Nemo-Instruct-2407-cars/checkpoint-300",
|
4 |
+
"epoch": 0.37546933667083854,
|
5 |
"eval_steps": 100,
|
6 |
+
"global_step": 300,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
23 |
"eval_samples_per_second": 6.015,
|
24 |
"eval_steps_per_second": 0.376,
|
25 |
"step": 200
|
26 |
+
},
|
27 |
+
{
|
28 |
+
"epoch": 0.37546933667083854,
|
29 |
+
"eval_loss": 0.05055840685963631,
|
30 |
+
"eval_runtime": 5.3195,
|
31 |
+
"eval_samples_per_second": 6.016,
|
32 |
+
"eval_steps_per_second": 0.376,
|
33 |
+
"step": 300
|
34 |
}
|
35 |
],
|
36 |
"logging_steps": 500,
|
|
|
50 |
"attributes": {}
|
51 |
}
|
52 |
},
|
53 |
+
"total_flos": 3.425702422511616e+17,
|
54 |
"train_batch_size": 2,
|
55 |
"trial_name": null,
|
56 |
"trial_params": null
|