evgmaslov commited on
Commit
332b172
1 Parent(s): c2f260c

Training in progress, step 300, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24f82954ad3814c1f6ed93e8408a170671cca2dc4fa9032ddf5b248a7742cfa1
3
  size 157308096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af13b68fa43378eeb1d9477887e1f4b280a05be96737b5750839609cdd90a6d8
3
  size 157308096
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b984a0be79f86161305d301a06191b369cef1b5655520bf65f5395387448abec
3
- size 314671098
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ab7c0f5a4a81699b122c49904d07e780819ce82f6ed8f06b2193f1320c4453f
3
+ size 314671226
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f0f83458f7c9f12052de248fd5909300c5c52d396aed861ce1fd8edc5fef56c
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9afbf9b2cc7ffb82e39603ea3e9793624776e974898f71cddb75c50b95a8ff20
3
  size 15920
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81ca9fda20a3de2994a219637972c54487fa75f056392a78be59c68d2abb1d90
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca4fa167ac420fbc12a0b1225ad375db648a55f16b7e4866651104ea0cc00a49
3
  size 15920
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:065123427c993e64d893467b3ad76bcd70b24cf5e4b4c4ec9e1fb962712019ca
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e799329eb62e1eb372f5e1a106e0710d002dddfe0cb96b7478769d095e752b5f
3
  size 15920
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4de644fb25d0d8fe55597cbdbc5a66de50ec97a4729760c9bb1de3ad8d9c65fb
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:148ecc351dae84aea8cdc86447e26d57a1165551634773232252cd35029fec44
3
  size 15920
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eefef284b9424cec6c28323321e1ff9ee61f8ce10e5420e294134670022eb5e2
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6c737fa9218e50ea3ce9320b640c05dff0f18b8b0409fe5e3f6340fa144ae6f
3
  size 15920
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f19e59de787eca7935663eb49b221916b3d3997a51b43803a7f9ffc6655ca497
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40fdcad7ba51bcc458150b1d4b2c87d4dee4fcbb7619ccd347b91ff0f61763b2
3
  size 15920
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd6fc8a12ffae29eb1afd35a51f6ddbb40e09461bd500a089b3c64f8b7f03bff
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3d21b509f3e70f8a0fe13164c8b6d889c6ab04755a1218812e3a6427ea94537
3
  size 15920
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:669eea3e7eb6a2264ee496eb3023b358361935d64b4be016844c9341d0d16d75
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1304350d7f8258aaa5c749bd82f5c7ddf08eafecb5eb5f18652eb3f7d1198b19
3
  size 15920
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffeb5abb4ae2d8ef1270c7764dbf7f7fc55d16002d5dabc5eb812fa241ecb11c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d0bcc3306c506981564a07ff3b261b32731741ed53940e879827feb4c6814eb
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.05197252705693245,
3
- "best_model_checkpoint": "evgmaslov/Mistral-Nemo-Instruct-2407-cars/checkpoint-200",
4
- "epoch": 0.2503128911138924,
5
  "eval_steps": 100,
6
- "global_step": 200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -23,6 +23,14 @@
23
  "eval_samples_per_second": 6.015,
24
  "eval_steps_per_second": 0.376,
25
  "step": 200
 
 
 
 
 
 
 
 
26
  }
27
  ],
28
  "logging_steps": 500,
@@ -42,7 +50,7 @@
42
  "attributes": {}
43
  }
44
  },
45
- "total_flos": 2.283801615007744e+17,
46
  "train_batch_size": 2,
47
  "trial_name": null,
48
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.05055840685963631,
3
+ "best_model_checkpoint": "evgmaslov/Mistral-Nemo-Instruct-2407-cars/checkpoint-300",
4
+ "epoch": 0.37546933667083854,
5
  "eval_steps": 100,
6
+ "global_step": 300,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
23
  "eval_samples_per_second": 6.015,
24
  "eval_steps_per_second": 0.376,
25
  "step": 200
26
+ },
27
+ {
28
+ "epoch": 0.37546933667083854,
29
+ "eval_loss": 0.05055840685963631,
30
+ "eval_runtime": 5.3195,
31
+ "eval_samples_per_second": 6.016,
32
+ "eval_steps_per_second": 0.376,
33
+ "step": 300
34
  }
35
  ],
36
  "logging_steps": 500,
 
50
  "attributes": {}
51
  }
52
  },
53
+ "total_flos": 3.425702422511616e+17,
54
  "train_batch_size": 2,
55
  "trial_name": null,
56
  "trial_params": null