evgmaslov commited on
Commit
97b9945
1 Parent(s): 44e88f5

Training in progress, step 200, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:feec9c2fc880157fdf1af2bfa44f9ed2d221e96023c2d55f086262fb9a2f2c9f
3
  size 157308096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24f82954ad3814c1f6ed93e8408a170671cca2dc4fa9032ddf5b248a7742cfa1
3
  size 157308096
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08f0e2ba49e5fc6242ec0b63d665c32ccde3ba3a985a8bf138513ccdfdc0a055
3
  size 314671098
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b984a0be79f86161305d301a06191b369cef1b5655520bf65f5395387448abec
3
  size 314671098
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51dee332d2275cc0831c1ea0d0b5b2263457ff95fff00680e5043e944b844a04
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f0f83458f7c9f12052de248fd5909300c5c52d396aed861ce1fd8edc5fef56c
3
  size 15920
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9dd41ef4ed5f7287caff4fbd63c7a8fe2bdaf897c1e0d8462e29234862b1d008
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81ca9fda20a3de2994a219637972c54487fa75f056392a78be59c68d2abb1d90
3
  size 15920
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38f9352bf4c207908a2139b5f9b00e28565f619c4bf592f8d44d4fd7bab9e233
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:065123427c993e64d893467b3ad76bcd70b24cf5e4b4c4ec9e1fb962712019ca
3
  size 15920
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f65483c1d522a1cffd17408a379086fe58926f97fc8b98bbf33ca6096fedbaa
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4de644fb25d0d8fe55597cbdbc5a66de50ec97a4729760c9bb1de3ad8d9c65fb
3
  size 15920
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7cde8693d11e7616878cf88486a40f4b06a4e1c5183cede7db3bc7feed749431
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eefef284b9424cec6c28323321e1ff9ee61f8ce10e5420e294134670022eb5e2
3
  size 15920
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72d0344dcf2d5f0e04a15864a370633a27e082c0bc3a6fc6cb92b047029e94ee
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f19e59de787eca7935663eb49b221916b3d3997a51b43803a7f9ffc6655ca497
3
  size 15920
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4a6ce273116b22c7e48d400c7fad4266b453a25f35bdb6ff40b8fd387c52039
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd6fc8a12ffae29eb1afd35a51f6ddbb40e09461bd500a089b3c64f8b7f03bff
3
  size 15920
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:721c7edddc274b916092408fb1b3bd5030be85a6bdb989ce16a729345640c7ab
3
  size 15920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:669eea3e7eb6a2264ee496eb3023b358361935d64b4be016844c9341d0d16d75
3
  size 15920
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbaba77b7ae8890f2b70278aac610a39d4e81d78f312f9f6ab0d92ef1151e3b7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffeb5abb4ae2d8ef1270c7764dbf7f7fc55d16002d5dabc5eb812fa241ecb11c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.05901213735342026,
3
- "best_model_checkpoint": "evgmaslov/Mistral-Nemo-Instruct-2407-cars/checkpoint-100",
4
- "epoch": 0.1251564455569462,
5
  "eval_steps": 100,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -15,6 +15,14 @@
15
  "eval_samples_per_second": 6.008,
16
  "eval_steps_per_second": 0.375,
17
  "step": 100
 
 
 
 
 
 
 
 
18
  }
19
  ],
20
  "logging_steps": 500,
@@ -34,7 +42,7 @@
34
  "attributes": {}
35
  }
36
  },
37
- "total_flos": 1.141900807503872e+17,
38
  "train_batch_size": 2,
39
  "trial_name": null,
40
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.05197252705693245,
3
+ "best_model_checkpoint": "evgmaslov/Mistral-Nemo-Instruct-2407-cars/checkpoint-200",
4
+ "epoch": 0.2503128911138924,
5
  "eval_steps": 100,
6
+ "global_step": 200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
15
  "eval_samples_per_second": 6.008,
16
  "eval_steps_per_second": 0.375,
17
  "step": 100
18
+ },
19
+ {
20
+ "epoch": 0.2503128911138924,
21
+ "eval_loss": 0.05197252705693245,
22
+ "eval_runtime": 5.3201,
23
+ "eval_samples_per_second": 6.015,
24
+ "eval_steps_per_second": 0.376,
25
+ "step": 200
26
  }
27
  ],
28
  "logging_steps": 500,
 
42
  "attributes": {}
43
  }
44
  },
45
+ "total_flos": 2.283801615007744e+17,
46
  "train_batch_size": 2,
47
  "trial_name": null,
48
  "trial_params": null