rakhman-llm commited on
Commit
71eee4b
1 Parent(s): 79e05fd

Training in progress, step 15462, checkpoint

Browse files
Files changed (1) hide show
  1. last-checkpoint/trainer_state.json +45 -45
last-checkpoint/trainer_state.json CHANGED
@@ -25,9 +25,9 @@
25
  {
26
  "epoch": 0.19402405898331393,
27
  "eval_loss": 1.1814582347869873,
28
- "eval_runtime": 49.4809,
29
- "eval_samples_per_second": 104.747,
30
- "eval_steps_per_second": 3.274,
31
  "step": 1000
32
  },
33
  {
@@ -47,9 +47,9 @@
47
  {
48
  "epoch": 0.38804811796662786,
49
  "eval_loss": 1.1394085884094238,
50
- "eval_runtime": 49.4813,
51
- "eval_samples_per_second": 104.747,
52
- "eval_steps_per_second": 3.274,
53
  "step": 2000
54
  },
55
  {
@@ -69,9 +69,9 @@
69
  {
70
  "epoch": 0.5820721769499418,
71
  "eval_loss": 1.1180071830749512,
72
- "eval_runtime": 49.4875,
73
- "eval_samples_per_second": 104.733,
74
- "eval_steps_per_second": 3.274,
75
  "step": 3000
76
  },
77
  {
@@ -91,9 +91,9 @@
91
  {
92
  "epoch": 0.7760962359332557,
93
  "eval_loss": 1.1015874147415161,
94
- "eval_runtime": 49.4673,
95
- "eval_samples_per_second": 104.776,
96
- "eval_steps_per_second": 3.275,
97
  "step": 4000
98
  },
99
  {
@@ -113,9 +113,9 @@
113
  {
114
  "epoch": 0.9701202949165697,
115
  "eval_loss": 1.091620922088623,
116
- "eval_runtime": 49.4696,
117
- "eval_samples_per_second": 104.771,
118
- "eval_steps_per_second": 3.275,
119
  "step": 5000
120
  },
121
  {
@@ -135,9 +135,9 @@
135
  {
136
  "epoch": 1.1641443538998835,
137
  "eval_loss": 1.0831941366195679,
138
- "eval_runtime": 49.4837,
139
- "eval_samples_per_second": 104.742,
140
- "eval_steps_per_second": 3.274,
141
  "step": 6000
142
  },
143
  {
@@ -157,9 +157,9 @@
157
  {
158
  "epoch": 1.3581684128831975,
159
  "eval_loss": 1.0764732360839844,
160
- "eval_runtime": 49.4861,
161
- "eval_samples_per_second": 104.736,
162
- "eval_steps_per_second": 3.274,
163
  "step": 7000
164
  },
165
  {
@@ -179,9 +179,9 @@
179
  {
180
  "epoch": 1.5521924718665114,
181
  "eval_loss": 1.07025945186615,
182
- "eval_runtime": 49.4895,
183
- "eval_samples_per_second": 104.729,
184
- "eval_steps_per_second": 3.273,
185
  "step": 8000
186
  },
187
  {
@@ -201,9 +201,9 @@
201
  {
202
  "epoch": 1.7462165308498254,
203
  "eval_loss": 1.0663487911224365,
204
- "eval_runtime": 49.4879,
205
- "eval_samples_per_second": 104.733,
206
- "eval_steps_per_second": 3.274,
207
  "step": 9000
208
  },
209
  {
@@ -223,9 +223,9 @@
223
  {
224
  "epoch": 1.9402405898331394,
225
  "eval_loss": 1.0637460947036743,
226
- "eval_runtime": 49.4829,
227
- "eval_samples_per_second": 104.743,
228
- "eval_steps_per_second": 3.274,
229
  "step": 10000
230
  },
231
  {
@@ -245,9 +245,9 @@
245
  {
246
  "epoch": 2.1342646488164534,
247
  "eval_loss": 1.0619136095046997,
248
- "eval_runtime": 49.4906,
249
- "eval_samples_per_second": 104.727,
250
- "eval_steps_per_second": 3.273,
251
  "step": 11000
252
  },
253
  {
@@ -267,9 +267,9 @@
267
  {
268
  "epoch": 2.328288707799767,
269
  "eval_loss": 1.0580228567123413,
270
- "eval_runtime": 49.4724,
271
- "eval_samples_per_second": 104.765,
272
- "eval_steps_per_second": 3.275,
273
  "step": 12000
274
  },
275
  {
@@ -289,9 +289,9 @@
289
  {
290
  "epoch": 2.522312766783081,
291
  "eval_loss": 1.0561449527740479,
292
- "eval_runtime": 49.4628,
293
- "eval_samples_per_second": 104.786,
294
- "eval_steps_per_second": 3.275,
295
  "step": 13000
296
  },
297
  {
@@ -311,9 +311,9 @@
311
  {
312
  "epoch": 2.716336825766395,
313
  "eval_loss": 1.0557653903961182,
314
- "eval_runtime": 49.4704,
315
- "eval_samples_per_second": 104.77,
316
- "eval_steps_per_second": 3.275,
317
  "step": 14000
318
  },
319
  {
@@ -333,9 +333,9 @@
333
  {
334
  "epoch": 2.910360884749709,
335
  "eval_loss": 1.054747223854065,
336
- "eval_runtime": 49.4705,
337
- "eval_samples_per_second": 104.769,
338
- "eval_steps_per_second": 3.275,
339
  "step": 15000
340
  }
341
  ],
 
25
  {
26
  "epoch": 0.19402405898331393,
27
  "eval_loss": 1.1814582347869873,
28
+ "eval_runtime": 49.6691,
29
+ "eval_samples_per_second": 104.351,
30
+ "eval_steps_per_second": 3.262,
31
  "step": 1000
32
  },
33
  {
 
47
  {
48
  "epoch": 0.38804811796662786,
49
  "eval_loss": 1.1394085884094238,
50
+ "eval_runtime": 49.6277,
51
+ "eval_samples_per_second": 104.438,
52
+ "eval_steps_per_second": 3.264,
53
  "step": 2000
54
  },
55
  {
 
69
  {
70
  "epoch": 0.5820721769499418,
71
  "eval_loss": 1.1180071830749512,
72
+ "eval_runtime": 49.6817,
73
+ "eval_samples_per_second": 104.324,
74
+ "eval_steps_per_second": 3.261,
75
  "step": 3000
76
  },
77
  {
 
91
  {
92
  "epoch": 0.7760962359332557,
93
  "eval_loss": 1.1015874147415161,
94
+ "eval_runtime": 49.6378,
95
+ "eval_samples_per_second": 104.416,
96
+ "eval_steps_per_second": 3.264,
97
  "step": 4000
98
  },
99
  {
 
113
  {
114
  "epoch": 0.9701202949165697,
115
  "eval_loss": 1.091620922088623,
116
+ "eval_runtime": 49.6213,
117
+ "eval_samples_per_second": 104.451,
118
+ "eval_steps_per_second": 3.265,
119
  "step": 5000
120
  },
121
  {
 
135
  {
136
  "epoch": 1.1641443538998835,
137
  "eval_loss": 1.0831941366195679,
138
+ "eval_runtime": 49.6774,
139
+ "eval_samples_per_second": 104.333,
140
+ "eval_steps_per_second": 3.261,
141
  "step": 6000
142
  },
143
  {
 
157
  {
158
  "epoch": 1.3581684128831975,
159
  "eval_loss": 1.0764732360839844,
160
+ "eval_runtime": 49.6981,
161
+ "eval_samples_per_second": 104.29,
162
+ "eval_steps_per_second": 3.26,
163
  "step": 7000
164
  },
165
  {
 
179
  {
180
  "epoch": 1.5521924718665114,
181
  "eval_loss": 1.07025945186615,
182
+ "eval_runtime": 49.6881,
183
+ "eval_samples_per_second": 104.311,
184
+ "eval_steps_per_second": 3.26,
185
  "step": 8000
186
  },
187
  {
 
201
  {
202
  "epoch": 1.7462165308498254,
203
  "eval_loss": 1.0663487911224365,
204
+ "eval_runtime": 49.6731,
205
+ "eval_samples_per_second": 104.342,
206
+ "eval_steps_per_second": 3.261,
207
  "step": 9000
208
  },
209
  {
 
223
  {
224
  "epoch": 1.9402405898331394,
225
  "eval_loss": 1.0637460947036743,
226
+ "eval_runtime": 49.672,
227
+ "eval_samples_per_second": 104.344,
228
+ "eval_steps_per_second": 3.261,
229
  "step": 10000
230
  },
231
  {
 
245
  {
246
  "epoch": 2.1342646488164534,
247
  "eval_loss": 1.0619136095046997,
248
+ "eval_runtime": 49.6813,
249
+ "eval_samples_per_second": 104.325,
250
+ "eval_steps_per_second": 3.261,
251
  "step": 11000
252
  },
253
  {
 
267
  {
268
  "epoch": 2.328288707799767,
269
  "eval_loss": 1.0580228567123413,
270
+ "eval_runtime": 49.6253,
271
+ "eval_samples_per_second": 104.443,
272
+ "eval_steps_per_second": 3.264,
273
  "step": 12000
274
  },
275
  {
 
289
  {
290
  "epoch": 2.522312766783081,
291
  "eval_loss": 1.0561449527740479,
292
+ "eval_runtime": 49.663,
293
+ "eval_samples_per_second": 104.363,
294
+ "eval_steps_per_second": 3.262,
295
  "step": 13000
296
  },
297
  {
 
311
  {
312
  "epoch": 2.716336825766395,
313
  "eval_loss": 1.0557653903961182,
314
+ "eval_runtime": 49.6516,
315
+ "eval_samples_per_second": 104.387,
316
+ "eval_steps_per_second": 3.263,
317
  "step": 14000
318
  },
319
  {
 
333
  {
334
  "epoch": 2.910360884749709,
335
  "eval_loss": 1.054747223854065,
336
+ "eval_runtime": 49.5431,
337
+ "eval_samples_per_second": 104.616,
338
+ "eval_steps_per_second": 3.27,
339
  "step": 15000
340
  }
341
  ],