Theoreticallyhugo commited on
Commit
8f22474
·
verified ·
1 Parent(s): 6c0bf65

Training in progress, epoch 12, checkpoint

Browse files
checkpoint-492/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:32e0f3665e357e9850bfc04afc3d109586a5d95f0f76c4fe44df576d2f7da2f4
3
  size 592324828
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a6646aa66b3a94c59ffa3908580c116e3110b578a9fc325fbdb06c314dbffa3
3
  size 592324828
checkpoint-492/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ecb58cde0bfaec47430ba557738e4a5126a730fb6abce4c1cb3e59c810cb209
3
  size 1014657786
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7372ad8507f8cf9652f5a5281e6d3d7b033168a3ac3e05254ce8fbc9ab3ea257
3
  size 1014657786
checkpoint-492/trainer_state.json CHANGED
@@ -11,540 +11,540 @@
11
  {
12
  "epoch": 1.0,
13
  "eval_Claim": {
14
- "f1-score": 0.3472626289341444,
15
- "precision": 0.3978787878787879,
16
- "recall": 0.3080713280150164,
17
- "support": 4262.0
18
  },
19
  "eval_MajorClaim": {
20
- "f1-score": 0.5334239746204397,
21
- "precision": 0.5235765124555161,
22
- "recall": 0.54364896073903,
23
- "support": 2165.0
24
  },
25
  "eval_O": {
26
- "f1-score": 0.8390533194223273,
27
- "precision": 0.9157377442167086,
28
- "recall": 0.7742197000405351,
29
- "support": 9868.0
30
  },
31
  "eval_Premise": {
32
- "f1-score": 0.8562600940945159,
33
- "precision": 0.7896134170821731,
34
- "recall": 0.9351944167497508,
35
- "support": 13039.0
36
  },
37
- "eval_accuracy": 0.7610281584509443,
38
- "eval_loss": 0.6209574341773987,
39
  "eval_macro avg": {
40
- "f1-score": 0.6440000042678569,
41
- "precision": 0.6567016154082965,
42
- "recall": 0.6402836013860831,
43
- "support": 29334.0
44
- },
45
- "eval_runtime": 1.3904,
46
- "eval_samples_per_second": 57.539,
47
- "eval_steps_per_second": 7.192,
48
  "eval_weighted avg": {
49
- "f1-score": 0.7526914076678427,
50
- "precision": 0.7554909643645776,
51
- "recall": 0.7610281584509443,
52
- "support": 29334.0
53
  },
54
  "step": 41
55
  },
56
  {
57
  "epoch": 2.0,
58
  "eval_Claim": {
59
- "f1-score": 0.4196301564722618,
60
- "precision": 0.5328757225433526,
61
- "recall": 0.34608165180666356,
62
- "support": 4262.0
63
  },
64
  "eval_MajorClaim": {
65
- "f1-score": 0.6500777604976672,
66
- "precision": 0.6262842465753424,
67
- "recall": 0.6757505773672056,
68
- "support": 2165.0
69
  },
70
  "eval_O": {
71
- "f1-score": 0.8802794869120867,
72
- "precision": 0.9066595059076262,
73
- "recall": 0.8553911633563032,
74
- "support": 9868.0
75
  },
76
  "eval_Premise": {
77
- "f1-score": 0.8765692621338388,
78
- "precision": 0.821313672922252,
79
- "recall": 0.9397959966255081,
80
- "support": 13039.0
81
  },
82
- "eval_accuracy": 0.8056521442694484,
83
- "eval_loss": 0.5057439804077148,
84
  "eval_macro avg": {
85
- "f1-score": 0.7066391665039636,
86
- "precision": 0.7217832869871433,
87
- "recall": 0.7042548472889201,
88
- "support": 29334.0
89
- },
90
- "eval_runtime": 1.3936,
91
- "eval_samples_per_second": 57.406,
92
- "eval_steps_per_second": 7.176,
93
  "eval_weighted avg": {
94
- "f1-score": 0.7947114837449316,
95
- "precision": 0.7937221895699558,
96
- "recall": 0.8056521442694484,
97
- "support": 29334.0
98
  },
99
  "step": 82
100
  },
101
  {
102
  "epoch": 3.0,
103
  "eval_Claim": {
104
- "f1-score": 0.5597184377838329,
105
- "precision": 0.542234931808183,
106
- "recall": 0.5783669638667293,
107
- "support": 4262.0
108
  },
109
  "eval_MajorClaim": {
110
- "f1-score": 0.7123406094661768,
111
- "precision": 0.669374492282697,
112
- "recall": 0.7612009237875289,
113
- "support": 2165.0
114
  },
115
  "eval_O": {
116
- "f1-score": 0.896587330270019,
117
- "precision": 0.9139037996000421,
118
- "recall": 0.8799148763680583,
119
- "support": 9868.0
120
  },
121
  "eval_Premise": {
122
- "f1-score": 0.879910300030931,
123
- "precision": 0.8872514619883041,
124
- "recall": 0.8726896234373802,
125
- "support": 13039.0
126
  },
127
- "eval_accuracy": 0.8241289970682485,
128
- "eval_loss": 0.47074389457702637,
129
  "eval_macro avg": {
130
- "f1-score": 0.76213916938774,
131
- "precision": 0.7531911714198065,
132
- "recall": 0.7730430968649242,
133
- "support": 29334.0
134
- },
135
- "eval_runtime": 1.3982,
136
- "eval_samples_per_second": 57.218,
137
- "eval_steps_per_second": 7.152,
138
  "eval_weighted avg": {
139
- "f1-score": 0.8266316076408545,
140
- "precision": 0.8300087121591747,
141
- "recall": 0.8241289970682485,
142
- "support": 29334.0
143
  },
144
  "step": 123
145
  },
146
  {
147
  "epoch": 4.0,
148
  "eval_Claim": {
149
- "f1-score": 0.5578872907333177,
150
- "precision": 0.5606635071090047,
151
- "recall": 0.5551384326607227,
152
- "support": 4262.0
153
  },
154
  "eval_MajorClaim": {
155
- "f1-score": 0.7178253548231899,
156
- "precision": 0.748995983935743,
157
- "recall": 0.6891454965357968,
158
- "support": 2165.0
159
  },
160
  "eval_O": {
161
- "f1-score": 0.8866524874202418,
162
- "precision": 0.9082793070464449,
163
- "recall": 0.8660316173490069,
164
- "support": 9868.0
165
  },
166
  "eval_Premise": {
167
- "f1-score": 0.8822517942583731,
168
- "precision": 0.8605702617953767,
169
- "recall": 0.9050540685635402,
170
- "support": 13039.0
171
  },
172
- "eval_accuracy": 0.8251517010977023,
173
- "eval_loss": 0.49949103593826294,
174
  "eval_macro avg": {
175
- "f1-score": 0.7611542318087806,
176
- "precision": 0.7696272649716422,
177
- "recall": 0.7538424037772666,
178
- "support": 29334.0
179
- },
180
- "eval_runtime": 1.3933,
181
- "eval_samples_per_second": 57.419,
182
- "eval_steps_per_second": 7.177,
183
  "eval_weighted avg": {
184
- "f1-score": 0.8244690603905188,
185
- "precision": 0.8248108003682995,
186
- "recall": 0.8251517010977023,
187
- "support": 29334.0
188
  },
189
  "step": 164
190
  },
191
  {
192
  "epoch": 5.0,
193
  "eval_Claim": {
194
- "f1-score": 0.5622098421541318,
195
- "precision": 0.5562700964630225,
196
- "recall": 0.5682778038479587,
197
- "support": 4262.0
198
  },
199
  "eval_MajorClaim": {
200
- "f1-score": 0.7078507078507079,
201
- "precision": 0.7994186046511628,
202
- "recall": 0.6351039260969977,
203
- "support": 2165.0
204
  },
205
  "eval_O": {
206
- "f1-score": 0.8867608581894296,
207
- "precision": 0.9167929019692708,
208
- "recall": 0.858633968382651,
209
- "support": 9868.0
210
  },
211
  "eval_Premise": {
212
- "f1-score": 0.8842074139778985,
213
- "precision": 0.8533314310172635,
214
- "recall": 0.9174016412301557,
215
- "support": 13039.0
216
  },
217
- "eval_accuracy": 0.8260721347242108,
218
- "eval_loss": 0.5355645418167114,
219
  "eval_macro avg": {
220
- "f1-score": 0.760257205543042,
221
- "precision": 0.7814532585251799,
222
- "recall": 0.7448543348894408,
223
- "support": 29334.0
224
- },
225
- "eval_runtime": 1.3973,
226
- "eval_samples_per_second": 57.254,
227
- "eval_steps_per_second": 7.157,
228
  "eval_weighted avg": {
229
- "f1-score": 0.8252666444817892,
230
- "precision": 0.827540237126271,
231
- "recall": 0.8260721347242108,
232
- "support": 29334.0
233
  },
234
  "step": 205
235
  },
236
  {
237
  "epoch": 6.0,
238
  "eval_Claim": {
239
- "f1-score": 0.5778948628906718,
240
- "precision": 0.5901198337001712,
241
- "recall": 0.5661661191928672,
242
- "support": 4262.0
243
  },
244
  "eval_MajorClaim": {
245
- "f1-score": 0.7630429786256032,
246
- "precision": 0.7593778591033852,
247
- "recall": 0.766743648960739,
248
- "support": 2165.0
249
  },
250
  "eval_O": {
251
- "f1-score": 0.8932349450436038,
252
- "precision": 0.909998948585848,
253
- "recall": 0.877077421970004,
254
- "support": 9868.0
255
  },
256
  "eval_Premise": {
257
- "f1-score": 0.8871252867942979,
258
- "precision": 0.8704605845881311,
259
- "recall": 0.9044405245801058,
260
- "support": 13039.0
261
  },
262
- "eval_accuracy": 0.8359241835412832,
263
- "eval_loss": 0.5402312278747559,
264
  "eval_macro avg": {
265
- "f1-score": 0.7803245183385442,
266
- "precision": 0.7824893064943839,
267
- "recall": 0.778606928675929,
268
- "support": 29334.0
269
- },
270
- "eval_runtime": 1.3946,
271
- "eval_samples_per_second": 57.364,
272
- "eval_steps_per_second": 7.17,
273
  "eval_weighted avg": {
274
- "f1-score": 0.8350939185438606,
275
- "precision": 0.8348315600763192,
276
- "recall": 0.8359241835412832,
277
- "support": 29334.0
278
  },
279
  "step": 246
280
  },
281
  {
282
  "epoch": 7.0,
283
  "eval_Claim": {
284
- "f1-score": 0.5928237129485181,
285
- "precision": 0.5645161290322581,
286
- "recall": 0.6241201313937119,
287
- "support": 4262.0
288
  },
289
  "eval_MajorClaim": {
290
- "f1-score": 0.7545109211775878,
291
- "precision": 0.776257938446507,
292
- "recall": 0.7339491916859122,
293
- "support": 2165.0
294
  },
295
  "eval_O": {
296
- "f1-score": 0.8982721603108067,
297
- "precision": 0.9063338147307612,
298
- "recall": 0.8903526550466153,
299
- "support": 9868.0
300
  },
301
  "eval_Premise": {
302
- "f1-score": 0.8843364197530864,
303
- "precision": 0.8897601117925626,
304
- "recall": 0.8789784492675818,
305
- "support": 13039.0
306
  },
307
- "eval_accuracy": 0.835071930183405,
308
- "eval_loss": 0.5522010922431946,
309
  "eval_macro avg": {
310
- "f1-score": 0.7824858035474997,
311
- "precision": 0.7842169985005223,
312
- "recall": 0.7818501068484554,
313
- "support": 29334.0
314
- },
315
- "eval_runtime": 1.3973,
316
- "eval_samples_per_second": 57.253,
317
- "eval_steps_per_second": 7.157,
318
  "eval_weighted avg": {
319
- "f1-score": 0.8370881251804593,
320
- "precision": 0.8397030872059231,
321
- "recall": 0.835071930183405,
322
- "support": 29334.0
323
  },
324
  "step": 287
325
  },
326
  {
327
  "epoch": 8.0,
328
  "eval_Claim": {
329
- "f1-score": 0.5708034520481342,
330
- "precision": 0.5921815889029004,
331
- "recall": 0.5509150633505396,
332
- "support": 4262.0
333
  },
334
  "eval_MajorClaim": {
335
- "f1-score": 0.7608799617407939,
336
- "precision": 0.7887952404561229,
337
- "recall": 0.7348729792147806,
338
- "support": 2165.0
339
  },
340
  "eval_O": {
341
- "f1-score": 0.9017624521072796,
342
- "precision": 0.909240754094983,
343
- "recall": 0.8944061613295501,
344
- "support": 9868.0
345
  },
346
  "eval_Premise": {
347
- "f1-score": 0.888622395442962,
348
- "precision": 0.868889703187981,
349
- "recall": 0.909272183449651,
350
- "support": 13039.0
351
  },
352
- "eval_accuracy": 0.8393331969727961,
353
- "eval_loss": 0.5863537788391113,
354
  "eval_macro avg": {
355
- "f1-score": 0.7805170653347924,
356
- "precision": 0.7897768216604968,
357
- "recall": 0.7723665968361304,
358
- "support": 29334.0
359
- },
360
- "eval_runtime": 1.4013,
361
- "eval_samples_per_second": 57.089,
362
- "eval_steps_per_second": 7.136,
363
  "eval_weighted avg": {
364
- "f1-score": 0.8374380828176649,
365
- "precision": 0.8363489544136171,
366
- "recall": 0.8393331969727961,
367
- "support": 29334.0
368
  },
369
  "step": 328
370
  },
371
  {
372
  "epoch": 9.0,
373
  "eval_Claim": {
374
- "f1-score": 0.5834502103786816,
375
- "precision": 0.5400439384861194,
376
- "recall": 0.6344439230408259,
377
- "support": 4262.0
378
  },
379
  "eval_MajorClaim": {
380
- "f1-score": 0.739652870493992,
381
- "precision": 0.7136109918419923,
382
- "recall": 0.7676674364896073,
383
- "support": 2165.0
384
  },
385
  "eval_O": {
386
- "f1-score": 0.8923944839114083,
387
- "precision": 0.9208710651142734,
388
- "recall": 0.8656262667207134,
389
- "support": 9868.0
390
  },
391
  "eval_Premise": {
392
- "f1-score": 0.8790807810255813,
393
- "precision": 0.8900330136770948,
394
- "recall": 0.86839481555334,
395
- "support": 13039.0
396
  },
397
- "eval_accuracy": 0.8260380445898957,
398
- "eval_loss": 0.6257872581481934,
399
  "eval_macro avg": {
400
- "f1-score": 0.7736445864524157,
401
- "precision": 0.76613975227987,
402
- "recall": 0.7840331104511216,
403
- "support": 29334.0
404
- },
405
- "eval_runtime": 1.3929,
406
- "eval_samples_per_second": 57.435,
407
- "eval_steps_per_second": 7.179,
408
  "eval_weighted avg": {
409
- "f1-score": 0.8303162314135053,
410
- "precision": 0.8365354605252965,
411
- "recall": 0.8260380445898957,
412
- "support": 29334.0
413
  },
414
  "step": 369
415
  },
416
  {
417
  "epoch": 10.0,
418
  "eval_Claim": {
419
- "f1-score": 0.5916413728694839,
420
- "precision": 0.5887546468401487,
421
- "recall": 0.5945565462224308,
422
- "support": 4262.0
423
  },
424
  "eval_MajorClaim": {
425
- "f1-score": 0.747756258856873,
426
- "precision": 0.765103914934751,
427
- "recall": 0.7311778290993072,
428
- "support": 2165.0
429
  },
430
  "eval_O": {
431
- "f1-score": 0.8968070337806571,
432
- "precision": 0.9102390147166266,
433
- "recall": 0.8837657073368463,
434
- "support": 9868.0
435
  },
436
  "eval_Premise": {
437
- "f1-score": 0.8894356334456263,
438
- "precision": 0.878101644245142,
439
- "recall": 0.9010660326712171,
440
- "support": 13039.0
441
  },
442
- "eval_accuracy": 0.8381741324060816,
443
- "eval_loss": 0.643328845500946,
444
  "eval_macro avg": {
445
- "f1-score": 0.78141007473816,
446
- "precision": 0.7855498051841671,
447
- "recall": 0.7776415288324503,
448
- "support": 29334.0
449
- },
450
- "eval_runtime": 1.3951,
451
- "eval_samples_per_second": 57.345,
452
- "eval_steps_per_second": 7.168,
453
  "eval_weighted avg": {
454
- "f1-score": 0.8381915478775454,
455
- "precision": 0.8385330407446147,
456
- "recall": 0.8381741324060816,
457
- "support": 29334.0
458
  },
459
  "step": 410
460
  },
461
  {
462
  "epoch": 11.0,
463
  "eval_Claim": {
464
- "f1-score": 0.5791188895594448,
465
- "precision": 0.5963211533681332,
466
- "recall": 0.5628812763960582,
467
- "support": 4262.0
468
  },
469
  "eval_MajorClaim": {
470
- "f1-score": 0.7536862460720328,
471
- "precision": 0.7905679513184585,
472
- "recall": 0.7200923787528868,
473
- "support": 2165.0
474
  },
475
  "eval_O": {
476
- "f1-score": 0.896530612244898,
477
- "precision": 0.9027949034114262,
478
- "recall": 0.8903526550466153,
479
- "support": 9868.0
480
  },
481
  "eval_Premise": {
482
- "f1-score": 0.888538617428507,
483
- "precision": 0.8699933857573308,
484
- "recall": 0.9078917094869239,
485
- "support": 13039.0
486
  },
487
- "eval_accuracy": 0.838003681734506,
488
- "eval_loss": 0.691639244556427,
489
  "eval_macro avg": {
490
- "f1-score": 0.7794685913262207,
491
- "precision": 0.7899193484638372,
492
- "recall": 0.770304504920621,
493
- "support": 29334.0
494
- },
495
- "eval_runtime": 1.3951,
496
- "eval_samples_per_second": 57.345,
497
- "eval_steps_per_second": 7.168,
498
  "eval_weighted avg": {
499
- "f1-score": 0.836318079509486,
500
- "precision": 0.8354034306270279,
501
- "recall": 0.838003681734506,
502
- "support": 29334.0
503
  },
504
  "step": 451
505
  },
506
  {
507
  "epoch": 12.0,
508
  "eval_Claim": {
509
- "f1-score": 0.5808454740864581,
510
- "precision": 0.5914396887159533,
511
- "recall": 0.5706241201313937,
512
- "support": 4262.0
513
  },
514
  "eval_MajorClaim": {
515
- "f1-score": 0.7569141193595342,
516
- "precision": 0.797138477261114,
517
- "recall": 0.7205542725173211,
518
- "support": 2165.0
519
  },
520
  "eval_O": {
521
- "f1-score": 0.8973055414336554,
522
- "precision": 0.9003264639869415,
523
- "recall": 0.8943048236724767,
524
- "support": 9868.0
525
  },
526
  "eval_Premise": {
527
- "f1-score": 0.8841596860614294,
528
- "precision": 0.870236945703038,
529
- "recall": 0.8985351637395506,
530
- "support": 13039.0
531
  },
532
- "eval_accuracy": 0.8363332651530647,
533
- "eval_loss": 0.6996743679046631,
534
  "eval_macro avg": {
535
- "f1-score": 0.7798062052352693,
536
- "precision": 0.7897853939167616,
537
- "recall": 0.7710045950151856,
538
- "support": 29334.0
539
- },
540
- "eval_runtime": 1.3919,
541
- "eval_samples_per_second": 57.477,
542
- "eval_steps_per_second": 7.185,
543
  "eval_weighted avg": {
544
- "f1-score": 0.8351214191174802,
545
- "precision": 0.8344570068256206,
546
- "recall": 0.8363332651530647,
547
- "support": 29334.0
548
  },
549
  "step": 492
550
  }
 
11
  {
12
  "epoch": 1.0,
13
  "eval_Claim": {
14
+ "f1-score": 0.47523786289338865,
15
+ "precision": 0.535017852238396,
16
+ "recall": 0.4274742154926487,
17
+ "support": 4557.0
18
  },
19
  "eval_MajorClaim": {
20
+ "f1-score": 0.5895036615134255,
21
+ "precision": 0.5474121647147714,
22
+ "recall": 0.6386073159982371,
23
+ "support": 2269.0
24
  },
25
  "eval_O": {
26
+ "f1-score": 0.8362336114421931,
27
+ "precision": 0.845403060609712,
28
+ "recall": 0.8272609362103526,
29
+ "support": 8481.0
30
  },
31
  "eval_Premise": {
32
+ "f1-score": 0.8706190412246543,
33
+ "precision": 0.850072112232857,
34
+ "recall": 0.8921838447777625,
35
+ "support": 14534.0
36
  },
37
+ "eval_accuracy": 0.7834858081163499,
38
+ "eval_loss": 0.5869407653808594,
39
  "eval_macro avg": {
40
+ "f1-score": 0.6928985442684154,
41
+ "precision": 0.694476297448934,
42
+ "recall": 0.6963815781197502,
43
+ "support": 29841.0
44
+ },
45
+ "eval_runtime": 1.4026,
46
+ "eval_samples_per_second": 57.038,
47
+ "eval_steps_per_second": 7.13,
48
  "eval_weighted avg": {
49
+ "f1-score": 0.7790930985214805,
50
+ "precision": 0.7776202536983177,
51
+ "recall": 0.7834858081163499,
52
+ "support": 29841.0
53
  },
54
  "step": 41
55
  },
56
  {
57
  "epoch": 2.0,
58
  "eval_Claim": {
59
+ "f1-score": 0.5317480394636985,
60
+ "precision": 0.6276500447894894,
61
+ "recall": 0.4612683783190696,
62
+ "support": 4557.0
63
  },
64
  "eval_MajorClaim": {
65
+ "f1-score": 0.7102803738317758,
66
+ "precision": 0.6855268552685527,
67
+ "recall": 0.7368884971353019,
68
+ "support": 2269.0
69
  },
70
  "eval_O": {
71
+ "f1-score": 0.8735280263777673,
72
+ "precision": 0.872397977184523,
73
+ "recall": 0.8746610069567268,
74
+ "support": 8481.0
75
  },
76
  "eval_Premise": {
77
+ "f1-score": 0.884589815184151,
78
+ "precision": 0.8556913183279743,
79
+ "recall": 0.9155084629145452,
80
+ "support": 14534.0
81
  },
82
+ "eval_accuracy": 0.820951040514728,
83
+ "eval_loss": 0.48614954948425293,
84
  "eval_macro avg": {
85
+ "f1-score": 0.7500365637143481,
86
+ "precision": 0.7603165488926349,
87
+ "recall": 0.7470815863314109,
88
+ "support": 29841.0
89
+ },
90
+ "eval_runtime": 1.3997,
91
+ "eval_samples_per_second": 57.154,
92
+ "eval_steps_per_second": 7.144,
93
  "eval_weighted avg": {
94
+ "f1-score": 0.8143098940939201,
95
+ "precision": 0.8126767385071133,
96
+ "recall": 0.820951040514728,
97
+ "support": 29841.0
98
  },
99
  "step": 82
100
  },
101
  {
102
  "epoch": 3.0,
103
  "eval_Claim": {
104
+ "f1-score": 0.5762534088525278,
105
+ "precision": 0.5519389190275267,
106
+ "recall": 0.6028088654816766,
107
+ "support": 4557.0
108
  },
109
  "eval_MajorClaim": {
110
+ "f1-score": 0.7533490937746257,
111
+ "precision": 0.6811542572141076,
112
+ "recall": 0.8426619656236227,
113
+ "support": 2269.0
114
  },
115
  "eval_O": {
116
+ "f1-score": 0.8863363002165023,
117
+ "precision": 0.9045047256658892,
118
+ "recall": 0.868883386393114,
119
+ "support": 8481.0
120
  },
121
  "eval_Premise": {
122
+ "f1-score": 0.8715370552664885,
123
+ "precision": 0.8910855499640546,
124
+ "recall": 0.8528278519333975,
125
+ "support": 14534.0
126
  },
127
+ "eval_accuracy": 0.8184377199155525,
128
+ "eval_loss": 0.46511921286582947,
129
  "eval_macro avg": {
130
+ "f1-score": 0.7718689645275361,
131
+ "precision": 0.7571708629678946,
132
+ "recall": 0.7917955173579527,
133
+ "support": 29841.0
134
+ },
135
+ "eval_runtime": 1.4011,
136
+ "eval_samples_per_second": 57.099,
137
+ "eval_steps_per_second": 7.137,
138
  "eval_weighted avg": {
139
+ "f1-score": 0.8216639389194362,
140
+ "precision": 0.8271460951435015,
141
+ "recall": 0.8184377199155525,
142
+ "support": 29841.0
143
  },
144
  "step": 123
145
  },
146
  {
147
  "epoch": 4.0,
148
  "eval_Claim": {
149
+ "f1-score": 0.5960000000000001,
150
+ "precision": 0.5727291118753793,
151
+ "recall": 0.6212420452051789,
152
+ "support": 4557.0
153
  },
154
  "eval_MajorClaim": {
155
+ "f1-score": 0.7671584348941629,
156
+ "precision": 0.7450166112956811,
157
+ "recall": 0.7906566769501984,
158
+ "support": 2269.0
159
  },
160
  "eval_O": {
161
+ "f1-score": 0.8945798982634625,
162
+ "precision": 0.8872651356993737,
163
+ "recall": 0.9020162716660771,
164
+ "support": 8481.0
165
  },
166
  "eval_Premise": {
167
+ "f1-score": 0.8770509119076122,
168
+ "precision": 0.8981107585809057,
169
+ "recall": 0.8569561029310582,
170
+ "support": 14534.0
171
  },
172
+ "eval_accuracy": 0.8287255789015113,
173
+ "eval_loss": 0.46847572922706604,
174
  "eval_macro avg": {
175
+ "f1-score": 0.7836973112663095,
176
+ "precision": 0.7757804043628349,
177
+ "recall": 0.792717774188128,
178
+ "support": 29841.0
179
+ },
180
+ "eval_runtime": 1.3906,
181
+ "eval_samples_per_second": 57.529,
182
+ "eval_steps_per_second": 7.191,
183
  "eval_weighted avg": {
184
+ "f1-score": 0.8307578351802057,
185
+ "precision": 0.8336988249364055,
186
+ "recall": 0.8287255789015113,
187
+ "support": 29841.0
188
  },
189
  "step": 164
190
  },
191
  {
192
  "epoch": 5.0,
193
  "eval_Claim": {
194
+ "f1-score": 0.5957255343082115,
195
+ "precision": 0.6111239326102008,
196
+ "recall": 0.5810840465218345,
197
+ "support": 4557.0
198
  },
199
  "eval_MajorClaim": {
200
+ "f1-score": 0.7869718309859155,
201
+ "precision": 0.7859340659340659,
202
+ "recall": 0.7880123402379903,
203
+ "support": 2269.0
204
  },
205
  "eval_O": {
206
+ "f1-score": 0.8924617196702003,
207
+ "precision": 0.8915166490175315,
208
+ "recall": 0.8934087961325315,
209
+ "support": 8481.0
210
  },
211
  "eval_Premise": {
212
+ "f1-score": 0.8858138581385815,
213
+ "precision": 0.8798018189222208,
214
+ "recall": 0.8919086280445852,
215
+ "support": 14534.0
216
  },
217
+ "eval_accuracy": 0.8369692704668074,
218
+ "eval_loss": 0.4714011251926422,
219
  "eval_macro avg": {
220
+ "f1-score": 0.7902432357757272,
221
+ "precision": 0.7920941166210047,
222
+ "recall": 0.7886034527342354,
223
+ "support": 29841.0
224
+ },
225
+ "eval_runtime": 1.4,
226
+ "eval_samples_per_second": 57.143,
227
+ "eval_steps_per_second": 7.143,
228
  "eval_weighted avg": {
229
+ "f1-score": 0.8358884354766487,
230
+ "precision": 0.8349642603479214,
231
+ "recall": 0.8369692704668074,
232
+ "support": 29841.0
233
  },
234
  "step": 205
235
  },
236
  {
237
  "epoch": 6.0,
238
  "eval_Claim": {
239
+ "f1-score": 0.5968608901311546,
240
+ "precision": 0.5850368809272919,
241
+ "recall": 0.6091727013385999,
242
+ "support": 4557.0
243
  },
244
  "eval_MajorClaim": {
245
+ "f1-score": 0.8127323420074349,
246
+ "precision": 0.8594594594594595,
247
+ "recall": 0.7708241516086382,
248
+ "support": 2269.0
249
  },
250
  "eval_O": {
251
+ "f1-score": 0.8972979364985514,
252
+ "precision": 0.8999051233396584,
253
+ "recall": 0.8947058129937507,
254
+ "support": 8481.0
255
  },
256
  "eval_Premise": {
257
+ "f1-score": 0.8825566642663649,
258
+ "precision": 0.8796910246770114,
259
+ "recall": 0.8854410348149168,
260
+ "support": 14534.0
261
  },
262
+ "eval_accuracy": 0.8371703361147415,
263
+ "eval_loss": 0.5037193298339844,
264
  "eval_macro avg": {
265
+ "f1-score": 0.7973619582258764,
266
+ "precision": 0.8060231221008552,
267
+ "recall": 0.7900359251889764,
268
+ "support": 29841.0
269
+ },
270
+ "eval_runtime": 1.4008,
271
+ "eval_samples_per_second": 57.109,
272
+ "eval_steps_per_second": 7.139,
273
  "eval_weighted avg": {
274
+ "f1-score": 0.8378086229762441,
275
+ "precision": 0.8389012192486348,
276
+ "recall": 0.8371703361147415,
277
+ "support": 29841.0
278
  },
279
  "step": 246
280
  },
281
  {
282
  "epoch": 7.0,
283
  "eval_Claim": {
284
+ "f1-score": 0.6057510824913955,
285
+ "precision": 0.6130337078651685,
286
+ "recall": 0.5986394557823129,
287
+ "support": 4557.0
288
  },
289
  "eval_MajorClaim": {
290
+ "f1-score": 0.7914081145584726,
291
+ "precision": 0.8630921395106715,
292
+ "recall": 0.7307183781401498,
293
+ "support": 2269.0
294
  },
295
  "eval_O": {
296
+ "f1-score": 0.8969556393157437,
297
+ "precision": 0.8824737562756733,
298
+ "recall": 0.9119207640608419,
299
+ "support": 8481.0
300
  },
301
  "eval_Premise": {
302
+ "f1-score": 0.8857729138166894,
303
+ "precision": 0.880592955256358,
304
+ "recall": 0.8910141736617586,
305
+ "support": 14534.0
306
  },
307
+ "eval_accuracy": 0.8401192989511075,
308
+ "eval_loss": 0.5329757928848267,
309
  "eval_macro avg": {
310
+ "f1-score": 0.7949719375455753,
311
+ "precision": 0.8097981397269679,
312
+ "recall": 0.7830731929112658,
313
+ "support": 29841.0
314
+ },
315
+ "eval_runtime": 1.3907,
316
+ "eval_samples_per_second": 57.526,
317
+ "eval_steps_per_second": 7.191,
318
  "eval_weighted avg": {
319
+ "f1-score": 0.8390140076168712,
320
+ "precision": 0.8389379916879856,
321
+ "recall": 0.8401192989511075,
322
+ "support": 29841.0
323
  },
324
  "step": 287
325
  },
326
  {
327
  "epoch": 8.0,
328
  "eval_Claim": {
329
+ "f1-score": 0.6007012930089853,
330
+ "precision": 0.599912453490917,
331
+ "recall": 0.6014922097871407,
332
+ "support": 4557.0
333
  },
334
  "eval_MajorClaim": {
335
+ "f1-score": 0.8150046598322461,
336
+ "precision": 0.8645575877409788,
337
+ "recall": 0.7708241516086382,
338
+ "support": 2269.0
339
  },
340
  "eval_O": {
341
+ "f1-score": 0.8958295721249322,
342
+ "precision": 0.9148230088495575,
343
+ "recall": 0.8776087725504068,
344
+ "support": 8481.0
345
  },
346
  "eval_Premise": {
347
+ "f1-score": 0.8864303302189092,
348
+ "precision": 0.8694501422616291,
349
+ "recall": 0.9040869684876841,
350
+ "support": 14534.0
351
  },
352
+ "eval_accuracy": 0.8402198317750745,
353
+ "eval_loss": 0.5759353637695312,
354
  "eval_macro avg": {
355
+ "f1-score": 0.7994914637962682,
356
+ "precision": 0.8121857980857706,
357
+ "recall": 0.7885030256084674,
358
+ "support": 29841.0
359
+ },
360
+ "eval_runtime": 1.4002,
361
+ "eval_samples_per_second": 57.137,
362
+ "eval_steps_per_second": 7.142,
363
  "eval_weighted avg": {
364
+ "f1-score": 0.8400372100799064,
365
+ "precision": 0.8408124567818104,
366
+ "recall": 0.8402198317750745,
367
+ "support": 29841.0
368
  },
369
  "step": 328
370
  },
371
  {
372
  "epoch": 9.0,
373
  "eval_Claim": {
374
+ "f1-score": 0.6078538018057218,
375
+ "precision": 0.6026747195858498,
376
+ "recall": 0.6131226684222076,
377
+ "support": 4557.0
378
  },
379
  "eval_MajorClaim": {
380
+ "f1-score": 0.8104317335086566,
381
+ "precision": 0.8060156931124673,
382
+ "recall": 0.8148964301454386,
383
+ "support": 2269.0
384
  },
385
  "eval_O": {
386
+ "f1-score": 0.8967088304058509,
387
+ "precision": 0.9120731707317074,
388
+ "recall": 0.8818535550053059,
389
+ "support": 8481.0
390
  },
391
  "eval_Premise": {
392
+ "f1-score": 0.8858266370319713,
393
+ "precision": 0.8804975868397797,
394
+ "recall": 0.8912205862116417,
395
+ "support": 14534.0
396
  },
397
+ "eval_accuracy": 0.8402868536577193,
398
+ "eval_loss": 0.597597062587738,
399
  "eval_macro avg": {
400
+ "f1-score": 0.8002052506880502,
401
+ "precision": 0.800315292567451,
402
+ "recall": 0.8002733099461484,
403
+ "support": 29841.0
404
+ },
405
+ "eval_runtime": 1.4006,
406
+ "eval_samples_per_second": 57.118,
407
+ "eval_steps_per_second": 7.14,
408
  "eval_weighted avg": {
409
+ "f1-score": 0.8407376197665799,
410
+ "precision": 0.8413820848138425,
411
+ "recall": 0.8402868536577193,
412
+ "support": 29841.0
413
  },
414
  "step": 369
415
  },
416
  {
417
  "epoch": 10.0,
418
  "eval_Claim": {
419
+ "f1-score": 0.6166648417825469,
420
+ "precision": 0.6153846153846154,
421
+ "recall": 0.6179504059688391,
422
+ "support": 4557.0
423
  },
424
  "eval_MajorClaim": {
425
+ "f1-score": 0.8066597294484912,
426
+ "precision": 0.7641955835962145,
427
+ "recall": 0.8541207580431909,
428
+ "support": 2269.0
429
  },
430
  "eval_O": {
431
+ "f1-score": 0.8995083343326538,
432
+ "precision": 0.9150908869098451,
433
+ "recall": 0.8844475887277443,
434
+ "support": 8481.0
435
  },
436
  "eval_Premise": {
437
+ "f1-score": 0.8894240693593889,
438
+ "precision": 0.8894852738783374,
439
+ "recall": 0.8893628732626944,
440
+ "support": 14534.0
441
  },
442
+ "eval_accuracy": 0.8438390134378875,
443
+ "eval_loss": 0.6327010989189148,
444
  "eval_macro avg": {
445
+ "f1-score": 0.8030642437307701,
446
+ "precision": 0.7960390899422531,
447
+ "recall": 0.8114704065006171,
448
+ "support": 29841.0
449
+ },
450
+ "eval_runtime": 1.3944,
451
+ "eval_samples_per_second": 57.373,
452
+ "eval_steps_per_second": 7.172,
453
  "eval_weighted avg": {
454
+ "f1-score": 0.8443440976397001,
455
+ "precision": 0.8453782465037248,
456
+ "recall": 0.8438390134378875,
457
+ "support": 29841.0
458
  },
459
  "step": 410
460
  },
461
  {
462
  "epoch": 11.0,
463
  "eval_Claim": {
464
+ "f1-score": 0.6205015213513796,
465
+ "precision": 0.5944913550462404,
466
+ "recall": 0.6488918147904323,
467
+ "support": 4557.0
468
  },
469
  "eval_MajorClaim": {
470
+ "f1-score": 0.8115818607621886,
471
+ "precision": 0.78500823723229,
472
+ "recall": 0.8400176289114147,
473
+ "support": 2269.0
474
  },
475
  "eval_O": {
476
+ "f1-score": 0.8931679980922858,
477
+ "precision": 0.9032919329555047,
478
+ "recall": 0.8832684824902723,
479
+ "support": 8481.0
480
  },
481
  "eval_Premise": {
482
+ "f1-score": 0.8841004184100418,
483
+ "precision": 0.8962250812950657,
484
+ "recall": 0.872299435805697,
485
+ "support": 14534.0
486
  },
487
+ "eval_accuracy": 0.8388458831808585,
488
+ "eval_loss": 0.6347343325614929,
489
  "eval_macro avg": {
490
+ "f1-score": 0.802337949653974,
491
+ "precision": 0.7947541516322751,
492
+ "recall": 0.8111193404994541,
493
+ "support": 29841.0
494
+ },
495
+ "eval_runtime": 1.3894,
496
+ "eval_samples_per_second": 57.578,
497
+ "eval_steps_per_second": 7.197,
498
  "eval_weighted avg": {
499
+ "f1-score": 0.8409094181783406,
500
+ "precision": 0.843699440707882,
501
+ "recall": 0.8388458831808585,
502
+ "support": 29841.0
503
  },
504
  "step": 451
505
  },
506
  {
507
  "epoch": 12.0,
508
  "eval_Claim": {
509
+ "f1-score": 0.6289669861554845,
510
+ "precision": 0.6110076557003932,
511
+ "recall": 0.6480140443274084,
512
+ "support": 4557.0
513
  },
514
  "eval_MajorClaim": {
515
+ "f1-score": 0.8147826086956521,
516
+ "precision": 0.803946803946804,
517
+ "recall": 0.8259144997796386,
518
+ "support": 2269.0
519
  },
520
  "eval_O": {
521
+ "f1-score": 0.9003071107961257,
522
+ "precision": 0.901905099988167,
523
+ "recall": 0.8987147742011555,
524
+ "support": 8481.0
525
  },
526
  "eval_Premise": {
527
+ "f1-score": 0.8883866481223922,
528
+ "precision": 0.8980036552790664,
529
+ "recall": 0.8789734415852484,
530
+ "support": 14534.0
531
  },
532
+ "eval_accuracy": 0.8452799839147481,
533
+ "eval_loss": 0.6512799859046936,
534
  "eval_macro avg": {
535
+ "f1-score": 0.8081108384424137,
536
+ "precision": 0.8037158037286076,
537
+ "recall": 0.8129041899733627,
538
+ "support": 29841.0
539
+ },
540
+ "eval_runtime": 1.3915,
541
+ "eval_samples_per_second": 57.493,
542
+ "eval_steps_per_second": 7.187,
543
  "eval_weighted avg": {
544
+ "f1-score": 0.8465621274593268,
545
+ "precision": 0.8481337577161484,
546
+ "recall": 0.8452799839147481,
547
+ "support": 29841.0
548
  },
549
  "step": 492
550
  }
checkpoint-492/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7094583e4fe5a2c55a5632947c89b5062ef3102a7d8117131675dc677677192b
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdcb45ede21ecca936ab63090715c5dc953e544931a449f7e44cc1bbcab87ad8
3
  size 4664