varcoder commited on
Commit
84778f4
1 Parent(s): 4ddb7ae

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 9.8,
3
- "eval_accuracy": 0.8715686274509804,
4
- "eval_loss": 0.3589998185634613,
5
- "eval_runtime": 34.1863,
6
- "eval_samples_per_second": 59.673,
7
- "eval_steps_per_second": 1.872,
8
- "total_flos": 7.501244449451129e+18,
9
- "train_loss": 0.7515069055557251,
10
- "train_runtime": 2638.4717,
11
- "train_samples_per_second": 30.923,
12
- "train_steps_per_second": 0.095
13
  }
 
1
  {
2
+ "epoch": 8.11,
3
+ "eval_accuracy": 0.0,
4
+ "eval_loss": NaN,
5
+ "eval_runtime": 5.2931,
6
+ "eval_samples_per_second": 55.733,
7
+ "eval_steps_per_second": 1.889,
8
+ "total_flos": 3.675135085585367e+17,
9
+ "train_loss": 0.0,
10
+ "train_runtime": 249.2359,
11
+ "train_samples_per_second": 47.345,
12
+ "train_steps_per_second": 0.12
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 9.8,
3
- "eval_accuracy": 0.8715686274509804,
4
- "eval_loss": 0.3589998185634613,
5
- "eval_runtime": 34.1863,
6
- "eval_samples_per_second": 59.673,
7
- "eval_steps_per_second": 1.872
8
  }
 
1
  {
2
+ "epoch": 8.11,
3
+ "eval_accuracy": 0.0,
4
+ "eval_loss": NaN,
5
+ "eval_runtime": 5.2931,
6
+ "eval_samples_per_second": 55.733,
7
+ "eval_steps_per_second": 1.889
8
  }
runs/Mar10_00-45-05_f2dfbab62cd5/events.out.tfevents.1710031788.f2dfbab62cd5.3507.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:129e2846aa4a442120924ff1dcd5ac816254453c356e816f2b5408868cad1073
3
+ size 405
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 9.8,
3
- "total_flos": 7.501244449451129e+18,
4
- "train_loss": 0.7515069055557251,
5
- "train_runtime": 2638.4717,
6
- "train_samples_per_second": 30.923,
7
- "train_steps_per_second": 0.095
8
  }
 
1
  {
2
+ "epoch": 8.11,
3
+ "total_flos": 3.675135085585367e+17,
4
+ "train_loss": 0.0,
5
+ "train_runtime": 249.2359,
6
+ "train_samples_per_second": 47.345,
7
+ "train_steps_per_second": 0.12
8
  }
trainer_state.json CHANGED
@@ -1,268 +1,132 @@
1
  {
2
- "best_metric": 0.8715686274509804,
3
- "best_model_checkpoint": "resnet-101-finetuned-CivilEng11k/checkpoint-204",
4
- "epoch": 9.803921568627452,
5
  "eval_steps": 500,
6
- "global_step": 250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.39,
13
- "learning_rate": 0.00011999999999999999,
14
- "loss": 2.6064,
15
- "step": 10
16
- },
17
- {
18
- "epoch": 0.78,
19
- "learning_rate": 0.00023999999999999998,
20
- "loss": 2.4679,
21
- "step": 20
22
- },
23
- {
24
- "epoch": 0.98,
25
- "eval_accuracy": 0.5367647058823529,
26
- "eval_loss": 1.9448940753936768,
27
- "eval_runtime": 41.2734,
28
- "eval_samples_per_second": 49.426,
29
- "eval_steps_per_second": 1.551,
30
- "step": 25
31
- },
32
- {
33
- "epoch": 1.18,
34
- "learning_rate": 0.00029333333333333327,
35
- "loss": 1.9417,
36
- "step": 30
37
- },
38
- {
39
- "epoch": 1.57,
40
- "learning_rate": 0.00028,
41
- "loss": 1.3729,
42
- "step": 40
43
- },
44
- {
45
- "epoch": 1.96,
46
- "learning_rate": 0.0002666666666666666,
47
- "loss": 1.2247,
48
- "step": 50
49
- },
50
- {
51
- "epoch": 2.0,
52
- "eval_accuracy": 0.6799019607843138,
53
- "eval_loss": 1.1000670194625854,
54
- "eval_runtime": 42.9676,
55
- "eval_samples_per_second": 47.478,
56
- "eval_steps_per_second": 1.489,
57
- "step": 51
58
- },
59
- {
60
- "epoch": 2.35,
61
- "learning_rate": 0.00025333333333333333,
62
- "loss": 1.062,
63
- "step": 60
64
- },
65
- {
66
- "epoch": 2.75,
67
- "learning_rate": 0.00023999999999999998,
68
- "loss": 0.8434,
69
- "step": 70
70
- },
71
- {
72
- "epoch": 2.98,
73
- "eval_accuracy": 0.7887254901960784,
74
- "eval_loss": 0.5851422548294067,
75
- "eval_runtime": 40.7115,
76
- "eval_samples_per_second": 50.109,
77
- "eval_steps_per_second": 1.572,
78
- "step": 76
79
- },
80
- {
81
- "epoch": 3.14,
82
- "learning_rate": 0.00022666666666666663,
83
- "loss": 0.6665,
84
- "step": 80
85
- },
86
- {
87
- "epoch": 3.53,
88
- "learning_rate": 0.00021333333333333333,
89
- "loss": 0.5464,
90
- "step": 90
91
- },
92
- {
93
- "epoch": 3.92,
94
- "learning_rate": 0.00019999999999999998,
95
- "loss": 0.491,
96
- "step": 100
97
  },
98
  {
99
- "epoch": 4.0,
100
- "eval_accuracy": 0.8338235294117647,
101
- "eval_loss": 0.43349361419677734,
102
- "eval_runtime": 41.9829,
103
- "eval_samples_per_second": 48.591,
104
- "eval_steps_per_second": 1.524,
105
- "step": 102
106
  },
107
  {
108
- "epoch": 4.31,
109
- "learning_rate": 0.00018666666666666666,
110
- "loss": 0.4475,
111
- "step": 110
112
- },
113
- {
114
- "epoch": 4.71,
115
- "learning_rate": 0.0001733333333333333,
116
- "loss": 0.4512,
117
- "step": 120
118
- },
119
- {
120
- "epoch": 4.98,
121
- "eval_accuracy": 0.8401960784313726,
122
- "eval_loss": 0.40097689628601074,
123
- "eval_runtime": 40.6062,
124
- "eval_samples_per_second": 50.239,
125
- "eval_steps_per_second": 1.576,
126
- "step": 127
127
- },
128
- {
129
- "epoch": 5.1,
130
- "learning_rate": 0.00015999999999999999,
131
- "loss": 0.4392,
132
- "step": 130
133
- },
134
- {
135
- "epoch": 5.49,
136
- "learning_rate": 0.00014666666666666664,
137
- "loss": 0.4147,
138
- "step": 140
139
- },
140
- {
141
- "epoch": 5.88,
142
- "learning_rate": 0.0001333333333333333,
143
- "loss": 0.3891,
144
- "step": 150
145
  },
146
  {
147
- "epoch": 6.0,
148
- "eval_accuracy": 0.8544117647058823,
149
- "eval_loss": 0.38171347975730896,
150
- "eval_runtime": 43.7502,
151
- "eval_samples_per_second": 46.628,
152
- "eval_steps_per_second": 1.463,
153
- "step": 153
154
  },
155
  {
156
- "epoch": 6.27,
157
- "learning_rate": 0.00011999999999999999,
158
- "loss": 0.3902,
159
- "step": 160
 
 
 
160
  },
161
  {
162
- "epoch": 6.67,
163
- "learning_rate": 0.00010666666666666667,
164
- "loss": 0.3533,
165
- "step": 170
 
 
 
166
  },
167
  {
168
- "epoch": 6.98,
169
- "eval_accuracy": 0.8602941176470589,
170
- "eval_loss": 0.3679962158203125,
171
- "eval_runtime": 38.6694,
172
- "eval_samples_per_second": 52.755,
173
- "eval_steps_per_second": 1.655,
174
- "step": 178
175
  },
176
  {
177
- "epoch": 7.06,
178
- "learning_rate": 9.333333333333333e-05,
179
- "loss": 0.3553,
180
- "step": 180
 
 
 
181
  },
182
  {
183
- "epoch": 7.45,
184
- "learning_rate": 7.999999999999999e-05,
185
- "loss": 0.352,
186
- "step": 190
 
 
 
187
  },
188
  {
189
  "epoch": 7.84,
190
- "learning_rate": 6.666666666666666e-05,
191
- "loss": 0.3407,
192
- "step": 200
 
 
 
193
  },
194
  {
195
- "epoch": 8.0,
196
- "eval_accuracy": 0.8715686274509804,
197
- "eval_loss": 0.3589998185634613,
198
- "eval_runtime": 31.761,
199
- "eval_samples_per_second": 64.23,
200
- "eval_steps_per_second": 2.015,
201
- "step": 204
202
- },
203
- {
204
- "epoch": 8.24,
205
- "learning_rate": 5.333333333333333e-05,
206
- "loss": 0.351,
207
- "step": 210
208
- },
209
- {
210
- "epoch": 8.63,
211
- "learning_rate": 3.9999999999999996e-05,
212
- "loss": 0.3244,
213
- "step": 220
214
- },
215
- {
216
- "epoch": 8.98,
217
- "eval_accuracy": 0.8661764705882353,
218
- "eval_loss": 0.36056193709373474,
219
- "eval_runtime": 34.9574,
220
- "eval_samples_per_second": 58.357,
221
- "eval_steps_per_second": 1.831,
222
- "step": 229
223
- },
224
- {
225
- "epoch": 9.02,
226
- "learning_rate": 2.6666666666666667e-05,
227
- "loss": 0.3148,
228
- "step": 230
229
- },
230
- {
231
- "epoch": 9.41,
232
- "learning_rate": 1.3333333333333333e-05,
233
- "loss": 0.3156,
234
- "step": 240
235
- },
236
- {
237
- "epoch": 9.8,
238
  "learning_rate": 0.0,
239
- "loss": 0.3258,
240
- "step": 250
241
  },
242
  {
243
- "epoch": 9.8,
244
- "eval_accuracy": 0.8691176470588236,
245
- "eval_loss": 0.3549394905567169,
246
- "eval_runtime": 38.198,
247
- "eval_samples_per_second": 53.406,
248
- "eval_steps_per_second": 1.675,
249
- "step": 250
250
  },
251
  {
252
- "epoch": 9.8,
253
- "step": 250,
254
- "total_flos": 7.501244449451129e+18,
255
- "train_loss": 0.7515069055557251,
256
- "train_runtime": 2638.4717,
257
- "train_samples_per_second": 30.923,
258
- "train_steps_per_second": 0.095
259
  }
260
  ],
261
  "logging_steps": 10,
262
- "max_steps": 250,
 
263
  "num_train_epochs": 10,
264
  "save_steps": 500,
265
- "total_flos": 7.501244449451129e+18,
 
266
  "trial_name": null,
267
  "trial_params": null
268
  }
 
1
  {
2
+ "best_metric": 0.0,
3
+ "best_model_checkpoint": "resnet-101-finetuned-CivilEng11k/checkpoint-3",
4
+ "epoch": 8.108108108108109,
5
  "eval_steps": 500,
6
+ "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.81,
13
+ "eval_accuracy": 0.0,
14
+ "eval_loss": NaN,
15
+ "eval_runtime": 5.4471,
16
+ "eval_samples_per_second": 54.157,
17
+ "eval_steps_per_second": 1.836,
18
+ "step": 3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  },
20
  {
21
+ "epoch": 1.89,
22
+ "eval_accuracy": 0.0,
23
+ "eval_loss": NaN,
24
+ "eval_runtime": 5.2566,
25
+ "eval_samples_per_second": 56.12,
26
+ "eval_steps_per_second": 1.902,
27
+ "step": 7
28
  },
29
  {
30
+ "epoch": 2.7,
31
+ "grad_norm": NaN,
32
+ "learning_rate": 0.00022222222222222218,
33
+ "loss": 0.0,
34
+ "step": 10
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
35
  },
36
  {
37
+ "epoch": 2.97,
38
+ "eval_accuracy": 0.0,
39
+ "eval_loss": NaN,
40
+ "eval_runtime": 5.2368,
41
+ "eval_samples_per_second": 56.332,
42
+ "eval_steps_per_second": 1.91,
43
+ "step": 11
44
  },
45
  {
46
+ "epoch": 3.78,
47
+ "eval_accuracy": 0.0,
48
+ "eval_loss": NaN,
49
+ "eval_runtime": 5.1779,
50
+ "eval_samples_per_second": 56.973,
51
+ "eval_steps_per_second": 1.931,
52
+ "step": 14
53
  },
54
  {
55
+ "epoch": 4.86,
56
+ "eval_accuracy": 0.0,
57
+ "eval_loss": NaN,
58
+ "eval_runtime": 5.1256,
59
+ "eval_samples_per_second": 57.555,
60
+ "eval_steps_per_second": 1.951,
61
+ "step": 18
62
  },
63
  {
64
+ "epoch": 5.41,
65
+ "grad_norm": NaN,
66
+ "learning_rate": 0.00011111111111111109,
67
+ "loss": 0.0,
68
+ "step": 20
 
 
69
  },
70
  {
71
+ "epoch": 5.95,
72
+ "eval_accuracy": 0.0,
73
+ "eval_loss": NaN,
74
+ "eval_runtime": 5.1976,
75
+ "eval_samples_per_second": 56.757,
76
+ "eval_steps_per_second": 1.924,
77
+ "step": 22
78
  },
79
  {
80
+ "epoch": 6.76,
81
+ "eval_accuracy": 0.0,
82
+ "eval_loss": NaN,
83
+ "eval_runtime": 5.1726,
84
+ "eval_samples_per_second": 57.032,
85
+ "eval_steps_per_second": 1.933,
86
+ "step": 25
87
  },
88
  {
89
  "epoch": 7.84,
90
+ "eval_accuracy": 0.0,
91
+ "eval_loss": NaN,
92
+ "eval_runtime": 5.0794,
93
+ "eval_samples_per_second": 58.078,
94
+ "eval_steps_per_second": 1.969,
95
+ "step": 29
96
  },
97
  {
98
+ "epoch": 8.11,
99
+ "grad_norm": NaN,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
100
  "learning_rate": 0.0,
101
+ "loss": 0.0,
102
+ "step": 30
103
  },
104
  {
105
+ "epoch": 8.11,
106
+ "eval_accuracy": 0.0,
107
+ "eval_loss": NaN,
108
+ "eval_runtime": 5.2939,
109
+ "eval_samples_per_second": 55.725,
110
+ "eval_steps_per_second": 1.889,
111
+ "step": 30
112
  },
113
  {
114
+ "epoch": 8.11,
115
+ "step": 30,
116
+ "total_flos": 3.675135085585367e+17,
117
+ "train_loss": 0.0,
118
+ "train_runtime": 249.2359,
119
+ "train_samples_per_second": 47.345,
120
+ "train_steps_per_second": 0.12
121
  }
122
  ],
123
  "logging_steps": 10,
124
+ "max_steps": 30,
125
+ "num_input_tokens_seen": 0,
126
  "num_train_epochs": 10,
127
  "save_steps": 500,
128
+ "total_flos": 3.675135085585367e+17,
129
+ "train_batch_size": 32,
130
  "trial_name": null,
131
  "trial_params": null
132
  }