varcoder committed on
Commit
e3f532e
1 Parent(s): 4e5f4a5

End of training

Browse files
README.md CHANGED
@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [microsoft/resnet-101](https://huggingface.co/microsoft/resnet-101) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.3944
21
- - Accuracy: 0.8471
22
 
23
  ## Model description
24
 
 
17
 
18
  This model is a fine-tuned version of [microsoft/resnet-101](https://huggingface.co/microsoft/resnet-101) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.3785
21
+ - Accuracy: 0.8569
22
 
23
  ## Model description
24
 
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 9.8,
3
- "eval_accuracy": 0.7700980392156863,
4
- "eval_loss": 0.6762834191322327,
5
- "eval_runtime": 27.2812,
6
- "eval_samples_per_second": 74.777,
7
- "eval_steps_per_second": 2.346,
8
- "total_flos": 3.072509726495183e+18,
9
- "train_loss": 1.3191132202148437,
10
- "train_runtime": 2261.7516,
11
- "train_samples_per_second": 36.074,
12
- "train_steps_per_second": 0.111
13
  }
 
1
  {
2
+ "epoch": 15.0,
3
+ "eval_accuracy": 0.8568627450980392,
4
+ "eval_loss": 0.3784649968147278,
5
+ "eval_runtime": 25.0793,
6
+ "eval_samples_per_second": 81.342,
7
+ "eval_steps_per_second": 2.552,
8
+ "total_flos": 4.700892636385505e+18,
9
+ "train_loss": 0.7059793472290039,
10
+ "train_runtime": 3152.3203,
11
+ "train_samples_per_second": 38.824,
12
+ "train_steps_per_second": 0.081
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 9.8,
3
- "eval_accuracy": 0.7700980392156863,
4
- "eval_loss": 0.6762834191322327,
5
- "eval_runtime": 27.2812,
6
- "eval_samples_per_second": 74.777,
7
- "eval_steps_per_second": 2.346
8
  }
 
1
  {
2
+ "epoch": 15.0,
3
+ "eval_accuracy": 0.8568627450980392,
4
+ "eval_loss": 0.3784649968147278,
5
+ "eval_runtime": 25.0793,
6
+ "eval_samples_per_second": 81.342,
7
+ "eval_steps_per_second": 2.552
8
  }
runs/Jan25_03-08-49_173fbb9c3dc5/events.out.tfevents.1706155344.173fbb9c3dc5.3455.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e928d6d3f08ac14fc46e55c05215b33f65006a2e4178439b77125e41794eb08
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 9.8,
3
- "total_flos": 3.072509726495183e+18,
4
- "train_loss": 1.3191132202148437,
5
- "train_runtime": 2261.7516,
6
- "train_samples_per_second": 36.074,
7
- "train_steps_per_second": 0.111
8
  }
 
1
  {
2
+ "epoch": 15.0,
3
+ "total_flos": 4.700892636385505e+18,
4
+ "train_loss": 0.7059793472290039,
5
+ "train_runtime": 3152.3203,
6
+ "train_samples_per_second": 38.824,
7
+ "train_steps_per_second": 0.081
8
  }
trainer_state.json CHANGED
@@ -1,268 +1,265 @@
1
  {
2
- "best_metric": 0.7700980392156863,
3
- "best_model_checkpoint": "resnet-101-finetuned-CivilEng11k/checkpoint-229",
4
- "epoch": 9.803921568627452,
5
  "eval_steps": 500,
6
- "global_step": 250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.39,
13
- "learning_rate": 4e-05,
14
- "loss": 2.6157,
15
- "step": 10
16
  },
17
  {
18
- "epoch": 0.78,
19
- "learning_rate": 8e-05,
20
- "loss": 2.5769,
21
- "step": 20
 
 
 
22
  },
23
  {
24
- "epoch": 0.98,
25
- "eval_accuracy": 0.5269607843137255,
26
- "eval_loss": 2.49281907081604,
27
- "eval_runtime": 40.5904,
28
- "eval_samples_per_second": 50.258,
29
- "eval_steps_per_second": 1.577,
30
- "step": 25
31
- },
32
- {
33
- "epoch": 1.18,
34
- "learning_rate": 9.777777777777778e-05,
35
- "loss": 2.4933,
36
  "step": 30
37
  },
38
- {
39
- "epoch": 1.57,
40
- "learning_rate": 9.333333333333334e-05,
41
- "loss": 2.3726,
42
- "step": 40
43
- },
44
- {
45
- "epoch": 1.96,
46
- "learning_rate": 8.888888888888889e-05,
47
- "loss": 2.2271,
48
- "step": 50
49
- },
50
  {
51
  "epoch": 2.0,
52
- "eval_accuracy": 0.5284313725490196,
53
- "eval_loss": 2.184375047683716,
54
- "eval_runtime": 41.3607,
55
- "eval_samples_per_second": 49.322,
56
- "eval_steps_per_second": 1.547,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  "step": 51
58
  },
59
  {
60
- "epoch": 2.35,
61
- "learning_rate": 8.444444444444444e-05,
62
- "loss": 2.004,
63
  "step": 60
64
  },
65
  {
66
- "epoch": 2.75,
67
- "learning_rate": 8e-05,
68
- "loss": 1.6261,
69
- "step": 70
 
 
 
70
  },
71
  {
72
- "epoch": 2.98,
73
- "eval_accuracy": 0.5269607843137255,
74
- "eval_loss": 1.4098289012908936,
75
- "eval_runtime": 40.6734,
76
- "eval_samples_per_second": 50.156,
77
- "eval_steps_per_second": 1.574,
78
- "step": 76
79
  },
80
  {
81
- "epoch": 3.14,
82
- "learning_rate": 7.555555555555556e-05,
83
- "loss": 1.4818,
84
- "step": 80
 
 
 
85
  },
86
  {
87
- "epoch": 3.53,
88
- "learning_rate": 7.111111111111112e-05,
89
- "loss": 1.3531,
90
  "step": 90
91
  },
92
  {
93
- "epoch": 3.92,
94
- "learning_rate": 6.666666666666667e-05,
95
- "loss": 1.2715,
96
- "step": 100
97
- },
98
- {
99
- "epoch": 4.0,
100
- "eval_accuracy": 0.5799019607843138,
101
- "eval_loss": 1.204033613204956,
102
- "eval_runtime": 41.3797,
103
- "eval_samples_per_second": 49.3,
104
- "eval_steps_per_second": 1.547,
105
  "step": 102
106
  },
107
  {
108
- "epoch": 4.31,
109
- "learning_rate": 6.222222222222222e-05,
110
- "loss": 1.1843,
111
- "step": 110
112
  },
113
  {
114
- "epoch": 4.71,
115
- "learning_rate": 5.7777777777777776e-05,
116
- "loss": 1.1368,
117
- "step": 120
 
 
 
118
  },
119
  {
120
- "epoch": 4.98,
121
- "eval_accuracy": 0.6852941176470588,
122
- "eval_loss": 1.0043939352035522,
123
- "eval_runtime": 40.9737,
124
- "eval_samples_per_second": 49.788,
125
- "eval_steps_per_second": 1.562,
126
- "step": 127
127
  },
128
  {
129
- "epoch": 5.1,
130
- "learning_rate": 5.333333333333333e-05,
131
- "loss": 1.0742,
132
- "step": 130
133
  },
134
  {
135
- "epoch": 5.49,
136
- "learning_rate": 4.888888888888889e-05,
137
- "loss": 0.9825,
138
- "step": 140
 
 
 
139
  },
140
  {
141
- "epoch": 5.88,
142
- "learning_rate": 4.4444444444444447e-05,
143
- "loss": 0.9366,
144
  "step": 150
145
  },
146
  {
147
- "epoch": 6.0,
148
- "eval_accuracy": 0.7455882352941177,
149
- "eval_loss": 0.8462627530097961,
150
- "eval_runtime": 40.2496,
151
- "eval_samples_per_second": 50.684,
152
- "eval_steps_per_second": 1.59,
153
  "step": 153
154
  },
155
  {
156
- "epoch": 6.27,
157
- "learning_rate": 4e-05,
158
- "loss": 0.899,
159
- "step": 160
160
  },
161
  {
162
- "epoch": 6.67,
163
- "learning_rate": 3.555555555555556e-05,
164
- "loss": 0.8249,
 
 
 
165
  "step": 170
166
  },
167
  {
168
- "epoch": 6.98,
169
- "eval_accuracy": 0.7686274509803922,
170
- "eval_loss": 0.7511501908302307,
171
- "eval_runtime": 47.4571,
172
- "eval_samples_per_second": 42.986,
173
- "eval_steps_per_second": 1.349,
174
- "step": 178
175
- },
176
- {
177
- "epoch": 7.06,
178
- "learning_rate": 3.111111111111111e-05,
179
- "loss": 0.8197,
180
  "step": 180
181
  },
182
  {
183
- "epoch": 7.45,
184
- "learning_rate": 2.6666666666666667e-05,
185
- "loss": 0.7562,
186
- "step": 190
 
 
 
187
  },
188
  {
189
- "epoch": 7.84,
190
- "learning_rate": 2.2222222222222223e-05,
191
- "loss": 0.7635,
192
- "step": 200
193
  },
194
  {
195
- "epoch": 8.0,
196
- "eval_accuracy": 0.7612745098039215,
197
- "eval_loss": 0.7078944444656372,
198
- "eval_runtime": 40.9903,
199
- "eval_samples_per_second": 49.768,
200
- "eval_steps_per_second": 1.561,
201
  "step": 204
202
  },
203
  {
204
- "epoch": 8.24,
205
- "learning_rate": 1.777777777777778e-05,
206
- "loss": 0.7415,
207
  "step": 210
208
  },
209
  {
210
- "epoch": 8.63,
211
- "learning_rate": 1.3333333333333333e-05,
212
- "loss": 0.7213,
213
- "step": 220
 
 
 
214
  },
215
  {
216
- "epoch": 8.98,
217
- "eval_accuracy": 0.7700980392156863,
218
- "eval_loss": 0.6762834191322327,
219
- "eval_runtime": 40.8595,
220
- "eval_samples_per_second": 49.927,
221
- "eval_steps_per_second": 1.566,
222
- "step": 229
223
  },
224
  {
225
- "epoch": 9.02,
226
- "learning_rate": 8.88888888888889e-06,
227
- "loss": 0.6951,
228
- "step": 230
 
 
 
229
  },
230
  {
231
- "epoch": 9.41,
232
- "learning_rate": 4.444444444444445e-06,
233
- "loss": 0.7295,
234
  "step": 240
235
  },
236
  {
237
- "epoch": 9.8,
238
  "learning_rate": 0.0,
239
- "loss": 0.6905,
240
- "step": 250
241
- },
242
- {
243
- "epoch": 9.8,
244
- "eval_accuracy": 0.7676470588235295,
245
- "eval_loss": 0.6683045625686646,
246
- "eval_runtime": 39.5198,
247
- "eval_samples_per_second": 51.62,
248
- "eval_steps_per_second": 1.619,
249
- "step": 250
250
- },
251
- {
252
- "epoch": 9.8,
253
- "step": 250,
254
- "total_flos": 3.072509726495183e+18,
255
- "train_loss": 1.3191132202148437,
256
- "train_runtime": 2261.7516,
257
- "train_samples_per_second": 36.074,
258
- "train_steps_per_second": 0.111
259
  }
260
  ],
261
- "logging_steps": 10,
262
- "max_steps": 250,
263
- "num_train_epochs": 10,
264
  "save_steps": 500,
265
- "total_flos": 3.072509726495183e+18,
266
  "trial_name": null,
267
  "trial_params": null
268
  }
 
1
  {
2
+ "best_metric": 0.8568627450980392,
3
+ "best_model_checkpoint": "resnet-101-finetuned-CivilEng11k/checkpoint-238",
4
+ "epoch": 15.0,
5
  "eval_steps": 500,
6
+ "global_step": 255,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.88,
13
+ "learning_rate": 0.00017307692307692304,
14
+ "loss": 2.6258,
15
+ "step": 15
16
  },
17
  {
18
+ "epoch": 1.0,
19
+ "eval_accuracy": 0.5504901960784314,
20
+ "eval_loss": 2.5047667026519775,
21
+ "eval_runtime": 36.2965,
22
+ "eval_samples_per_second": 56.204,
23
+ "eval_steps_per_second": 1.763,
24
+ "step": 17
25
  },
26
  {
27
+ "epoch": 1.76,
28
+ "learning_rate": 0.0002947598253275109,
29
+ "loss": 2.2924,
 
 
 
 
 
 
 
 
 
30
  "step": 30
31
  },
 
 
 
 
 
 
 
 
 
 
 
 
32
  {
33
  "epoch": 2.0,
34
+ "eval_accuracy": 0.5274509803921569,
35
+ "eval_loss": 1.4727771282196045,
36
+ "eval_runtime": 37.3662,
37
+ "eval_samples_per_second": 54.595,
38
+ "eval_steps_per_second": 1.713,
39
+ "step": 34
40
+ },
41
+ {
42
+ "epoch": 2.65,
43
+ "learning_rate": 0.00027510917030567684,
44
+ "loss": 1.452,
45
+ "step": 45
46
+ },
47
+ {
48
+ "epoch": 3.0,
49
+ "eval_accuracy": 0.6950980392156862,
50
+ "eval_loss": 1.0708895921707153,
51
+ "eval_runtime": 36.9842,
52
+ "eval_samples_per_second": 55.159,
53
+ "eval_steps_per_second": 1.73,
54
  "step": 51
55
  },
56
  {
57
+ "epoch": 3.53,
58
+ "learning_rate": 0.0002554585152838428,
59
+ "loss": 1.0363,
60
  "step": 60
61
  },
62
  {
63
+ "epoch": 4.0,
64
+ "eval_accuracy": 0.7710784313725491,
65
+ "eval_loss": 0.6555339694023132,
66
+ "eval_runtime": 36.72,
67
+ "eval_samples_per_second": 55.556,
68
+ "eval_steps_per_second": 1.743,
69
+ "step": 68
70
  },
71
  {
72
+ "epoch": 4.41,
73
+ "learning_rate": 0.0002358078602620087,
74
+ "loss": 0.7086,
75
+ "step": 75
 
 
 
76
  },
77
  {
78
+ "epoch": 5.0,
79
+ "eval_accuracy": 0.8122549019607843,
80
+ "eval_loss": 0.4875487685203552,
81
+ "eval_runtime": 37.4307,
82
+ "eval_samples_per_second": 54.501,
83
+ "eval_steps_per_second": 1.71,
84
+ "step": 85
85
  },
86
  {
87
+ "epoch": 5.29,
88
+ "learning_rate": 0.00021615720524017465,
89
+ "loss": 0.5185,
90
  "step": 90
91
  },
92
  {
93
+ "epoch": 6.0,
94
+ "eval_accuracy": 0.8357843137254902,
95
+ "eval_loss": 0.43364840745925903,
96
+ "eval_runtime": 37.5452,
97
+ "eval_samples_per_second": 54.334,
98
+ "eval_steps_per_second": 1.705,
 
 
 
 
 
 
99
  "step": 102
100
  },
101
  {
102
+ "epoch": 6.18,
103
+ "learning_rate": 0.00019650655021834058,
104
+ "loss": 0.4238,
105
+ "step": 105
106
  },
107
  {
108
+ "epoch": 7.0,
109
+ "eval_accuracy": 0.8509803921568627,
110
+ "eval_loss": 0.3962140381336212,
111
+ "eval_runtime": 39.9756,
112
+ "eval_samples_per_second": 51.031,
113
+ "eval_steps_per_second": 1.601,
114
+ "step": 119
115
  },
116
  {
117
+ "epoch": 7.06,
118
+ "learning_rate": 0.00017685589519650654,
119
+ "loss": 0.3846,
120
+ "step": 120
 
 
 
121
  },
122
  {
123
+ "epoch": 7.94,
124
+ "learning_rate": 0.00015720524017467246,
125
+ "loss": 0.3436,
126
+ "step": 135
127
  },
128
  {
129
+ "epoch": 8.0,
130
+ "eval_accuracy": 0.8514705882352941,
131
+ "eval_loss": 0.3823707103729248,
132
+ "eval_runtime": 40.0175,
133
+ "eval_samples_per_second": 50.978,
134
+ "eval_steps_per_second": 1.599,
135
+ "step": 136
136
  },
137
  {
138
+ "epoch": 8.82,
139
+ "learning_rate": 0.00013755458515283842,
140
+ "loss": 0.3185,
141
  "step": 150
142
  },
143
  {
144
+ "epoch": 9.0,
145
+ "eval_accuracy": 0.8514705882352941,
146
+ "eval_loss": 0.38265544176101685,
147
+ "eval_runtime": 39.6707,
148
+ "eval_samples_per_second": 51.423,
149
+ "eval_steps_per_second": 1.613,
150
  "step": 153
151
  },
152
  {
153
+ "epoch": 9.71,
154
+ "learning_rate": 0.00011790393013100435,
155
+ "loss": 0.3116,
156
+ "step": 165
157
  },
158
  {
159
+ "epoch": 10.0,
160
+ "eval_accuracy": 0.8534313725490196,
161
+ "eval_loss": 0.37894687056541443,
162
+ "eval_runtime": 38.7692,
163
+ "eval_samples_per_second": 52.619,
164
+ "eval_steps_per_second": 1.651,
165
  "step": 170
166
  },
167
  {
168
+ "epoch": 10.59,
169
+ "learning_rate": 9.825327510917029e-05,
170
+ "loss": 0.2983,
 
 
 
 
 
 
 
 
 
171
  "step": 180
172
  },
173
  {
174
+ "epoch": 11.0,
175
+ "eval_accuracy": 0.8558823529411764,
176
+ "eval_loss": 0.3759206235408783,
177
+ "eval_runtime": 38.4006,
178
+ "eval_samples_per_second": 53.124,
179
+ "eval_steps_per_second": 1.667,
180
+ "step": 187
181
  },
182
  {
183
+ "epoch": 11.47,
184
+ "learning_rate": 7.860262008733623e-05,
185
+ "loss": 0.2703,
186
+ "step": 195
187
  },
188
  {
189
+ "epoch": 12.0,
190
+ "eval_accuracy": 0.8480392156862745,
191
+ "eval_loss": 0.3838962912559509,
192
+ "eval_runtime": 38.2843,
193
+ "eval_samples_per_second": 53.286,
194
+ "eval_steps_per_second": 1.672,
195
  "step": 204
196
  },
197
  {
198
+ "epoch": 12.35,
199
+ "learning_rate": 5.8951965065502174e-05,
200
+ "loss": 0.2618,
201
  "step": 210
202
  },
203
  {
204
+ "epoch": 13.0,
205
+ "eval_accuracy": 0.8539215686274509,
206
+ "eval_loss": 0.38307902216911316,
207
+ "eval_runtime": 38.0757,
208
+ "eval_samples_per_second": 53.577,
209
+ "eval_steps_per_second": 1.681,
210
+ "step": 221
211
  },
212
  {
213
+ "epoch": 13.24,
214
+ "learning_rate": 3.9301310043668116e-05,
215
+ "loss": 0.2613,
216
+ "step": 225
 
 
 
217
  },
218
  {
219
+ "epoch": 14.0,
220
+ "eval_accuracy": 0.8568627450980392,
221
+ "eval_loss": 0.3784649968147278,
222
+ "eval_runtime": 38.1613,
223
+ "eval_samples_per_second": 53.457,
224
+ "eval_steps_per_second": 1.677,
225
+ "step": 238
226
  },
227
  {
228
+ "epoch": 14.12,
229
+ "learning_rate": 1.9650655021834058e-05,
230
+ "loss": 0.2514,
231
  "step": 240
232
  },
233
  {
234
+ "epoch": 15.0,
235
  "learning_rate": 0.0,
236
+ "loss": 0.2428,
237
+ "step": 255
238
+ },
239
+ {
240
+ "epoch": 15.0,
241
+ "eval_accuracy": 0.8470588235294118,
242
+ "eval_loss": 0.39441215991973877,
243
+ "eval_runtime": 38.4101,
244
+ "eval_samples_per_second": 53.111,
245
+ "eval_steps_per_second": 1.666,
246
+ "step": 255
247
+ },
248
+ {
249
+ "epoch": 15.0,
250
+ "step": 255,
251
+ "total_flos": 4.700892636385505e+18,
252
+ "train_loss": 0.7059793472290039,
253
+ "train_runtime": 3152.3203,
254
+ "train_samples_per_second": 38.824,
255
+ "train_steps_per_second": 0.081
256
  }
257
  ],
258
+ "logging_steps": 15,
259
+ "max_steps": 255,
260
+ "num_train_epochs": 15,
261
  "save_steps": 500,
262
+ "total_flos": 4.700892636385505e+18,
263
  "trial_name": null,
264
  "trial_params": null
265
  }