anurag629 committed on
Commit
e135060
1 Parent(s): aa46f07

End of training

Browse files
all_results.json CHANGED
@@ -1,8 +1,13 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 1.232080345041961e+17,
4
- "train_loss": 2.0565889065082255,
5
- "train_runtime": 193.8332,
6
- "train_samples_per_second": 25.553,
7
- "train_steps_per_second": 0.201
 
 
 
 
 
8
  }
 
1
  {
2
+ "epoch": 15.0,
3
+ "eval_accuracy": 1.0,
4
+ "eval_loss": 0.01327650435268879,
5
+ "eval_runtime": 4.8947,
6
+ "eval_samples_per_second": 37.592,
7
+ "eval_steps_per_second": 1.226,
8
+ "total_flos": 6.160401725209805e+17,
9
+ "train_loss": 0.1391575378485215,
10
+ "train_runtime": 1009.255,
11
+ "train_samples_per_second": 24.538,
12
+ "train_steps_per_second": 0.193
13
  }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 15.0,
3
+ "eval_accuracy": 1.0,
4
+ "eval_loss": 0.01327650435268879,
5
+ "eval_runtime": 4.8947,
6
+ "eval_samples_per_second": 37.592,
7
+ "eval_steps_per_second": 1.226
8
+ }
runs/Sep15_16-08-50_0e9448f70cc0/events.out.tfevents.1694795267.0e9448f70cc0.5168.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:727e4e90d3fcb55d9b625fe7acb0712069ce68a06cb2de14d45356f1433f565b
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 1.232080345041961e+17,
4
- "train_loss": 2.0565889065082255,
5
- "train_runtime": 193.8332,
6
- "train_samples_per_second": 25.553,
7
- "train_steps_per_second": 0.201
8
  }
 
1
  {
2
+ "epoch": 15.0,
3
+ "total_flos": 6.160401725209805e+17,
4
+ "train_loss": 0.1391575378485215,
5
+ "train_runtime": 1009.255,
6
+ "train_samples_per_second": 24.538,
7
+ "train_steps_per_second": 0.193
8
  }
trainer_state.json CHANGED
@@ -1,70 +1,274 @@
1
  {
2
- "best_metric": 0.8641304347826086,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-39",
4
- "epoch": 3.0,
5
- "global_step": 39,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.77,
12
- "learning_rate": 4.1428571428571437e-05,
13
- "loss": 3.2618,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 1.0,
18
- "eval_accuracy": 0.483695652173913,
19
- "eval_loss": 2.5475988388061523,
20
- "eval_runtime": 5.3667,
21
- "eval_samples_per_second": 34.285,
22
- "eval_steps_per_second": 1.118,
23
  "step": 13
24
  },
25
  {
26
  "epoch": 1.54,
27
- "learning_rate": 2.714285714285714e-05,
28
- "loss": 2.4064,
29
  "step": 20
30
  },
31
  {
32
  "epoch": 2.0,
33
- "eval_accuracy": 0.7445652173913043,
34
- "eval_loss": 1.3322842121124268,
35
- "eval_runtime": 5.3179,
36
- "eval_samples_per_second": 34.6,
37
- "eval_steps_per_second": 1.128,
38
  "step": 26
39
  },
40
  {
41
  "epoch": 2.31,
42
- "learning_rate": 1.2857142857142857e-05,
43
- "loss": 1.4499,
44
  "step": 30
45
  },
46
  {
47
  "epoch": 3.0,
48
- "eval_accuracy": 0.8641304347826086,
49
- "eval_loss": 0.9030408263206482,
50
- "eval_runtime": 4.6219,
51
- "eval_samples_per_second": 39.81,
52
- "eval_steps_per_second": 1.298,
53
  "step": 39
54
  },
55
  {
56
- "epoch": 3.0,
57
- "step": 39,
58
- "total_flos": 1.232080345041961e+17,
59
- "train_loss": 2.0565889065082255,
60
- "train_runtime": 193.8332,
61
- "train_samples_per_second": 25.553,
62
- "train_steps_per_second": 0.201
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  }
64
  ],
65
- "max_steps": 39,
66
- "num_train_epochs": 3,
67
- "total_flos": 1.232080345041961e+17,
68
  "trial_name": null,
69
  "trial_params": null
70
  }
 
1
  {
2
+ "best_metric": 1.0,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-91",
4
+ "epoch": 15.0,
5
+ "global_step": 195,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.77,
12
+ "learning_rate": 2.5e-05,
13
+ "loss": 0.8235,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 1.0,
18
+ "eval_accuracy": 0.9239130434782609,
19
+ "eval_loss": 0.6033865213394165,
20
+ "eval_runtime": 4.2784,
21
+ "eval_samples_per_second": 43.007,
22
+ "eval_steps_per_second": 1.402,
23
  "step": 13
24
  },
25
  {
26
  "epoch": 1.54,
27
+ "learning_rate": 5e-05,
28
+ "loss": 0.5091,
29
  "step": 20
30
  },
31
  {
32
  "epoch": 2.0,
33
+ "eval_accuracy": 0.9728260869565217,
34
+ "eval_loss": 0.1870061606168747,
35
+ "eval_runtime": 5.3886,
36
+ "eval_samples_per_second": 34.146,
37
+ "eval_steps_per_second": 1.113,
38
  "step": 26
39
  },
40
  {
41
  "epoch": 2.31,
42
+ "learning_rate": 4.714285714285714e-05,
43
+ "loss": 0.273,
44
  "step": 30
45
  },
46
  {
47
  "epoch": 3.0,
48
+ "eval_accuracy": 0.9945652173913043,
49
+ "eval_loss": 0.08950551599264145,
50
+ "eval_runtime": 4.1088,
51
+ "eval_samples_per_second": 44.782,
52
+ "eval_steps_per_second": 1.46,
53
  "step": 39
54
  },
55
  {
56
+ "epoch": 3.08,
57
+ "learning_rate": 4.428571428571428e-05,
58
+ "loss": 0.1833,
59
+ "step": 40
60
+ },
61
+ {
62
+ "epoch": 3.85,
63
+ "learning_rate": 4.1428571428571437e-05,
64
+ "loss": 0.1401,
65
+ "step": 50
66
+ },
67
+ {
68
+ "epoch": 4.0,
69
+ "eval_accuracy": 0.9945652173913043,
70
+ "eval_loss": 0.054347552359104156,
71
+ "eval_runtime": 4.17,
72
+ "eval_samples_per_second": 44.125,
73
+ "eval_steps_per_second": 1.439,
74
+ "step": 52
75
+ },
76
+ {
77
+ "epoch": 4.62,
78
+ "learning_rate": 3.857142857142858e-05,
79
+ "loss": 0.0936,
80
+ "step": 60
81
+ },
82
+ {
83
+ "epoch": 5.0,
84
+ "eval_accuracy": 0.9891304347826086,
85
+ "eval_loss": 0.04841860011219978,
86
+ "eval_runtime": 4.1427,
87
+ "eval_samples_per_second": 44.416,
88
+ "eval_steps_per_second": 1.448,
89
+ "step": 65
90
+ },
91
+ {
92
+ "epoch": 5.38,
93
+ "learning_rate": 3.571428571428572e-05,
94
+ "loss": 0.091,
95
+ "step": 70
96
+ },
97
+ {
98
+ "epoch": 6.0,
99
+ "eval_accuracy": 0.9891304347826086,
100
+ "eval_loss": 0.04977855086326599,
101
+ "eval_runtime": 4.8364,
102
+ "eval_samples_per_second": 38.045,
103
+ "eval_steps_per_second": 1.241,
104
+ "step": 78
105
+ },
106
+ {
107
+ "epoch": 6.15,
108
+ "learning_rate": 3.285714285714286e-05,
109
+ "loss": 0.0664,
110
+ "step": 80
111
+ },
112
+ {
113
+ "epoch": 6.92,
114
+ "learning_rate": 3e-05,
115
+ "loss": 0.0603,
116
+ "step": 90
117
+ },
118
+ {
119
+ "epoch": 7.0,
120
+ "eval_accuracy": 1.0,
121
+ "eval_loss": 0.01327650435268879,
122
+ "eval_runtime": 5.4357,
123
+ "eval_samples_per_second": 33.85,
124
+ "eval_steps_per_second": 1.104,
125
+ "step": 91
126
+ },
127
+ {
128
+ "epoch": 7.69,
129
+ "learning_rate": 2.714285714285714e-05,
130
+ "loss": 0.0421,
131
+ "step": 100
132
+ },
133
+ {
134
+ "epoch": 8.0,
135
+ "eval_accuracy": 0.9945652173913043,
136
+ "eval_loss": 0.019574709236621857,
137
+ "eval_runtime": 5.3751,
138
+ "eval_samples_per_second": 34.232,
139
+ "eval_steps_per_second": 1.116,
140
+ "step": 104
141
+ },
142
+ {
143
+ "epoch": 8.46,
144
+ "learning_rate": 2.4285714285714288e-05,
145
+ "loss": 0.0557,
146
+ "step": 110
147
+ },
148
+ {
149
+ "epoch": 9.0,
150
+ "eval_accuracy": 0.9945652173913043,
151
+ "eval_loss": 0.01723380759358406,
152
+ "eval_runtime": 5.3966,
153
+ "eval_samples_per_second": 34.096,
154
+ "eval_steps_per_second": 1.112,
155
+ "step": 117
156
+ },
157
+ {
158
+ "epoch": 9.23,
159
+ "learning_rate": 2.1428571428571428e-05,
160
+ "loss": 0.0646,
161
+ "step": 120
162
+ },
163
+ {
164
+ "epoch": 10.0,
165
+ "learning_rate": 1.8571428571428572e-05,
166
+ "loss": 0.0552,
167
+ "step": 130
168
+ },
169
+ {
170
+ "epoch": 10.0,
171
+ "eval_accuracy": 1.0,
172
+ "eval_loss": 0.010338729247450829,
173
+ "eval_runtime": 5.2174,
174
+ "eval_samples_per_second": 35.267,
175
+ "eval_steps_per_second": 1.15,
176
+ "step": 130
177
+ },
178
+ {
179
+ "epoch": 10.77,
180
+ "learning_rate": 1.5714285714285715e-05,
181
+ "loss": 0.045,
182
+ "step": 140
183
+ },
184
+ {
185
+ "epoch": 11.0,
186
+ "eval_accuracy": 1.0,
187
+ "eval_loss": 0.00823963712900877,
188
+ "eval_runtime": 4.9659,
189
+ "eval_samples_per_second": 37.052,
190
+ "eval_steps_per_second": 1.208,
191
+ "step": 143
192
+ },
193
+ {
194
+ "epoch": 11.54,
195
+ "learning_rate": 1.2857142857142857e-05,
196
+ "loss": 0.0355,
197
+ "step": 150
198
+ },
199
+ {
200
+ "epoch": 12.0,
201
+ "eval_accuracy": 1.0,
202
+ "eval_loss": 0.007135531399399042,
203
+ "eval_runtime": 5.3254,
204
+ "eval_samples_per_second": 34.551,
205
+ "eval_steps_per_second": 1.127,
206
+ "step": 156
207
+ },
208
+ {
209
+ "epoch": 12.31,
210
+ "learning_rate": 1e-05,
211
+ "loss": 0.0491,
212
+ "step": 160
213
+ },
214
+ {
215
+ "epoch": 13.0,
216
+ "eval_accuracy": 1.0,
217
+ "eval_loss": 0.008664855733513832,
218
+ "eval_runtime": 4.2336,
219
+ "eval_samples_per_second": 43.462,
220
+ "eval_steps_per_second": 1.417,
221
+ "step": 169
222
+ },
223
+ {
224
+ "epoch": 13.08,
225
+ "learning_rate": 7.142857142857143e-06,
226
+ "loss": 0.0395,
227
+ "step": 170
228
+ },
229
+ {
230
+ "epoch": 13.85,
231
+ "learning_rate": 4.285714285714286e-06,
232
+ "loss": 0.0384,
233
+ "step": 180
234
+ },
235
+ {
236
+ "epoch": 14.0,
237
+ "eval_accuracy": 1.0,
238
+ "eval_loss": 0.006527730729430914,
239
+ "eval_runtime": 4.2794,
240
+ "eval_samples_per_second": 42.997,
241
+ "eval_steps_per_second": 1.402,
242
+ "step": 182
243
+ },
244
+ {
245
+ "epoch": 14.62,
246
+ "learning_rate": 1.4285714285714286e-06,
247
+ "loss": 0.0324,
248
+ "step": 190
249
+ },
250
+ {
251
+ "epoch": 15.0,
252
+ "eval_accuracy": 1.0,
253
+ "eval_loss": 0.006102540995925665,
254
+ "eval_runtime": 4.1839,
255
+ "eval_samples_per_second": 43.978,
256
+ "eval_steps_per_second": 1.434,
257
+ "step": 195
258
+ },
259
+ {
260
+ "epoch": 15.0,
261
+ "step": 195,
262
+ "total_flos": 6.160401725209805e+17,
263
+ "train_loss": 0.1391575378485215,
264
+ "train_runtime": 1009.255,
265
+ "train_samples_per_second": 24.538,
266
+ "train_steps_per_second": 0.193
267
  }
268
  ],
269
+ "max_steps": 195,
270
+ "num_train_epochs": 15,
271
+ "total_flos": 6.160401725209805e+17,
272
  "trial_name": null,
273
  "trial_params": null
274
  }