marinone94 committed on
Commit
30cd992
•
1 Parent(s): 287246d

Training in progress, step 200

Browse files
checkpoint-10/trainer_state.json DELETED
@@ -1,94 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 0.029006526468455404,
5
- "global_step": 10,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.0,
12
- "learning_rate": 3.75e-06,
13
- "loss": 13.605,
14
- "step": 1
15
- },
16
- {
17
- "epoch": 0.01,
18
- "learning_rate": 7.5e-06,
19
- "loss": 11.0063,
20
- "step": 2
21
- },
22
- {
23
- "epoch": 0.01,
24
- "learning_rate": 1.1249999999999999e-05,
25
- "loss": 11.6693,
26
- "step": 3
27
- },
28
- {
29
- "epoch": 0.01,
30
- "learning_rate": 1.5e-05,
31
- "loss": 13.432,
32
- "step": 4
33
- },
34
- {
35
- "epoch": 0.01,
36
- "learning_rate": 1.875e-05,
37
- "loss": 10.3458,
38
- "step": 5
39
- },
40
- {
41
- "epoch": 0.01,
42
- "eval_loss": 15.09913444519043,
43
- "eval_runtime": 139.8551,
44
- "eval_samples_per_second": 33.034,
45
- "eval_steps_per_second": 4.133,
46
- "eval_wer": 1.0,
47
- "step": 5
48
- },
49
- {
50
- "epoch": 0.02,
51
- "learning_rate": 2.2499999999999998e-05,
52
- "loss": 15.2451,
53
- "step": 6
54
- },
55
- {
56
- "epoch": 0.02,
57
- "learning_rate": 2.625e-05,
58
- "loss": 10.0481,
59
- "step": 7
60
- },
61
- {
62
- "epoch": 0.02,
63
- "learning_rate": 3e-05,
64
- "loss": 12.3838,
65
- "step": 8
66
- },
67
- {
68
- "epoch": 0.03,
69
- "learning_rate": 3.3749999999999994e-05,
70
- "loss": 11.9858,
71
- "step": 9
72
- },
73
- {
74
- "epoch": 0.03,
75
- "learning_rate": 3.75e-05,
76
- "loss": 11.9029,
77
- "step": 10
78
- },
79
- {
80
- "epoch": 0.03,
81
- "eval_loss": 14.213573455810547,
82
- "eval_runtime": 160.2552,
83
- "eval_samples_per_second": 28.829,
84
- "eval_steps_per_second": 3.607,
85
- "eval_wer": 1.0,
86
- "step": 10
87
- }
88
- ],
89
- "max_steps": 10,
90
- "num_train_epochs": 1,
91
- "total_flos": 4.405923604988928e+16,
92
- "trial_name": null,
93
- "trial_params": null
94
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
{checkpoint-10 → checkpoint-200}/config.json RENAMED
File without changes
{checkpoint-10 → checkpoint-200}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edcb67a936a475709d3e3723b7e3224e64b185948f313f11f94438218cf2c5b2
3
  size 2490361937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1202a5092b4eef4129f21d94d892672eedd0f405c7b97384c527938ad263ff2
3
  size 2490361937
{checkpoint-10 → checkpoint-200}/preprocessor_config.json RENAMED
File without changes
{checkpoint-10 → checkpoint-200}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd61f5511562b14319e58a1b70c496d7e20b55df954b4ca337e122de41cab04e
3
  size 1262075377
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81a809773f4c41661a588636b358c9e5380d7596cf519d3864f59d078d6b5d56
3
  size 1262075377
{checkpoint-10 → checkpoint-200}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8bd055f4e5c4ffd4371a3565bfa995a6c8cb41314bc604e8debedf999343a113
3
  size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aac8c2cbd9ad36e5da5c9bde6c85c2a957009b424972b91ca2f61d198a65abaf
3
  size 14567
{checkpoint-10 → checkpoint-200}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20e4b012b4b9ab1daa876390beea4afff370d4f83e20e939f16cdf1855daf52f
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:456d3f8c3511ae0b0f0b3bf14cf84027d3dd6e2dd5258c9c8a92b9132d6ccfef
3
  size 559
{checkpoint-10 → checkpoint-200}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6e3ad42da29f9983fc79cb4c120fb5415e138f4bb390c579ef4600450de045a
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efd672a046efb6eb5df47d5237a07689c59887dac098586f96bf610f5cf17f77
3
  size 623
checkpoint-200/trainer_state.json ADDED
@@ -0,0 +1,172 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 0.580130529369108,
5
+ "global_step": 200,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.03,
12
+ "learning_rate": 3.75e-05,
13
+ "loss": 12.1562,
14
+ "step": 10
15
+ },
16
+ {
17
+ "epoch": 0.06,
18
+ "learning_rate": 7.125e-05,
19
+ "loss": 8.7679,
20
+ "step": 20
21
+ },
22
+ {
23
+ "epoch": 0.09,
24
+ "learning_rate": 7.398952095808383e-05,
25
+ "loss": 5.3683,
26
+ "step": 30
27
+ },
28
+ {
29
+ "epoch": 0.12,
30
+ "learning_rate": 7.286676646706586e-05,
31
+ "loss": 4.3219,
32
+ "step": 40
33
+ },
34
+ {
35
+ "epoch": 0.15,
36
+ "learning_rate": 7.17440119760479e-05,
37
+ "loss": 3.7182,
38
+ "step": 50
39
+ },
40
+ {
41
+ "epoch": 0.15,
42
+ "eval_loss": 3.836604595184326,
43
+ "eval_runtime": 133.4846,
44
+ "eval_samples_per_second": 34.611,
45
+ "eval_steps_per_second": 4.33,
46
+ "eval_wer": 1.0,
47
+ "step": 50
48
+ },
49
+ {
50
+ "epoch": 0.17,
51
+ "learning_rate": 7.062125748502993e-05,
52
+ "loss": 3.478,
53
+ "step": 60
54
+ },
55
+ {
56
+ "epoch": 0.2,
57
+ "learning_rate": 6.949850299401197e-05,
58
+ "loss": 3.4492,
59
+ "step": 70
60
+ },
61
+ {
62
+ "epoch": 0.23,
63
+ "learning_rate": 6.837574850299401e-05,
64
+ "loss": 3.3928,
65
+ "step": 80
66
+ },
67
+ {
68
+ "epoch": 0.26,
69
+ "learning_rate": 6.725299401197604e-05,
70
+ "loss": 3.3183,
71
+ "step": 90
72
+ },
73
+ {
74
+ "epoch": 0.29,
75
+ "learning_rate": 6.613023952095809e-05,
76
+ "loss": 3.2075,
77
+ "step": 100
78
+ },
79
+ {
80
+ "epoch": 0.29,
81
+ "eval_loss": 3.258362293243408,
82
+ "eval_runtime": 126.6078,
83
+ "eval_samples_per_second": 36.491,
84
+ "eval_steps_per_second": 4.565,
85
+ "eval_wer": 1.0,
86
+ "step": 100
87
+ },
88
+ {
89
+ "epoch": 0.32,
90
+ "learning_rate": 6.500748502994012e-05,
91
+ "loss": 3.14,
92
+ "step": 110
93
+ },
94
+ {
95
+ "epoch": 0.35,
96
+ "learning_rate": 6.388473053892215e-05,
97
+ "loss": 3.1281,
98
+ "step": 120
99
+ },
100
+ {
101
+ "epoch": 0.38,
102
+ "learning_rate": 6.276197604790418e-05,
103
+ "loss": 3.0987,
104
+ "step": 130
105
+ },
106
+ {
107
+ "epoch": 0.41,
108
+ "learning_rate": 6.163922155688622e-05,
109
+ "loss": 3.1003,
110
+ "step": 140
111
+ },
112
+ {
113
+ "epoch": 0.44,
114
+ "learning_rate": 6.0516467065868256e-05,
115
+ "loss": 3.0922,
116
+ "step": 150
117
+ },
118
+ {
119
+ "epoch": 0.44,
120
+ "eval_loss": 3.127869129180908,
121
+ "eval_runtime": 126.3837,
122
+ "eval_samples_per_second": 36.555,
123
+ "eval_steps_per_second": 4.573,
124
+ "eval_wer": 1.0,
125
+ "step": 150
126
+ },
127
+ {
128
+ "epoch": 0.46,
129
+ "learning_rate": 5.9393712574850293e-05,
130
+ "loss": 3.0588,
131
+ "step": 160
132
+ },
133
+ {
134
+ "epoch": 0.49,
135
+ "learning_rate": 5.827095808383233e-05,
136
+ "loss": 3.0477,
137
+ "step": 170
138
+ },
139
+ {
140
+ "epoch": 0.52,
141
+ "learning_rate": 5.714820359281436e-05,
142
+ "loss": 3.045,
143
+ "step": 180
144
+ },
145
+ {
146
+ "epoch": 0.55,
147
+ "learning_rate": 5.602544910179641e-05,
148
+ "loss": 3.0439,
149
+ "step": 190
150
+ },
151
+ {
152
+ "epoch": 0.58,
153
+ "learning_rate": 5.490269461077844e-05,
154
+ "loss": 3.0846,
155
+ "step": 200
156
+ },
157
+ {
158
+ "epoch": 0.58,
159
+ "eval_loss": 3.079519271850586,
160
+ "eval_runtime": 125.7215,
161
+ "eval_samples_per_second": 36.748,
162
+ "eval_steps_per_second": 4.597,
163
+ "eval_wer": 1.0,
164
+ "step": 200
165
+ }
166
+ ],
167
+ "max_steps": 688,
168
+ "num_train_epochs": 2,
169
+ "total_flos": 5.906333355279667e+17,
170
+ "trial_name": null,
171
+ "trial_params": null
172
+ }
{checkpoint-10 → checkpoint-200}/training_args.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0148471a0b194f620865125fd17f84a2e502a9e0a6acef5304251538d67e034
3
  size 2991
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77806a16ec6ef209c8a5c1c085159a0bc8e45c23f2d143f2c13e01527f13b5b2
3
  size 2991
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:386439db8a06ec7bb8279d96099b6db5fee78683933dd8e79efdb684fee3e2c0
3
  size 1262075377
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81a809773f4c41661a588636b358c9e5380d7596cf519d3864f59d078d6b5d56
3
  size 1262075377