hanasim committed on
Commit
a3a68ac
1 Parent(s): 074ccb8

End of training

Browse files
README.md CHANGED
@@ -1,39 +1,42 @@
1
  ---
 
 
2
  license: apache-2.0
3
  base_model: openai/whisper-base
4
  tags:
 
5
  - generated_from_trainer
6
  datasets:
7
- - common_voice_16_0
8
  metrics:
9
  - wer
10
  model-index:
11
- - name: breeze-listen-dsw-base-te
12
  results:
13
  - task:
14
  name: Automatic Speech Recognition
15
  type: automatic-speech-recognition
16
  dataset:
17
- name: common_voice_16_0
18
- type: common_voice_16_0
19
  config: te
20
  split: test
21
  args: te
22
  metrics:
23
  - name: Wer
24
  type: wer
25
- value: 3.3333333333333335
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
29
  should probably proofread and complete it, then remove this comment. -->
30
 
31
- # breeze-listen-dsw-base-te
32
 
33
- This model is a fine-tuned version of [openai/whisper-base](https://huggingface.co/openai/whisper-base) on the common_voice_16_0 dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.0546
36
- - Wer: 3.3333
37
 
38
  ## Model description
39
 
 
1
  ---
2
+ language:
3
+ - te
4
  license: apache-2.0
5
  base_model: openai/whisper-base
6
  tags:
7
+ - whisper-event
8
  - generated_from_trainer
9
  datasets:
10
+ - mozilla-foundation/common_voice_16_0
11
  metrics:
12
  - wer
13
  model-index:
14
+ - name: Breeze DSW Telugu - base
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
18
  type: automatic-speech-recognition
19
  dataset:
20
+ name: mozilla-foundation/common_voice_16_0 te
21
+ type: mozilla-foundation/common_voice_16_0
22
  config: te
23
  split: test
24
  args: te
25
  metrics:
26
  - name: Wer
27
  type: wer
28
+ value: 85.71428571428571
29
  ---
30
 
31
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
32
  should probably proofread and complete it, then remove this comment. -->
33
 
34
+ # Breeze DSW Telugu - base
35
 
36
+ This model is a fine-tuned version of [openai/whisper-base](https://huggingface.co/openai/whisper-base) on the mozilla-foundation/common_voice_16_0 te dataset.
37
  It achieves the following results on the evaluation set:
38
+ - Loss: 2.1055
39
+ - Wer: 85.7143
40
 
41
  ## Model description
42
 
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 199.0,
3
- "eval_loss": 2.046875,
4
- "eval_runtime": 52.5501,
5
- "eval_samples_per_second": 0.514,
6
- "eval_steps_per_second": 0.038,
7
- "eval_wer": 89.28571428571429,
8
  "train_loss": 0.0,
9
- "train_runtime": 28.0812,
10
- "train_samples_per_second": 2279.101,
11
- "train_steps_per_second": 71.222
12
  }
 
1
  {
2
+ "epoch": 99.0,
3
+ "eval_loss": 2.10546875,
4
+ "eval_runtime": 58.8742,
5
+ "eval_samples_per_second": 0.459,
6
+ "eval_steps_per_second": 0.034,
7
+ "eval_wer": 85.71428571428571,
8
  "train_loss": 0.0,
9
+ "train_runtime": 2.6625,
10
+ "train_samples_per_second": 24037.247,
11
+ "train_steps_per_second": 751.164
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 199.0,
3
- "eval_loss": 2.046875,
4
- "eval_runtime": 52.5501,
5
- "eval_samples_per_second": 0.514,
6
- "eval_steps_per_second": 0.038,
7
- "eval_wer": 89.28571428571429
8
  }
 
1
  {
2
+ "epoch": 99.0,
3
+ "eval_loss": 2.10546875,
4
+ "eval_runtime": 58.8742,
5
+ "eval_samples_per_second": 0.459,
6
+ "eval_steps_per_second": 0.034,
7
+ "eval_wer": 85.71428571428571
8
  }
runs/Jan21_12-33-49_knight/events.out.tfevents.1705836917.knight.61506.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b4f40e2575333e5b790555d99491ca3133f32a11059ef86ad92e2d5aa2ba8be
3
+ size 406
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 199.0,
3
  "train_loss": 0.0,
4
- "train_runtime": 28.0812,
5
- "train_samples_per_second": 2279.101,
6
- "train_steps_per_second": 71.222
7
  }
 
1
  {
2
+ "epoch": 99.0,
3
  "train_loss": 0.0,
4
+ "train_runtime": 2.6625,
5
+ "train_samples_per_second": 24037.247,
6
+ "train_steps_per_second": 751.164
7
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 89.28571428571429,
3
  "best_model_checkpoint": "/cosmos/home/sp-operator/ai/training/models/huggingface/scripts/../breeze-listen-dsw-base-te/checkpoint-200",
4
- "epoch": 199.001,
5
  "eval_steps": 200,
6
- "global_step": 400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -11,125 +11,68 @@
11
  {
12
  "epoch": 12.0,
13
  "learning_rate": 4.973833272194737e-06,
14
- "loss": 1.7314,
15
  "step": 25
16
  },
17
  {
18
  "epoch": 24.0,
19
  "learning_rate": 6.195318418690893e-06,
20
- "loss": 1.0852,
21
  "step": 50
22
  },
23
  {
24
  "epoch": 37.0,
25
  "learning_rate": 6.881634451095711e-06,
26
- "loss": 0.4273,
27
  "step": 75
28
  },
29
  {
30
  "epoch": 49.0,
31
  "learning_rate": 7.361221988663844e-06,
32
- "loss": 0.0907,
33
  "step": 100
34
  },
35
  {
36
  "epoch": 62.0,
37
  "learning_rate": 7.730207550743121e-06,
38
- "loss": 0.0175,
39
  "step": 125
40
  },
41
  {
42
  "epoch": 74.0,
43
  "learning_rate": 8.03016458599496e-06,
44
- "loss": 0.0032,
45
  "step": 150
46
  },
47
  {
48
  "epoch": 87.0,
49
  "learning_rate": 8.282894746203441e-06,
50
- "loss": 0.0011,
51
  "step": 175
52
  },
53
  {
54
  "epoch": 99.0,
55
  "learning_rate": 8.501266121799902e-06,
56
- "loss": 0.0007,
57
  "step": 200
58
  },
59
  {
60
  "epoch": 99.0,
61
- "eval_loss": 2.046875,
62
- "eval_runtime": 63.8247,
63
- "eval_samples_per_second": 0.423,
64
- "eval_steps_per_second": 0.031,
65
- "eval_wer": 89.28571428571429,
66
  "step": 200
67
  },
68
  {
69
- "epoch": 112.0,
70
- "learning_rate": 8.693512601774437e-06,
71
- "loss": 0.0005,
72
- "step": 225
73
- },
74
- {
75
- "epoch": 124.0,
76
- "learning_rate": 8.865222471593567e-06,
77
- "loss": 0.0004,
78
- "step": 250
79
- },
80
- {
81
- "epoch": 137.0,
82
- "learning_rate": 9.020362953730323e-06,
83
- "loss": 0.0003,
84
- "step": 275
85
- },
86
- {
87
- "epoch": 149.0,
88
- "learning_rate": 9.161852281961698e-06,
89
- "loss": 0.0003,
90
- "step": 300
91
- },
92
- {
93
- "epoch": 162.0,
94
- "learning_rate": 9.29189975311636e-06,
95
- "loss": 0.0002,
96
- "step": 325
97
- },
98
- {
99
- "epoch": 174.0,
100
- "learning_rate": 9.412218256259678e-06,
101
- "loss": 0.0002,
102
- "step": 350
103
- },
104
- {
105
- "epoch": 187.0,
106
- "learning_rate": 9.524162683365145e-06,
107
- "loss": 0.0002,
108
- "step": 375
109
- },
110
- {
111
- "epoch": 199.0,
112
- "learning_rate": 9.62882322733502e-06,
113
- "loss": 0.0002,
114
- "step": 400
115
- },
116
- {
117
- "epoch": 199.0,
118
- "eval_loss": 2.244140625,
119
- "eval_runtime": 56.1817,
120
- "eval_samples_per_second": 0.481,
121
- "eval_steps_per_second": 0.036,
122
- "eval_wer": 90.65934065934066,
123
- "step": 400
124
- },
125
- {
126
- "epoch": 199.0,
127
- "step": 400,
128
- "total_flos": 5.059079773670605e+17,
129
  "train_loss": 0.0,
130
- "train_runtime": 28.0812,
131
- "train_samples_per_second": 2279.101,
132
- "train_steps_per_second": 71.222
133
  }
134
  ],
135
  "logging_steps": 25,
@@ -137,7 +80,7 @@
137
  "num_input_tokens_seen": 0,
138
  "num_train_epochs": 9223372036854775807,
139
  "save_steps": 200,
140
- "total_flos": 5.059079773670605e+17,
141
  "train_batch_size": 32,
142
  "trial_name": null,
143
  "trial_params": null
 
1
  {
2
+ "best_metric": 3.3333333333333335,
3
  "best_model_checkpoint": "/cosmos/home/sp-operator/ai/training/models/huggingface/scripts/../breeze-listen-dsw-base-te/checkpoint-200",
4
+ "epoch": 99.001,
5
  "eval_steps": 200,
6
+ "global_step": 200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
11
  {
12
  "epoch": 12.0,
13
  "learning_rate": 4.973833272194737e-06,
14
+ "loss": 1.7212,
15
  "step": 25
16
  },
17
  {
18
  "epoch": 24.0,
19
  "learning_rate": 6.195318418690893e-06,
20
+ "loss": 1.1394,
21
  "step": 50
22
  },
23
  {
24
  "epoch": 37.0,
25
  "learning_rate": 6.881634451095711e-06,
26
+ "loss": 0.5083,
27
  "step": 75
28
  },
29
  {
30
  "epoch": 49.0,
31
  "learning_rate": 7.361221988663844e-06,
32
+ "loss": 0.1183,
33
  "step": 100
34
  },
35
  {
36
  "epoch": 62.0,
37
  "learning_rate": 7.730207550743121e-06,
38
+ "loss": 0.022,
39
  "step": 125
40
  },
41
  {
42
  "epoch": 74.0,
43
  "learning_rate": 8.03016458599496e-06,
44
+ "loss": 0.005,
45
  "step": 150
46
  },
47
  {
48
  "epoch": 87.0,
49
  "learning_rate": 8.282894746203441e-06,
50
+ "loss": 0.0016,
51
  "step": 175
52
  },
53
  {
54
  "epoch": 99.0,
55
  "learning_rate": 8.501266121799902e-06,
56
+ "loss": 0.0008,
57
  "step": 200
58
  },
59
  {
60
  "epoch": 99.0,
61
+ "eval_loss": 0.05462646484375,
62
+ "eval_runtime": 53.8277,
63
+ "eval_samples_per_second": 0.725,
64
+ "eval_steps_per_second": 0.056,
65
+ "eval_wer": 3.3333333333333335,
66
  "step": 200
67
  },
68
  {
69
+ "epoch": 99.0,
70
+ "step": 200,
71
+ "total_flos": 2.2700998962393907e+17,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
72
  "train_loss": 0.0,
73
+ "train_runtime": 2.6625,
74
+ "train_samples_per_second": 24037.247,
75
+ "train_steps_per_second": 751.164
76
  }
77
  ],
78
  "logging_steps": 25,
 
80
  "num_input_tokens_seen": 0,
81
  "num_train_epochs": 9223372036854775807,
82
  "save_steps": 200,
83
+ "total_flos": 2.2700998962393907e+17,
84
  "train_batch_size": 32,
85
  "trial_name": null,
86
  "trial_params": null