byungkyu committed on
Commit
3784a9c
1 Parent(s): a6e97b2

End of training

Browse files
Files changed (2) hide show
  1. README.md +3 -3
  2. generation_config.json +92 -11
README.md CHANGED
@@ -1,12 +1,12 @@
1
  ---
 
2
  language:
3
  - ko
4
  license: apache-2.0
5
- library_name: transformers
6
  tags:
7
  - hf-asr-leaderboard
8
  - generated_from_trainer
9
- base_model: openai/whisper-base
10
  datasets:
11
  - byungkyu
12
  model-index:
@@ -45,7 +45,7 @@ The following hyperparameters were used during training:
45
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
  - lr_scheduler_warmup_steps: 500
48
- - training_steps: 5570
49
  - mixed_precision_training: Native AMP
50
 
51
  ### Training results
 
1
  ---
2
+ library_name: transformers
3
  language:
4
  - ko
5
  license: apache-2.0
6
+ base_model: openai/whisper-base
7
  tags:
8
  - hf-asr-leaderboard
9
  - generated_from_trainer
 
10
  datasets:
11
  - byungkyu
12
  model-index:
 
45
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
  - lr_scheduler_warmup_steps: 500
48
+ - training_steps: 5000
49
  - mixed_precision_training: Native AMP
50
 
51
  ### Training results
generation_config.json CHANGED
@@ -40,16 +40,6 @@
40
  "bos_token_id": 50257,
41
  "decoder_start_token_id": 50258,
42
  "eos_token_id": 50257,
43
- "forced_decoder_ids": [
44
- [
45
- 1,
46
- null
47
- ],
48
- [
49
- 2,
50
- 50359
51
- ]
52
- ],
53
  "is_multilingual": true,
54
  "lang_to_id": {
55
  "<|af|>": 50327,
@@ -152,13 +142,104 @@
152
  "<|yo|>": 50325,
153
  "<|zh|>": 50260
154
  },
 
155
  "max_initial_timestamp_index": 50,
156
  "max_length": 448,
157
  "no_timestamps_token_id": 50363,
158
  "pad_token_id": 50257,
159
  "prev_sot_token_id": 50361,
160
  "return_timestamps": false,
161
- "suppress_tokens": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
162
  "task_to_id": {
163
  "transcribe": 50359,
164
  "translate": 50358
 
40
  "bos_token_id": 50257,
41
  "decoder_start_token_id": 50258,
42
  "eos_token_id": 50257,
 
 
 
 
 
 
 
 
 
 
43
  "is_multilingual": true,
44
  "lang_to_id": {
45
  "<|af|>": 50327,
 
142
  "<|yo|>": 50325,
143
  "<|zh|>": 50260
144
  },
145
+ "language": "Korean",
146
  "max_initial_timestamp_index": 50,
147
  "max_length": 448,
148
  "no_timestamps_token_id": 50363,
149
  "pad_token_id": 50257,
150
  "prev_sot_token_id": 50361,
151
  "return_timestamps": false,
152
+ "suppress_tokens": [
153
+ 1,
154
+ 2,
155
+ 7,
156
+ 8,
157
+ 9,
158
+ 10,
159
+ 14,
160
+ 25,
161
+ 26,
162
+ 27,
163
+ 28,
164
+ 29,
165
+ 31,
166
+ 58,
167
+ 59,
168
+ 60,
169
+ 61,
170
+ 62,
171
+ 63,
172
+ 90,
173
+ 91,
174
+ 92,
175
+ 93,
176
+ 359,
177
+ 503,
178
+ 522,
179
+ 542,
180
+ 873,
181
+ 893,
182
+ 902,
183
+ 918,
184
+ 922,
185
+ 931,
186
+ 1350,
187
+ 1853,
188
+ 1982,
189
+ 2460,
190
+ 2627,
191
+ 3246,
192
+ 3253,
193
+ 3268,
194
+ 3536,
195
+ 3846,
196
+ 3961,
197
+ 4183,
198
+ 4667,
199
+ 6585,
200
+ 6647,
201
+ 7273,
202
+ 9061,
203
+ 9383,
204
+ 10428,
205
+ 10929,
206
+ 11938,
207
+ 12033,
208
+ 12331,
209
+ 12562,
210
+ 13793,
211
+ 14157,
212
+ 14635,
213
+ 15265,
214
+ 15618,
215
+ 16553,
216
+ 16604,
217
+ 18362,
218
+ 18956,
219
+ 20075,
220
+ 21675,
221
+ 22520,
222
+ 26130,
223
+ 26161,
224
+ 26435,
225
+ 28279,
226
+ 29464,
227
+ 31650,
228
+ 32302,
229
+ 32470,
230
+ 36865,
231
+ 42863,
232
+ 47425,
233
+ 49870,
234
+ 50254,
235
+ 50258,
236
+ 50358,
237
+ 50359,
238
+ 50360,
239
+ 50361,
240
+ 50362
241
+ ],
242
+ "task": "transcribe",
243
  "task_to_id": {
244
  "transcribe": 50359,
245
  "translate": 50358