mrmuminov committed on
Commit
a555c52
1 Parent(s): 177c7d9

End of training

Browse files
Files changed (2) hide show
  1. README.md +36 -7
  2. generation_config.json +14 -2
README.md CHANGED
@@ -1,15 +1,30 @@
1
  ---
2
  language:
3
- - hi
4
- license: apache-2.0
5
- base_model: openai/whisper-small
6
  tags:
7
  - generated_from_trainer
8
  datasets:
9
  - mozilla-foundation/common_voice_16_1
 
 
10
  model-index:
11
  - name: Whisper Large v3 Turbo - Bahriddin Muminov
12
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  ---
14
 
15
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -17,7 +32,10 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  # Whisper Large v3 Turbo - Bahriddin Muminov
19
 
20
- This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 16.1 dataset.
 
 
 
21
 
22
  ## Model description
23
 
@@ -42,10 +60,21 @@ The following hyperparameters were used during training:
42
  - seed: 42
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: linear
45
- - lr_scheduler_warmup_steps: 500
46
- - training_steps: 4000
47
  - mixed_precision_training: Native AMP
48
 
 
 
 
 
 
 
 
 
 
 
 
49
  ### Framework versions
50
 
51
  - Transformers 4.37.2
 
1
  ---
2
  language:
3
+ - uz
4
+ license: mit
5
+ base_model: openai/whisper-large-v3-turbo
6
  tags:
7
  - generated_from_trainer
8
  datasets:
9
  - mozilla-foundation/common_voice_16_1
10
+ metrics:
11
+ - wer
12
  model-index:
13
  - name: Whisper Large v3 Turbo - Bahriddin Muminov
14
+ results:
15
+ - task:
16
+ name: Automatic Speech Recognition
17
+ type: automatic-speech-recognition
18
+ dataset:
19
+ name: Common Voice 16.1
20
+ type: mozilla-foundation/common_voice_16_1
21
+ config: uz
22
+ split: test
23
+ args: 'config: uz, split: test'
24
+ metrics:
25
+ - name: Wer
26
+ type: wer
27
+ value: 28.258182136033867
28
  ---
29
 
30
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
31
  should probably proofread and complete it, then remove this comment. -->
32
 
33
  # Whisper Large v3 Turbo - Bahriddin Muminov
34
 
35
+ This model is a fine-tuned version of [openai/whisper-large-v3-turbo](https://huggingface.co/openai/whisper-large-v3-turbo) on the Common Voice 16.1 dataset.
36
+ It achieves the following results on the evaluation set:
37
+ - Loss: 0.2958
38
+ - Wer: 28.2582
39
 
40
  ## Model description
41
 
 
60
  - seed: 42
61
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
62
  - lr_scheduler_type: linear
63
+ - lr_scheduler_warmup_steps: 1000
64
+ - training_steps: 10000
65
  - mixed_precision_training: Native AMP
66
 
67
+ ### Training results
68
+
69
+ | Training Loss | Epoch | Step | Validation Loss | Wer |
70
+ |:-------------:|:-----:|:-----:|:---------------:|:-------:|
71
+ | 0.429 | 0.66 | 2000 | 0.4073 | 38.0018 |
72
+ | 0.2671 | 1.32 | 4000 | 0.3378 | 31.0778 |
73
+ | 0.2511 | 1.98 | 6000 | 0.3102 | 29.2484 |
74
+ | 0.1539 | 2.64 | 8000 | 0.3022 | 30.0763 |
75
+ | 0.111 | 3.3 | 10000 | 0.2958 | 28.2582 |
76
+
77
+
78
  ### Framework versions
79
 
80
  - Transformers 4.37.2
generation_config.json CHANGED
@@ -32,6 +32,20 @@
32
  "bos_token_id": 50257,
33
  "decoder_start_token_id": 50258,
34
  "eos_token_id": 50257,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
35
  "is_multilingual": true,
36
  "lang_to_id": {
37
  "<|af|>": 50327,
@@ -135,7 +149,6 @@
135
  "<|yue|>": 50358,
136
  "<|zh|>": 50260
137
  },
138
- "language": "uzbek",
139
  "max_initial_timestamp_index": 50,
140
  "max_length": 448,
141
  "no_timestamps_token_id": 50364,
@@ -232,7 +245,6 @@
232
  50362,
233
  50363
234
  ],
235
- "task": "transcribe",
236
  "task_to_id": {
237
  "transcribe": 50360,
238
  "translate": 50359
 
32
  "bos_token_id": 50257,
33
  "decoder_start_token_id": 50258,
34
  "eos_token_id": 50257,
35
+ "forced_decoder_ids": [
36
+ [
37
+ 1,
38
+ 50337
39
+ ],
40
+ [
41
+ 2,
42
+ 50360
43
+ ],
44
+ [
45
+ 3,
46
+ 50364
47
+ ]
48
+ ],
49
  "is_multilingual": true,
50
  "lang_to_id": {
51
  "<|af|>": 50327,
 
149
  "<|yue|>": 50358,
150
  "<|zh|>": 50260
151
  },
 
152
  "max_initial_timestamp_index": 50,
153
  "max_length": 448,
154
  "no_timestamps_token_id": 50364,
 
245
  50362,
246
  50363
247
  ],
 
248
  "task_to_id": {
249
  "transcribe": 50360,
250
  "translate": 50359