CookieMonster99 committed on
Commit
9d4dfdf
·
1 Parent(s): 7938205

End of training

Browse files
Files changed (3) hide show
  1. README.md +12 -13
  2. generation_config.json +45 -1
  3. pytorch_model.bin +1 -1
README.md CHANGED
@@ -11,7 +11,7 @@ datasets:
11
  metrics:
12
  - wer
13
  model-index:
14
- - name: Whisper Small Ko - CookieMoster99
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
@@ -19,22 +19,22 @@ model-index:
19
  dataset:
20
  name: zeroth-korean
21
  type: Bingsu/zeroth-korean
22
- args: 'config: ko, split: test'
23
  metrics:
24
  - name: Wer
25
  type: wer
26
- value: 86.67369372082517
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
30
  should probably proofread and complete it, then remove this comment. -->
31
 
32
- # Whisper Small Ko - CookieMoster99
33
 
34
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the zeroth-korean dataset.
35
  It achieves the following results on the evaluation set:
36
  - Loss: 0.0884
37
- - Wer: 86.6737
38
 
39
  ## Model description
40
 
@@ -54,22 +54,21 @@ More information needed
54
 
55
  The following hyperparameters were used during training:
56
  - learning_rate: 1e-05
57
- - train_batch_size: 16
58
  - eval_batch_size: 8
59
  - seed: 42
60
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
61
  - lr_scheduler_type: linear
62
  - lr_scheduler_warmup_steps: 500
63
- - training_steps: 4000
64
 
65
  ### Training results
66
 
67
- | Training Loss | Epoch | Step | Validation Loss | Wer |
68
- |:-------------:|:-----:|:----:|:---------------:|:--------:|
69
- | 0.1053 | 0.72 | 1000 | 0.1508 | 68.2729 |
70
- | 0.0518 | 1.44 | 2000 | 0.1074 | 80.8613 |
71
- | 0.0136 | 2.16 | 3000 | 0.0918 | 106.6707 |
72
- | 0.013 | 2.87 | 4000 | 0.0884 | 86.6737 |
73
 
74
 
75
  ### Framework versions
 
11
  metrics:
12
  - wer
13
  model-index:
14
+ - name: Whisper Small KR - CookieMonster99
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
 
19
  dataset:
20
  name: zeroth-korean
21
  type: Bingsu/zeroth-korean
22
+ args: 'config: KR, split: test'
23
  metrics:
24
  - name: Wer
25
  type: wer
26
+ value: 52.3565728053004
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
30
  should probably proofread and complete it, then remove this comment. -->
31
 
32
+ # Whisper Small KR - CookieMonster99
33
 
34
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the zeroth-korean dataset.
35
  It achieves the following results on the evaluation set:
36
  - Loss: 0.0884
37
+ - Wer: 52.3566
38
 
39
  ## Model description
40
 
 
54
 
55
  The following hyperparameters were used during training:
56
  - learning_rate: 1e-05
57
+ - train_batch_size: 8
58
  - eval_batch_size: 8
59
  - seed: 42
60
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
61
  - lr_scheduler_type: linear
62
  - lr_scheduler_warmup_steps: 500
63
+ - training_steps: 3000
64
 
65
  ### Training results
66
 
67
+ | Training Loss | Epoch | Step | Validation Loss | Wer |
68
+ |:-------------:|:-----:|:----:|:---------------:|:-------:|
69
+ | 0.0254 | 0.36 | 1000 | 0.1079 | 35.4314 |
70
+ | 0.0141 | 0.72 | 2000 | 0.0955 | 41.0029 |
71
+ | 0.0097 | 1.08 | 3000 | 0.0884 | 52.3566 |
 
72
 
73
 
74
  ### Framework versions
generation_config.json CHANGED
@@ -1,4 +1,46 @@
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "begin_suppress_tokens": [
3
  220,
4
  50257
@@ -121,7 +163,7 @@
121
  "max_initial_timestamp_index": 1,
122
  "max_length": 448,
123
  "no_timestamps_token_id": 50363,
124
- "pad_token_id": 50256,
125
  "return_timestamps": false,
126
  "suppress_tokens": [
127
  1,
@@ -207,6 +249,8 @@
207
  49870,
208
  50254,
209
  50258,
 
 
210
  50360,
211
  50361,
212
  50362
 
1
  {
2
+ "alignment_heads": [
3
+ [
4
+ 5,
5
+ 3
6
+ ],
7
+ [
8
+ 5,
9
+ 9
10
+ ],
11
+ [
12
+ 8,
13
+ 0
14
+ ],
15
+ [
16
+ 8,
17
+ 4
18
+ ],
19
+ [
20
+ 8,
21
+ 7
22
+ ],
23
+ [
24
+ 8,
25
+ 8
26
+ ],
27
+ [
28
+ 9,
29
+ 0
30
+ ],
31
+ [
32
+ 9,
33
+ 7
34
+ ],
35
+ [
36
+ 9,
37
+ 9
38
+ ],
39
+ [
40
+ 10,
41
+ 5
42
+ ]
43
+ ],
44
  "begin_suppress_tokens": [
45
  220,
46
  50257
 
163
  "max_initial_timestamp_index": 1,
164
  "max_length": 448,
165
  "no_timestamps_token_id": 50363,
166
+ "pad_token_id": 50257,
167
  "return_timestamps": false,
168
  "suppress_tokens": [
169
  1,
 
249
  49870,
250
  50254,
251
  50258,
252
+ 50358,
253
+ 50359,
254
  50360,
255
  50361,
256
  50362
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f28ffa9ff48a79fc405b0edce95d1bec5dd84405c5f1da72ff15eaa3aa59eab
3
  size 967102729
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:680cb4b6859b3bbd3a69de3f04bac349f8df3060686132bef260e1ff2ddb3413
3
  size 967102729