lichenda committed on
Commit
8c18e1e
·
1 Parent(s): 64db410

add pretrained model

Browse files
Files changed (28) hide show
  1. exp/asr_stats_raw/train/feats_stats.npz +0 -0
  2. exp/asr_train_asr_transformer_raw_char_1gpu/RESULTS.md +10 -0
  3. exp/asr_train_asr_transformer_raw_char_1gpu/config.yaml +208 -0
  4. exp/asr_train_asr_transformer_raw_char_1gpu/images/acc.png +0 -0
  5. exp/asr_train_asr_transformer_raw_char_1gpu/images/backward_time.png +0 -0
  6. exp/asr_train_asr_transformer_raw_char_1gpu/images/cer.png +0 -0
  7. exp/asr_train_asr_transformer_raw_char_1gpu/images/cer_ctc.png +0 -0
  8. exp/asr_train_asr_transformer_raw_char_1gpu/images/forward_time.png +0 -0
  9. exp/asr_train_asr_transformer_raw_char_1gpu/images/iter_time.png +0 -0
  10. exp/asr_train_asr_transformer_raw_char_1gpu/images/loss.png +0 -0
  11. exp/asr_train_asr_transformer_raw_char_1gpu/images/loss_att.png +0 -0
  12. exp/asr_train_asr_transformer_raw_char_1gpu/images/loss_ctc.png +0 -0
  13. exp/asr_train_asr_transformer_raw_char_1gpu/images/lr_0.png +0 -0
  14. exp/asr_train_asr_transformer_raw_char_1gpu/images/optim_step_time.png +0 -0
  15. exp/asr_train_asr_transformer_raw_char_1gpu/images/train_time.png +0 -0
  16. exp/asr_train_asr_transformer_raw_char_1gpu/images/wer.png +0 -0
  17. exp/asr_train_asr_transformer_raw_char_1gpu/valid.acc.ave_10best.pth +3 -0
  18. exp/lm_train_lm_char_sgd/37epoch.pth +3 -0
  19. exp/lm_train_lm_char_sgd/config.yaml +165 -0
  20. exp/lm_train_lm_char_sgd/images/backward_time.png +0 -0
  21. exp/lm_train_lm_char_sgd/images/forward_time.png +0 -0
  22. exp/lm_train_lm_char_sgd/images/iter_time.png +0 -0
  23. exp/lm_train_lm_char_sgd/images/loss.png +0 -0
  24. exp/lm_train_lm_char_sgd/images/lr_0.png +0 -0
  25. exp/lm_train_lm_char_sgd/images/optim_step_time.png +0 -0
  26. exp/lm_train_lm_char_sgd/images/train_time.png +0 -0
  27. exp/lm_train_lm_char_sgd/perplexity_test/ppl +1 -0
  28. meta.yaml +10 -0
exp/asr_stats_raw/train/feats_stats.npz ADDED
Binary file (1.4 kB). View file
 
exp/asr_train_asr_transformer_raw_char_1gpu/RESULTS.md ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Tue Sep 1 15:32:18 CST 2020`
5
+ - python version: `3.7.6 (default, Jan 8 2020, 19:59:22) [GCC 7.3.0]`
6
+ - espnet version: `espnet 0.9.0`
7
+ - pytorch version: `pytorch 1.5.0`
8
+ - Git hash: `9e8a87e02872a9a5e8f58cb0521eda05058195ca`
9
+ - Commit date: `Mon Aug 24 20:21:25 2020 +0800`
10
+
exp/asr_train_asr_transformer_raw_char_1gpu/config.yaml ADDED
@@ -0,0 +1,208 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/train_asr_transformer.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: ./exp/asr_train_asr_transformer_raw_char_1gpu
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ cudnn_enabled: true
21
+ cudnn_benchmark: false
22
+ cudnn_deterministic: true
23
+ collect_stats: false
24
+ write_collected_feats: false
25
+ max_epoch: 100
26
+ patience: null
27
+ val_scheduler_criterion:
28
+ - valid
29
+ - loss
30
+ early_stopping_criterion:
31
+ - valid
32
+ - loss
33
+ - min
34
+ best_model_criterion:
35
+ - - valid
36
+ - acc
37
+ - max
38
+ keep_nbest_models: 10
39
+ grad_clip: 5.0
40
+ grad_noise: false
41
+ accum_grad: 8
42
+ no_forward_run: false
43
+ resume: true
44
+ train_dtype: float32
45
+ log_interval: null
46
+ pretrain_path: []
47
+ pretrain_key: []
48
+ num_iters_per_epoch: null
49
+ batch_size: 20
50
+ valid_batch_size: null
51
+ batch_bins: 1000000
52
+ valid_batch_bins: null
53
+ train_shape_file:
54
+ - exp/asr_stats_raw/train/speech_shape
55
+ - exp/asr_stats_raw/train/text_shape.char
56
+ valid_shape_file:
57
+ - exp/asr_stats_raw/valid/speech_shape
58
+ - exp/asr_stats_raw/valid/text_shape.char
59
+ batch_type: folded
60
+ valid_batch_type: null
61
+ fold_length:
62
+ - 80000
63
+ - 150
64
+ sort_in_batch: descending
65
+ sort_batch: descending
66
+ multiple_iterator: false
67
+ chunk_length: 500
68
+ chunk_shift_ratio: 0.5
69
+ num_cache_chunks: 1024
70
+ train_data_path_and_name_and_type:
71
+ - - dump/raw/train_si284/wav.scp
72
+ - speech
73
+ - sound
74
+ - - dump/raw/train_si284/text
75
+ - text
76
+ - text
77
+ valid_data_path_and_name_and_type:
78
+ - - dump/raw/test_dev93/wav.scp
79
+ - speech
80
+ - sound
81
+ - - dump/raw/test_dev93/text
82
+ - text
83
+ - text
84
+ allow_variable_data_keys: false
85
+ max_cache_size: 0.0
86
+ valid_max_cache_size: null
87
+ optim: adam
88
+ optim_conf:
89
+ lr: 0.005
90
+ scheduler: warmuplr
91
+ scheduler_conf:
92
+ warmup_steps: 30000
93
+ token_list:
94
+ - <blank>
95
+ - <unk>
96
+ - <space>
97
+ - E
98
+ - T
99
+ - A
100
+ - N
101
+ - I
102
+ - O
103
+ - S
104
+ - R
105
+ - H
106
+ - L
107
+ - D
108
+ - C
109
+ - U
110
+ - M
111
+ - P
112
+ - F
113
+ - G
114
+ - Y
115
+ - W
116
+ - B
117
+ - V
118
+ - K
119
+ - .
120
+ - X
121
+ - ''''
122
+ - J
123
+ - Q
124
+ - Z
125
+ - <NOISE>
126
+ - ','
127
+ - '-'
128
+ - '"'
129
+ - '*'
130
+ - ':'
131
+ - (
132
+ - )
133
+ - '?'
134
+ - '!'
135
+ - '&'
136
+ - ;
137
+ - '1'
138
+ - '2'
139
+ - '0'
140
+ - /
141
+ - $
142
+ - '{'
143
+ - '}'
144
+ - '8'
145
+ - '9'
146
+ - '6'
147
+ - '3'
148
+ - '5'
149
+ - '7'
150
+ - '4'
151
+ - '~'
152
+ - '`'
153
+ - _
154
+ - <*IN*>
155
+ - <*MR.*>
156
+ - \
157
+ - ^
158
+ - <sos/eos>
159
+ init: xavier_uniform
160
+ input_size: null
161
+ ctc_conf:
162
+ dropout_rate: 0.0
163
+ ctc_type: builtin
164
+ reduce: true
165
+ model_conf:
166
+ ctc_weight: 0.3
167
+ lsm_weight: 0.1
168
+ length_normalized_loss: false
169
+ use_preprocessor: true
170
+ token_type: char
171
+ bpemodel: null
172
+ non_linguistic_symbols: data/nlsyms.txt
173
+ cleaner: null
174
+ g2p: null
175
+ frontend: default
176
+ frontend_conf:
177
+ fs: 8k
178
+ n_fft: 256
179
+ hop_length: 64
180
+ specaug: null
181
+ specaug_conf: {}
182
+ normalize: global_mvn
183
+ normalize_conf:
184
+ stats_file: exp/asr_stats_raw/train/feats_stats.npz
185
+ encoder: transformer
186
+ encoder_conf:
187
+ output_size: 256
188
+ attention_heads: 4
189
+ linear_units: 2048
190
+ num_blocks: 12
191
+ dropout_rate: 0.1
192
+ positional_dropout_rate: 0.1
193
+ attention_dropout_rate: 0.0
194
+ input_layer: conv2d
195
+ normalize_before: true
196
+ decoder: transformer
197
+ decoder_conf:
198
+ attention_heads: 4
199
+ linear_units: 2048
200
+ num_blocks: 6
201
+ dropout_rate: 0.1
202
+ positional_dropout_rate: 0.1
203
+ self_attention_dropout_rate: 0.0
204
+ src_attention_dropout_rate: 0.0
205
+ required:
206
+ - output_dir
207
+ - token_list
208
+ distributed: false
exp/asr_train_asr_transformer_raw_char_1gpu/images/acc.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/backward_time.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/cer.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/cer_ctc.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/forward_time.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/iter_time.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/loss.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/loss_att.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/loss_ctc.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/lr_0.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/optim_step_time.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/train_time.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/images/wer.png ADDED
exp/asr_train_asr_transformer_raw_char_1gpu/valid.acc.ave_10best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88b898a6f90867382bba18481feb0dc497e33a88c6ef2ebe3f7816f131a2d9be
3
+ size 108690752
exp/lm_train_lm_char_sgd/37epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59fb8554c7a96c1c2ed30eee5eb30b9797659d767af739c27526c9159bf4964d
3
+ size 27421563
exp/lm_train_lm_char_sgd/config.yaml ADDED
@@ -0,0 +1,165 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/train_lm.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: ./exp/lm_train_lm_char_sgd
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ cudnn_enabled: true
21
+ cudnn_benchmark: false
22
+ cudnn_deterministic: true
23
+ collect_stats: false
24
+ write_collected_feats: false
25
+ max_epoch: 40
26
+ patience: null
27
+ val_scheduler_criterion:
28
+ - valid
29
+ - loss
30
+ early_stopping_criterion:
31
+ - valid
32
+ - loss
33
+ - min
34
+ best_model_criterion:
35
+ - - valid
36
+ - loss
37
+ - min
38
+ keep_nbest_models: 1
39
+ grad_clip: 5.0
40
+ grad_noise: false
41
+ accum_grad: 1
42
+ no_forward_run: false
43
+ resume: true
44
+ train_dtype: float32
45
+ log_interval: null
46
+ pretrain_path: []
47
+ pretrain_key: []
48
+ num_iters_per_epoch: null
49
+ batch_size: 30
50
+ valid_batch_size: null
51
+ batch_bins: 1000000
52
+ valid_batch_bins: null
53
+ train_shape_file:
54
+ - exp/lm_stats/train/text_shape.char
55
+ valid_shape_file:
56
+ - exp/lm_stats/valid/text_shape.char
57
+ batch_type: folded
58
+ valid_batch_type: null
59
+ fold_length:
60
+ - 150
61
+ sort_in_batch: descending
62
+ sort_batch: descending
63
+ multiple_iterator: false
64
+ chunk_length: 500
65
+ chunk_shift_ratio: 0.5
66
+ num_cache_chunks: 1024
67
+ train_data_path_and_name_and_type:
68
+ - - dump/raw/srctexts
69
+ - text
70
+ - text
71
+ valid_data_path_and_name_and_type:
72
+ - - dump/raw/test_dev93/text
73
+ - text
74
+ - text
75
+ allow_variable_data_keys: false
76
+ max_cache_size: 0.0
77
+ valid_max_cache_size: null
78
+ optim: sgd
79
+ optim_conf:
80
+ lr: 0.1
81
+ scheduler: null
82
+ scheduler_conf: {}
83
+ token_list:
84
+ - <blank>
85
+ - <unk>
86
+ - <space>
87
+ - E
88
+ - T
89
+ - A
90
+ - N
91
+ - I
92
+ - O
93
+ - S
94
+ - R
95
+ - H
96
+ - L
97
+ - D
98
+ - C
99
+ - U
100
+ - M
101
+ - P
102
+ - F
103
+ - G
104
+ - Y
105
+ - W
106
+ - B
107
+ - V
108
+ - K
109
+ - .
110
+ - X
111
+ - ''''
112
+ - J
113
+ - Q
114
+ - Z
115
+ - <NOISE>
116
+ - ','
117
+ - '-'
118
+ - '"'
119
+ - '*'
120
+ - ':'
121
+ - (
122
+ - )
123
+ - '?'
124
+ - '!'
125
+ - '&'
126
+ - ;
127
+ - '1'
128
+ - '2'
129
+ - '0'
130
+ - /
131
+ - $
132
+ - '{'
133
+ - '}'
134
+ - '8'
135
+ - '9'
136
+ - '6'
137
+ - '3'
138
+ - '5'
139
+ - '7'
140
+ - '4'
141
+ - '~'
142
+ - '`'
143
+ - _
144
+ - <*IN*>
145
+ - <*MR.*>
146
+ - \
147
+ - ^
148
+ - <sos/eos>
149
+ init: null
150
+ model_conf:
151
+ ignore_id: 0
152
+ use_preprocessor: true
153
+ token_type: char
154
+ bpemodel: null
155
+ non_linguistic_symbols: data/nlsyms.txt
156
+ cleaner: null
157
+ g2p: null
158
+ lm: seq_rnn
159
+ lm_conf:
160
+ unit: 650
161
+ nlayers: 2
162
+ required:
163
+ - output_dir
164
+ - token_list
165
+ distributed: false
exp/lm_train_lm_char_sgd/images/backward_time.png ADDED
exp/lm_train_lm_char_sgd/images/forward_time.png ADDED
exp/lm_train_lm_char_sgd/images/iter_time.png ADDED
exp/lm_train_lm_char_sgd/images/loss.png ADDED
exp/lm_train_lm_char_sgd/images/lr_0.png ADDED
exp/lm_train_lm_char_sgd/images/optim_step_time.png ADDED
exp/lm_train_lm_char_sgd/images/train_time.png ADDED
exp/lm_train_lm_char_sgd/perplexity_test/ppl ADDED
@@ -0,0 +1 @@
 
 
1
+ 2.4762186648823223
meta.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ espnet: 0.9.0
2
+ files:
3
+ asr_model_file: exp/asr_train_asr_transformer_raw_char_1gpu/valid.acc.ave_10best.pth
4
+ lm_file: exp/lm_train_lm_char_sgd/37epoch.pth
5
+ python: "3.7.6 (default, Jan 8 2020, 19:59:22) \n[GCC 7.3.0]"
6
+ timestamp: 1599059847.47611
7
+ torch: 1.5.0
8
+ yaml_files:
9
+ asr_train_config: exp/asr_train_asr_transformer_raw_char_1gpu/config.yaml
10
+ lm_train_config: exp/lm_train_lm_char_sgd/config.yaml