Jiatong Shi committed on
Commit
a0868c2
·
1 Parent(s): e767abf

Update model

Browse files
Files changed (32) hide show
  1. README.md +766 -3
  2. data/token_list/bpe_unigram500/bpe.model +3 -0
  3. exp/asr_stats_raw_bpe500_sp/train/feats_stats.npz +0 -0
  4. exp/asr_train_asr_raw_bpe500_sp/RESULTS.md +32 -0
  5. exp/asr_train_asr_raw_bpe500_sp/config.yaml +666 -0
  6. exp/asr_train_asr_raw_bpe500_sp/images/acc.png +0 -0
  7. exp/asr_train_asr_raw_bpe500_sp/images/backward_time.png +0 -0
  8. exp/asr_train_asr_raw_bpe500_sp/images/cer.png +0 -0
  9. exp/asr_train_asr_raw_bpe500_sp/images/cer_ctc.png +0 -0
  10. exp/asr_train_asr_raw_bpe500_sp/images/forward_time.png +0 -0
  11. exp/asr_train_asr_raw_bpe500_sp/images/gpu_max_cached_mem_GB.png +0 -0
  12. exp/asr_train_asr_raw_bpe500_sp/images/iter_time.png +0 -0
  13. exp/asr_train_asr_raw_bpe500_sp/images/loss.png +0 -0
  14. exp/asr_train_asr_raw_bpe500_sp/images/loss_att.png +0 -0
  15. exp/asr_train_asr_raw_bpe500_sp/images/loss_ctc.png +0 -0
  16. exp/asr_train_asr_raw_bpe500_sp/images/optim0_lr0.png +0 -0
  17. exp/asr_train_asr_raw_bpe500_sp/images/optim_step_time.png +0 -0
  18. exp/asr_train_asr_raw_bpe500_sp/images/train_time.png +0 -0
  19. exp/asr_train_asr_raw_bpe500_sp/images/wer.png +0 -0
  20. exp/asr_train_asr_raw_bpe500_sp/valid.acc.ave_10best.pth +3 -0
  21. exp/lm_train_lm_bpe500/19epoch.pth +3 -0
  22. exp/lm_train_lm_bpe500/config.yaml +617 -0
  23. exp/lm_train_lm_bpe500/images/backward_time.png +0 -0
  24. exp/lm_train_lm_bpe500/images/forward_time.png +0 -0
  25. exp/lm_train_lm_bpe500/images/gpu_max_cached_mem_GB.png +0 -0
  26. exp/lm_train_lm_bpe500/images/iter_time.png +0 -0
  27. exp/lm_train_lm_bpe500/images/loss.png +0 -0
  28. exp/lm_train_lm_bpe500/images/optim0_lr0.png +0 -0
  29. exp/lm_train_lm_bpe500/images/optim_step_time.png +0 -0
  30. exp/lm_train_lm_bpe500/images/train_time.png +0 -0
  31. exp/lm_train_lm_bpe500/perplexity_test/ppl +1 -0
  32. meta.yaml +10 -0
README.md CHANGED
@@ -1,3 +1,766 @@
1
- ---
2
- license: apache-2.0
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - espnet
4
+ - audio
5
+ - automatic-speech-recognition
6
+ language: noinfo
7
+ datasets:
8
+ - dsing
9
+ license: cc-by-4.0
10
+ ---
11
+
12
+ ## ESPnet2 ASR model
13
+
14
+ ### `espnet/ftshijt_espnet2_asr_dsing_transformer`
15
+
16
+ This model was trained by jiatong using the dsing recipe in [espnet](https://github.com/espnet/espnet/).
17
+
18
+ ### Demo: How to use in ESPnet2
19
+
20
+ ```bash
21
+ cd espnet
22
+
23
+ pip install -e .
24
+ cd egs2/dsing/asr1
25
+ ./run.sh --skip_data_prep false --skip_train true --download_model espnet/ftshijt_espnet2_asr_dsing_transformer
26
+ ```
27
+
28
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
29
+ # RESULTS
30
+ ## Environments
31
+ - date: `Sun Mar 20 00:28:37 EDT 2022`
32
+ - python version: `3.9.7 (default, Sep 16 2021, 13:09:58) [GCC 7.5.0]`
33
+ - espnet version: `espnet 0.10.7a1`
34
+ - pytorch version: `pytorch 1.10.1`
35
+ - Git hash: `c1ed71c6899e54c0b3dad82687886b1183cd0885`
36
+ - Commit date: `Wed Mar 16 23:34:49 2022 -0400`
37
+
38
+ ## asr_train_asr_raw_bpe500_sp
39
+ ### WER
40
+
41
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
42
+ |---|---|---|---|---|---|---|---|---|
43
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/dev|482|4018|77.0|16.2|6.8|4.0|27.0|65.1|
44
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/test|480|4632|76.1|17.3|6.6|3.7|27.6|57.7|
45
+
46
+ ### CER
47
+
48
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
49
+ |---|---|---|---|---|---|---|---|---|
50
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/dev|482|18692|85.0|5.8|9.2|4.2|19.2|65.1|
51
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/test|480|21787|84.9|6.3|8.8|4.2|19.3|57.7|
52
+
53
+ ### TER
54
+
55
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
56
+ |---|---|---|---|---|---|---|---|---|
57
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/dev|482|6097|75.2|12.8|12.0|4.1|28.9|65.1|
58
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/test|480|7736|75.3|14.3|10.4|4.1|28.8|57.7|
59
+
60
+ ## ASR config
61
+
62
+ <details><summary>expand</summary>
63
+
64
+ ```
65
+ config: conf/train_asr.yaml
66
+ print_config: false
67
+ log_level: INFO
68
+ dry_run: false
69
+ iterator_type: sequence
70
+ output_dir: exp/asr_train_asr_raw_bpe500_sp
71
+ ngpu: 1
72
+ seed: 0
73
+ num_workers: 1
74
+ num_att_plot: 3
75
+ dist_backend: nccl
76
+ dist_init_method: env://
77
+ dist_world_size: null
78
+ dist_rank: null
79
+ local_rank: 0
80
+ dist_master_addr: null
81
+ dist_master_port: null
82
+ dist_launcher: null
83
+ multiprocessing_distributed: false
84
+ unused_parameters: false
85
+ sharded_ddp: false
86
+ cudnn_enabled: true
87
+ cudnn_benchmark: false
88
+ cudnn_deterministic: true
89
+ collect_stats: false
90
+ write_collected_feats: false
91
+ max_epoch: 100
92
+ patience: 15
93
+ val_scheduler_criterion:
94
+ - valid
95
+ - loss
96
+ early_stopping_criterion:
97
+ - valid
98
+ - loss
99
+ - min
100
+ best_model_criterion:
101
+ - - valid
102
+ - acc
103
+ - max
104
+ keep_nbest_models: 10
105
+ nbest_averaging_interval: 0
106
+ grad_clip: 5
107
+ grad_clip_type: 2.0
108
+ grad_noise: false
109
+ accum_grad: 2
110
+ no_forward_run: false
111
+ resume: true
112
+ train_dtype: float32
113
+ use_amp: false
114
+ log_interval: null
115
+ use_matplotlib: true
116
+ use_tensorboard: true
117
+ use_wandb: false
118
+ wandb_project: null
119
+ wandb_id: null
120
+ wandb_entity: null
121
+ wandb_name: null
122
+ wandb_model_log_interval: -1
123
+ detect_anomaly: false
124
+ pretrain_path: null
125
+ init_param: []
126
+ ignore_init_mismatch: false
127
+ freeze_param: []
128
+ num_iters_per_epoch: null
129
+ batch_size: 32
130
+ valid_batch_size: null
131
+ batch_bins: 1000000
132
+ valid_batch_bins: null
133
+ train_shape_file:
134
+ - exp/asr_stats_raw_bpe500_sp/train/speech_shape
135
+ - exp/asr_stats_raw_bpe500_sp/train/text_shape.bpe
136
+ valid_shape_file:
137
+ - exp/asr_stats_raw_bpe500_sp/valid/speech_shape
138
+ - exp/asr_stats_raw_bpe500_sp/valid/text_shape.bpe
139
+ batch_type: folded
140
+ valid_batch_type: null
141
+ fold_length:
142
+ - 80000
143
+ - 150
144
+ sort_in_batch: descending
145
+ sort_batch: descending
146
+ multiple_iterator: false
147
+ chunk_length: 500
148
+ chunk_shift_ratio: 0.5
149
+ num_cache_chunks: 1024
150
+ train_data_path_and_name_and_type:
151
+ - - dump/raw/train30_sp/wav.scp
152
+ - speech
153
+ - kaldi_ark
154
+ - - dump/raw/train30_sp/text
155
+ - text
156
+ - text
157
+ valid_data_path_and_name_and_type:
158
+ - - dump/raw/dev/wav.scp
159
+ - speech
160
+ - kaldi_ark
161
+ - - dump/raw/dev/text
162
+ - text
163
+ - text
164
+ allow_variable_data_keys: false
165
+ max_cache_size: 0.0
166
+ max_cache_fd: 32
167
+ valid_max_cache_size: null
168
+ optim: adam
169
+ optim_conf:
170
+ lr: 1.0
171
+ scheduler: noamlr
172
+ scheduler_conf:
173
+ warmup_steps: 25000
174
+ token_list:
175
+ - <blank>
176
+ - <unk>
177
+ - ▁I
178
+ - ''''
179
+ - ▁YOU
180
+ - S
181
+ - T
182
+ - ▁THE
183
+ - M
184
+ - ▁ME
185
+ - ▁A
186
+ - ▁AND
187
+ - ▁TO
188
+ - E
189
+ - A
190
+ - ING
191
+ - D
192
+ - ▁MY
193
+ - ▁
194
+ - O
195
+ - ▁IT
196
+ - I
197
+ - N
198
+ - RE
199
+ - Y
200
+ - ▁BE
201
+ - ▁IN
202
+ - ▁ON
203
+ - ▁LOVE
204
+ - U
205
+ - ▁WE
206
+ - LL
207
+ - H
208
+ - ▁YOUR
209
+ - ▁S
210
+ - IN
211
+ - ▁OF
212
+ - ▁DO
213
+ - ▁THAT
214
+ - ▁ALL
215
+ - L
216
+ - ▁DON
217
+ - ▁OH
218
+ - ▁LIKE
219
+ - ▁KNOW
220
+ - ▁FOR
221
+ - ▁CAN
222
+ - ▁JUST
223
+ - P
224
+ - ▁BUT
225
+ - ED
226
+ - K
227
+ - ▁WHEN
228
+ - ▁SO
229
+ - R
230
+ - ▁GO
231
+ - ▁WHAT
232
+ - ▁C
233
+ - ▁WITH
234
+ - W
235
+ - ▁F
236
+ - C
237
+ - ▁NO
238
+ - ER
239
+ - ▁ONE
240
+ - ▁LET
241
+ - VE
242
+ - ES
243
+ - ▁NOW
244
+ - ▁BABY
245
+ - G
246
+ - ▁GOT
247
+ - ▁COME
248
+ - CAUSE
249
+ - LE
250
+ - B
251
+ - ▁B
252
+ - AR
253
+ - ▁UP
254
+ - ▁'
255
+ - ▁W
256
+ - ▁SEE
257
+ - ▁TIME
258
+ - ▁ARE
259
+ - ▁G
260
+ - ▁LOOK
261
+ - ▁THIS
262
+ - F
263
+ - ▁IS
264
+ - ▁NEVER
265
+ - ▁M
266
+ - ▁P
267
+ - AN
268
+ - ▁WAS
269
+ - ▁WAY
270
+ - ▁IF
271
+ - OR
272
+ - ▁SAY
273
+ - V
274
+ - ▁R
275
+ - ▁T
276
+ - ▁DOWN
277
+ - RA
278
+ - ▁THERE
279
+ - ▁HEART
280
+ - ▁NOT
281
+ - RO
282
+ - ▁WILL
283
+ - ▁OUT
284
+ - CE
285
+ - ▁WANT
286
+ - ▁YEAH
287
+ - ▁HAVE
288
+ - ▁GIVE
289
+ - ▁TOO
290
+ - ▁GONNA
291
+ - ▁HOW
292
+ - ▁NEED
293
+ - ▁GET
294
+ - ▁TAKE
295
+ - ▁EVERY
296
+ - ▁FEEL
297
+ - ▁HE
298
+ - EN
299
+ - ▁FROM
300
+ - ▁HA
301
+ - ▁K
302
+ - ▁SHE
303
+ - 'ON'
304
+ - ▁DI
305
+ - RI
306
+ - ▁ONLY
307
+ - NE
308
+ - ▁WHO
309
+ - ▁AWAY
310
+ - ▁E
311
+ - ▁D
312
+ - ▁LIFE
313
+ - ▁MAKE
314
+ - IC
315
+ - ▁BACK
316
+ - ▁WHERE
317
+ - ▁MADE
318
+ - ▁DAY
319
+ - ▁HERE
320
+ - ▁LO
321
+ - ▁HER
322
+ - ▁AS
323
+ - ▁GOOD
324
+ - ▁WANNA
325
+ - ▁OOH
326
+ - ▁TELL
327
+ - LY
328
+ - TH
329
+ - ▁WON
330
+ - ▁LIGHT
331
+ - ▁KEEP
332
+ - ▁MA
333
+ - ▁LA
334
+ - ▁SH
335
+ - ▁WORLD
336
+ - ▁MORE
337
+ - ▁LI
338
+ - AL
339
+ - ▁COULD
340
+ - ▁GIRL
341
+ - ▁NOTHING
342
+ - ▁EVER
343
+ - ▁THINK
344
+ - IE
345
+ - ▁BY
346
+ - ▁AT
347
+ - ▁TONIGHT
348
+ - ▁THEY
349
+ - ▁CALL
350
+ - ▁HO
351
+ - ▁WOULD
352
+ - IL
353
+ - ▁OUR
354
+ - ▁FALL
355
+ - ▁NIGHT
356
+ - ▁THAN
357
+ - ▁DE
358
+ - ▁SOME
359
+ - ▁WAIT
360
+ - ▁RIGHT
361
+ - ▁RE
362
+ - ▁HALLELUJAH
363
+ - ▁TH
364
+ - NG
365
+ - ▁CO
366
+ - ▁WERE
367
+ - ▁TALK
368
+ - ET
369
+ - ▁BO
370
+ - ▁HOLD
371
+ - UR
372
+ - ▁BEEN
373
+ - ▁US
374
+ - ▁PA
375
+ - VER
376
+ - ▁EYES
377
+ - ▁DREAM
378
+ - ▁SONG
379
+ - ▁SHOULD
380
+ - ▁STILL
381
+ - ▁OVER
382
+ - TA
383
+ - ▁ANYMORE
384
+ - IGHT
385
+ - ▁STAY
386
+ - ▁BETTER
387
+ - LESS
388
+ - ▁THROUGH
389
+ - ▁LITTLE
390
+ - X
391
+ - ▁GONE
392
+ - ▁AIN
393
+ - ▁DA
394
+ - ▁HOLDING
395
+ - ▁HURT
396
+ - ▁TRY
397
+ - ▁FIND
398
+ - Z
399
+ - DE
400
+ - ▁LAST
401
+ - ▁SAID
402
+ - ▁ALWAYS
403
+ - ▁BODY
404
+ - ▁MIND
405
+ - ▁CRY
406
+ - ▁EVEN
407
+ - ▁RUN
408
+ - ▁HOPE
409
+ - ▁WITHOUT
410
+ - ▁MISS
411
+ - ▁ABOUT
412
+ - ▁HAND
413
+ - ▁J
414
+ - ▁AGAIN
415
+ - ▁THOUGH
416
+ - ▁NAH
417
+ - ▁LIVE
418
+ - ▁BA
419
+ - ▁OLD
420
+ - ▁HEAD
421
+ - ▁FIRE
422
+ - ▁MAN
423
+ - ▁SOMETHING
424
+ - ▁WHY
425
+ - THER
426
+ - ▁HOME
427
+ - ▁OR
428
+ - ▁INSIDE
429
+ - ▁NEW
430
+ - ▁HEY
431
+ - TION
432
+ - ▁EVERYTHING
433
+ - ▁HAD
434
+ - ▁SOMETIMES
435
+ - ▁HARD
436
+ - ▁TOUCH
437
+ - ▁HEAR
438
+ - ▁AM
439
+ - ▁MUCH
440
+ - ▁LONG
441
+ - ▁STAR
442
+ - GETTING
443
+ - ▁WALK
444
+ - ▁PEOPLE
445
+ - ▁BEFORE
446
+ - ▁CLOSE
447
+ - ▁TWO
448
+ - ▁FAR
449
+ - ▁SHOW
450
+ - ▁STAND
451
+ - ▁LOSE
452
+ - ▁HELP
453
+ - ▁NAME
454
+ - ▁BOY
455
+ - ▁TRUE
456
+ - ▁PLAY
457
+ - ▁DARK
458
+ - ▁THINGS
459
+ - ▁NA
460
+ - ▁TEAR
461
+ - ▁END
462
+ - ▁NOBODY
463
+ - ▁SEA
464
+ - ▁ROCKABYE
465
+ - ▁BELIEVE
466
+ - ▁BROKE
467
+ - ▁AROUND
468
+ - ▁START
469
+ - ▁KISS
470
+ - ▁FEELING
471
+ - ▁BREAK
472
+ - ▁SOMEONE
473
+ - ▁FRIEND
474
+ - ▁ALONE
475
+ - ▁BEAUTIFUL
476
+ - ▁CRAZY
477
+ - ▁OWN
478
+ - OSE
479
+ - ▁STOP
480
+ - ▁LOST
481
+ - ▁HIM
482
+ - ▁BAD
483
+ - ▁CHANCE
484
+ - ▁REALLY
485
+ - ▁WISH
486
+ - ▁MOVE
487
+ - ▁SKY
488
+ - ▁PLACE
489
+ - AKE
490
+ - ▁LEAVE
491
+ - ▁YA
492
+ - ▁STRONG
493
+ - ▁PUT
494
+ - ▁OPEN
495
+ - ▁WRONG
496
+ - ▁COLD
497
+ - OCK
498
+ - ▁USED
499
+ - ▁FOUND
500
+ - ▁LONELY
501
+ - ▁DANCE
502
+ - EACH
503
+ - ▁ANOTHER
504
+ - ▁SIDE
505
+ - ▁UNDER
506
+ - ▁MATTER
507
+ - ▁THESE
508
+ - ▁CARE
509
+ - ▁MINE
510
+ - ▁SHINE
511
+ - ▁AFRAID
512
+ - ▁TURN
513
+ - ▁PLEASE
514
+ - ▁SUN
515
+ - ▁DIAMOND
516
+ - ▁UNTIL
517
+ - ▁FACE
518
+ - ▁LEARN
519
+ - ▁TRUST
520
+ - ▁WONDER
521
+ - ▁BREATH
522
+ - ATE
523
+ - ▁SORRY
524
+ - ▁HU
525
+ - ▁WATCH
526
+ - ▁LATE
527
+ - ROUND
528
+ - ▁ARMS
529
+ - ▁PERFECT
530
+ - ▁MAYBE
531
+ - ▁PULL
532
+ - ▁REMEMBER
533
+ - ▁FIGHT
534
+ - ▁MYSELF
535
+ - ▁INTO
536
+ - ▁DARLING
537
+ - ▁THUNDER
538
+ - ▁FOLLOW
539
+ - ▁REASON
540
+ - ▁BURN
541
+ - ▁HIS
542
+ - ▁MUST
543
+ - ▁FREE
544
+ - ▁FLASHLIGHT
545
+ - ▁1
546
+ - ▁ENOUGH
547
+ - ▁DRINK
548
+ - ▁WORDS
549
+ - ▁HIDE
550
+ - ▁UN
551
+ - ▁FORGET
552
+ - ▁SURE
553
+ - ▁CHANGE
554
+ - ▁SMILE
555
+ - ▁PROMISE
556
+ - ▁FOREVER
557
+ - '2'
558
+ - ▁SWEET
559
+ - ▁SAME
560
+ - ▁OOOH
561
+ - ▁PART
562
+ - ▁SOMEBODY
563
+ - NESS
564
+ - ▁BRIGHT
565
+ - ▁HEAVEN
566
+ - ▁DEEP
567
+ - ▁HIGH
568
+ - ▁INSTEAD
569
+ - ▁MOMENT
570
+ - ▁ALONG
571
+ - ▁ALRIGHT
572
+ - ▁SLOW
573
+ - ▁TOMORROW
574
+ - ▁SOUL
575
+ - ▁QU
576
+ - ▁PUSH
577
+ - ▁CHANDELIER
578
+ - ▁LEFT
579
+ - SIDE
580
+ - ▁TOLD
581
+ - ▁KNEW
582
+ - READY
583
+ - ▁LOVING
584
+ - ▁SAW
585
+ - '3'
586
+ - ▁WORK
587
+ - ▁DANCING
588
+ - ▁THREE
589
+ - ▁SAVE
590
+ - ▁SHOOT
591
+ - ▁LEAD
592
+ - ▁SKI
593
+ - ▁WILD
594
+ - ▁WIND
595
+ - ▁WHILE
596
+ - ▁EDGE
597
+ - ▁HAPPY
598
+ - ▁FEAR
599
+ - STUCK
600
+ - ▁MOST
601
+ - ▁LISTEN
602
+ - ▁WOAH
603
+ - ▁FIRST
604
+ - ▁JOLENE
605
+ - ▁VOICE
606
+ - ▁COMP
607
+ - ▁MILLION
608
+ - FUL
609
+ - ▁OOOOOH
610
+ - ▁CAME
611
+ - ▁RISE
612
+ - ▁NEXT
613
+ - ▁COUNT
614
+ - ▁MOUNTAIN
615
+ - ▁ROOM
616
+ - ▁BLUE
617
+ - ▁HIT
618
+ - ▁RAISE
619
+ - J
620
+ - ▁THOUSAND
621
+ - ▁SHAP
622
+ - ▁TREAT
623
+ - ▁DRY
624
+ - ▁FINALLY
625
+ - ▁TITANIUM
626
+ - ▁CARRY
627
+ - ▁TRUTH
628
+ - ▁WATER
629
+ - ▁MORNING
630
+ - TIME
631
+ - ▁BELONG
632
+ - ▁UMA
633
+ - ▁ALIVE
634
+ - ▁ELSE
635
+ - ▁ANGEL
636
+ - ▁BRAND
637
+ - ▁APART
638
+ - ▁EVERYBODY
639
+ - ▁SOUND
640
+ - ▁GUESS
641
+ - ▁PRAY
642
+ - ▁FAITH
643
+ - ▁AFTER
644
+ - ▁THROW
645
+ - ▁TRIED
646
+ - ▁SLEEP
647
+ - ▁FOOL
648
+ - ▁DISCOVERING
649
+ - ▁FUCK
650
+ - ▁TASTE
651
+ - ▁UNDERSTAND
652
+ - ▁SHAME
653
+ - ▁POWER
654
+ - ▁WELCOME
655
+ - ▁FELT
656
+ - ▁SAFE
657
+ - ▁DESERVE
658
+ - ▁GAME
659
+ - ▁SUPERMA
660
+ - ▁SWEAR
661
+ - ▁BETWEEN
662
+ - ▁GLASS
663
+ - ▁CATCH
664
+ - ▁TOGETHER
665
+ - '0'
666
+ - '4'
667
+ - '6'
668
+ - '5'
669
+ - '1'
670
+ - '8'
671
+ - '7'
672
+ - '9'
673
+ - Q
674
+ - <sos/eos>
675
+ init: xavier_uniform
676
+ input_size: null
677
+ ctc_conf:
678
+ dropout_rate: 0.0
679
+ ctc_type: builtin
680
+ reduce: true
681
+ ignore_nan_grad: true
682
+ joint_net_conf: null
683
+ model_conf:
684
+ ctc_weight: 0.3
685
+ lsm_weight: 0.1
686
+ length_normalized_loss: false
687
+ use_preprocessor: true
688
+ token_type: bpe
689
+ bpemodel: data/token_list/bpe_unigram500/bpe.model
690
+ non_linguistic_symbols: null
691
+ cleaner: null
692
+ g2p: null
693
+ speech_volume_normalize: null
694
+ rir_scp: null
695
+ rir_apply_prob: 1.0
696
+ noise_scp: null
697
+ noise_apply_prob: 1.0
698
+ noise_db_range: '13_15'
699
+ frontend: default
700
+ frontend_conf:
701
+ fs: 16k
702
+ specaug: null
703
+ specaug_conf: {}
704
+ normalize: global_mvn
705
+ normalize_conf:
706
+ stats_file: exp/asr_stats_raw_bpe500_sp/train/feats_stats.npz
707
+ preencoder: null
708
+ preencoder_conf: {}
709
+ encoder: transformer
710
+ encoder_conf:
711
+ input_layer: conv2d
712
+ num_blocks: 12
713
+ linear_units: 2048
714
+ dropout_rate: 0.1
715
+ output_size: 256
716
+ attention_heads: 4
717
+ attention_dropout_rate: 0.0
718
+ postencoder: null
719
+ postencoder_conf: {}
720
+ decoder: transformer
721
+ decoder_conf:
722
+ input_layer: embed
723
+ num_blocks: 6
724
+ linear_units: 2048
725
+ dropout_rate: 0.1
726
+ required:
727
+ - output_dir
728
+ - token_list
729
+ version: 0.10.7a1
730
+ distributed: false
731
+ ```
732
+
733
+ </details>
734
+
735
+
736
+
737
+ ### Citing ESPnet
738
+
739
+ ```bibtex
740
+ @inproceedings{watanabe2018espnet,
741
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
742
+ title={{ESPnet}: End-to-End Speech Processing Toolkit},
743
+ year={2018},
744
+ booktitle={Proceedings of Interspeech},
745
+ pages={2207--2211},
746
+ doi={10.21437/Interspeech.2018-1456},
747
+ url={http://dx.doi.org/10.21437/Interspeech.2018-1456}
748
+ }
749
+
750
+
751
+
752
+
753
+ ```
754
+
755
+ or arXiv:
756
+
757
+ ```bibtex
758
+ @misc{watanabe2018espnet,
759
+ title={ESPnet: End-to-End Speech Processing Toolkit},
760
+ author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
761
+ year={2018},
762
+ eprint={1804.00015},
763
+ archivePrefix={arXiv},
764
+ primaryClass={cs.CL}
765
+ }
766
+ ```
data/token_list/bpe_unigram500/bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce4280f9977384de1303b1f0586b426caf9080a6f75c2b187a26cf1c87142550
3
+ size 245351
exp/asr_stats_raw_bpe500_sp/train/feats_stats.npz ADDED
Binary file (1.4 kB). View file
 
exp/asr_train_asr_raw_bpe500_sp/RESULTS.md ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_asr_result.sh -->
2
+ # RESULTS
3
+ ## Environments
4
+ - date: `Sun Mar 20 00:28:37 EDT 2022`
5
+ - python version: `3.9.7 (default, Sep 16 2021, 13:09:58) [GCC 7.5.0]`
6
+ - espnet version: `espnet 0.10.7a1`
7
+ - pytorch version: `pytorch 1.10.1`
8
+ - Git hash: `c1ed71c6899e54c0b3dad82687886b1183cd0885`
9
+ - Commit date: `Wed Mar 16 23:34:49 2022 -0400`
10
+
11
+ ## asr_train_asr_raw_bpe500_sp
12
+ ### WER
13
+
14
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
15
+ |---|---|---|---|---|---|---|---|---|
16
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/dev|482|4018|77.0|16.2|6.8|4.0|27.0|65.1|
17
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/test|480|4632|76.1|17.3|6.6|3.7|27.6|57.7|
18
+
19
+ ### CER
20
+
21
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
22
+ |---|---|---|---|---|---|---|---|---|
23
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/dev|482|18692|85.0|5.8|9.2|4.2|19.2|65.1|
24
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/test|480|21787|84.9|6.3|8.8|4.2|19.3|57.7|
25
+
26
+ ### TER
27
+
28
+ |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
29
+ |---|---|---|---|---|---|---|---|---|
30
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/dev|482|6097|75.2|12.8|12.0|4.1|28.9|65.1|
31
+ |decode_asr_lm_lm_train_lm_bpe500_valid.loss.ave_asr_model_valid.acc.ave/test|480|7736|75.3|14.3|10.4|4.1|28.8|57.7|
32
+
exp/asr_train_asr_raw_bpe500_sp/config.yaml ADDED
@@ -0,0 +1,666 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/train_asr.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/asr_train_asr_raw_bpe500_sp
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 100
28
+ patience: 15
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - acc
39
+ - max
40
+ keep_nbest_models: 10
41
+ nbest_averaging_interval: 0
42
+ grad_clip: 5
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 2
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: false
50
+ log_interval: null
51
+ use_matplotlib: true
52
+ use_tensorboard: true
53
+ use_wandb: false
54
+ wandb_project: null
55
+ wandb_id: null
56
+ wandb_entity: null
57
+ wandb_name: null
58
+ wandb_model_log_interval: -1
59
+ detect_anomaly: false
60
+ pretrain_path: null
61
+ init_param: []
62
+ ignore_init_mismatch: false
63
+ freeze_param: []
64
+ num_iters_per_epoch: null
65
+ batch_size: 32
66
+ valid_batch_size: null
67
+ batch_bins: 1000000
68
+ valid_batch_bins: null
69
+ train_shape_file:
70
+ - exp/asr_stats_raw_bpe500_sp/train/speech_shape
71
+ - exp/asr_stats_raw_bpe500_sp/train/text_shape.bpe
72
+ valid_shape_file:
73
+ - exp/asr_stats_raw_bpe500_sp/valid/speech_shape
74
+ - exp/asr_stats_raw_bpe500_sp/valid/text_shape.bpe
75
+ batch_type: folded
76
+ valid_batch_type: null
77
+ fold_length:
78
+ - 80000
79
+ - 150
80
+ sort_in_batch: descending
81
+ sort_batch: descending
82
+ multiple_iterator: false
83
+ chunk_length: 500
84
+ chunk_shift_ratio: 0.5
85
+ num_cache_chunks: 1024
86
+ train_data_path_and_name_and_type:
87
+ - - dump/raw/train30_sp/wav.scp
88
+ - speech
89
+ - kaldi_ark
90
+ - - dump/raw/train30_sp/text
91
+ - text
92
+ - text
93
+ valid_data_path_and_name_and_type:
94
+ - - dump/raw/dev/wav.scp
95
+ - speech
96
+ - kaldi_ark
97
+ - - dump/raw/dev/text
98
+ - text
99
+ - text
100
+ allow_variable_data_keys: false
101
+ max_cache_size: 0.0
102
+ max_cache_fd: 32
103
+ valid_max_cache_size: null
104
+ optim: adam
105
+ optim_conf:
106
+ lr: 1.0
107
+ scheduler: noamlr
108
+ scheduler_conf:
109
+ warmup_steps: 25000
110
+ token_list:
111
+ - <blank>
112
+ - <unk>
113
+ - ▁I
114
+ - ''''
115
+ - ▁YOU
116
+ - S
117
+ - T
118
+ - ▁THE
119
+ - M
120
+ - ▁ME
121
+ - ▁A
122
+ - ▁AND
123
+ - ▁TO
124
+ - E
125
+ - A
126
+ - ING
127
+ - D
128
+ - ▁MY
129
+ - ▁
130
+ - O
131
+ - ▁IT
132
+ - I
133
+ - N
134
+ - RE
135
+ - Y
136
+ - ▁BE
137
+ - ▁IN
138
+ - ▁ON
139
+ - ▁LOVE
140
+ - U
141
+ - ▁WE
142
+ - LL
143
+ - H
144
+ - ▁YOUR
145
+ - ▁S
146
+ - IN
147
+ - ▁OF
148
+ - ▁DO
149
+ - ▁THAT
150
+ - ▁ALL
151
+ - L
152
+ - ▁DON
153
+ - ▁OH
154
+ - ▁LIKE
155
+ - ▁KNOW
156
+ - ▁FOR
157
+ - ▁CAN
158
+ - ▁JUST
159
+ - P
160
+ - ▁BUT
161
+ - ED
162
+ - K
163
+ - ▁WHEN
164
+ - ▁SO
165
+ - R
166
+ - ▁GO
167
+ - ▁WHAT
168
+ - ▁C
169
+ - ▁WITH
170
+ - W
171
+ - ▁F
172
+ - C
173
+ - ▁NO
174
+ - ER
175
+ - ▁ONE
176
+ - ▁LET
177
+ - VE
178
+ - ES
179
+ - ▁NOW
180
+ - ▁BABY
181
+ - G
182
+ - ▁GOT
183
+ - ▁COME
184
+ - CAUSE
185
+ - LE
186
+ - B
187
+ - ▁B
188
+ - AR
189
+ - ▁UP
190
+ - ▁'
191
+ - ▁W
192
+ - ▁SEE
193
+ - ▁TIME
194
+ - ▁ARE
195
+ - ▁G
196
+ - ▁LOOK
197
+ - ▁THIS
198
+ - F
199
+ - ▁IS
200
+ - ▁NEVER
201
+ - ▁M
202
+ - ▁P
203
+ - AN
204
+ - ▁WAS
205
+ - ▁WAY
206
+ - ▁IF
207
+ - OR
208
+ - ▁SAY
209
+ - V
210
+ - ▁R
211
+ - ▁T
212
+ - ▁DOWN
213
+ - RA
214
+ - ▁THERE
215
+ - ▁HEART
216
+ - ▁NOT
217
+ - RO
218
+ - ▁WILL
219
+ - ▁OUT
220
+ - CE
221
+ - ▁WANT
222
+ - ▁YEAH
223
+ - ▁HAVE
224
+ - ▁GIVE
225
+ - ▁TOO
226
+ - ▁GONNA
227
+ - ▁HOW
228
+ - ▁NEED
229
+ - ▁GET
230
+ - ▁TAKE
231
+ - ▁EVERY
232
+ - ▁FEEL
233
+ - ▁HE
234
+ - EN
235
+ - ▁FROM
236
+ - ▁HA
237
+ - ▁K
238
+ - ▁SHE
239
+ - 'ON'
240
+ - ▁DI
241
+ - RI
242
+ - ▁ONLY
243
+ - NE
244
+ - ▁WHO
245
+ - ▁AWAY
246
+ - ▁E
247
+ - ▁D
248
+ - ▁LIFE
249
+ - ▁MAKE
250
+ - IC
251
+ - ▁BACK
252
+ - ▁WHERE
253
+ - ▁MADE
254
+ - ▁DAY
255
+ - ▁HERE
256
+ - ▁LO
257
+ - ▁HER
258
+ - ▁AS
259
+ - ▁GOOD
260
+ - ▁WANNA
261
+ - ▁OOH
262
+ - ▁TELL
263
+ - LY
264
+ - TH
265
+ - ▁WON
266
+ - ▁LIGHT
267
+ - ▁KEEP
268
+ - ▁MA
269
+ - ▁LA
270
+ - ▁SH
271
+ - ▁WORLD
272
+ - ▁MORE
273
+ - ▁LI
274
+ - AL
275
+ - ▁COULD
276
+ - ▁GIRL
277
+ - ▁NOTHING
278
+ - ▁EVER
279
+ - ▁THINK
280
+ - IE
281
+ - ▁BY
282
+ - ▁AT
283
+ - ▁TONIGHT
284
+ - ▁THEY
285
+ - ▁CALL
286
+ - ▁HO
287
+ - ▁WOULD
288
+ - IL
289
+ - ▁OUR
290
+ - ▁FALL
291
+ - ▁NIGHT
292
+ - ▁THAN
293
+ - ▁DE
294
+ - ▁SOME
295
+ - ▁WAIT
296
+ - ▁RIGHT
297
+ - ▁RE
298
+ - ▁HALLELUJAH
299
+ - ▁TH
300
+ - NG
301
+ - ▁CO
302
+ - ▁WERE
303
+ - ▁TALK
304
+ - ET
305
+ - ▁BO
306
+ - ▁HOLD
307
+ - UR
308
+ - ▁BEEN
309
+ - ▁US
310
+ - ▁PA
311
+ - VER
312
+ - ▁EYES
313
+ - ▁DREAM
314
+ - ▁SONG
315
+ - ▁SHOULD
316
+ - ▁STILL
317
+ - ▁OVER
318
+ - TA
319
+ - ▁ANYMORE
320
+ - IGHT
321
+ - ▁STAY
322
+ - ▁BETTER
323
+ - LESS
324
+ - ▁THROUGH
325
+ - ▁LITTLE
326
+ - X
327
+ - ▁GONE
328
+ - ▁AIN
329
+ - ▁DA
330
+ - ▁HOLDING
331
+ - ▁HURT
332
+ - ▁TRY
333
+ - ▁FIND
334
+ - Z
335
+ - DE
336
+ - ▁LAST
337
+ - ▁SAID
338
+ - ▁ALWAYS
339
+ - ▁BODY
340
+ - ▁MIND
341
+ - ▁CRY
342
+ - ▁EVEN
343
+ - ▁RUN
344
+ - ▁HOPE
345
+ - ▁WITHOUT
346
+ - ▁MISS
347
+ - ▁ABOUT
348
+ - ▁HAND
349
+ - ▁J
350
+ - ▁AGAIN
351
+ - ▁THOUGH
352
+ - ▁NAH
353
+ - ▁LIVE
354
+ - ▁BA
355
+ - ▁OLD
356
+ - ▁HEAD
357
+ - ▁FIRE
358
+ - ▁MAN
359
+ - ▁SOMETHING
360
+ - ▁WHY
361
+ - THER
362
+ - ▁HOME
363
+ - ▁OR
364
+ - ▁INSIDE
365
+ - ▁NEW
366
+ - ▁HEY
367
+ - TION
368
+ - ▁EVERYTHING
369
+ - ▁HAD
370
+ - ▁SOMETIMES
371
+ - ▁HARD
372
+ - ▁TOUCH
373
+ - ▁HEAR
374
+ - ▁AM
375
+ - ▁MUCH
376
+ - ▁LONG
377
+ - ▁STAR
378
+ - GETTING
379
+ - ▁WALK
380
+ - ▁PEOPLE
381
+ - ▁BEFORE
382
+ - ▁CLOSE
383
+ - ▁TWO
384
+ - ▁FAR
385
+ - ▁SHOW
386
+ - ▁STAND
387
+ - ▁LOSE
388
+ - ▁HELP
389
+ - ▁NAME
390
+ - ▁BOY
391
+ - ▁TRUE
392
+ - ▁PLAY
393
+ - ▁DARK
394
+ - ▁THINGS
395
+ - ▁NA
396
+ - ▁TEAR
397
+ - ▁END
398
+ - ▁NOBODY
399
+ - ▁SEA
400
+ - ▁ROCKABYE
401
+ - ▁BELIEVE
402
+ - ▁BROKE
403
+ - ▁AROUND
404
+ - ▁START
405
+ - ▁KISS
406
+ - ▁FEELING
407
+ - ▁BREAK
408
+ - ▁SOMEONE
409
+ - ▁FRIEND
410
+ - ▁ALONE
411
+ - ▁BEAUTIFUL
412
+ - ▁CRAZY
413
+ - ▁OWN
414
+ - OSE
415
+ - ▁STOP
416
+ - ▁LOST
417
+ - ▁HIM
418
+ - ▁BAD
419
+ - ▁CHANCE
420
+ - ▁REALLY
421
+ - ▁WISH
422
+ - ▁MOVE
423
+ - ▁SKY
424
+ - ▁PLACE
425
+ - AKE
426
+ - ▁LEAVE
427
+ - ▁YA
428
+ - ▁STRONG
429
+ - ▁PUT
430
+ - ▁OPEN
431
+ - ▁WRONG
432
+ - ▁COLD
433
+ - OCK
434
+ - ▁USED
435
+ - ▁FOUND
436
+ - ▁LONELY
437
+ - ▁DANCE
438
+ - EACH
439
+ - ▁ANOTHER
440
+ - ▁SIDE
441
+ - ▁UNDER
442
+ - ▁MATTER
443
+ - ▁THESE
444
+ - ▁CARE
445
+ - ▁MINE
446
+ - ▁SHINE
447
+ - ▁AFRAID
448
+ - ▁TURN
449
+ - ▁PLEASE
450
+ - ▁SUN
451
+ - ▁DIAMOND
452
+ - ▁UNTIL
453
+ - ▁FACE
454
+ - ▁LEARN
455
+ - ▁TRUST
456
+ - ▁WONDER
457
+ - ▁BREATH
458
+ - ATE
459
+ - ▁SORRY
460
+ - ▁HU
461
+ - ▁WATCH
462
+ - ▁LATE
463
+ - ROUND
464
+ - ▁ARMS
465
+ - ▁PERFECT
466
+ - ▁MAYBE
467
+ - ▁PULL
468
+ - ▁REMEMBER
469
+ - ▁FIGHT
470
+ - ▁MYSELF
471
+ - ▁INTO
472
+ - ▁DARLING
473
+ - ▁THUNDER
474
+ - ▁FOLLOW
475
+ - ▁REASON
476
+ - ▁BURN
477
+ - ▁HIS
478
+ - ▁MUST
479
+ - ▁FREE
480
+ - ▁FLASHLIGHT
481
+ - ▁1
482
+ - ▁ENOUGH
483
+ - ▁DRINK
484
+ - ▁WORDS
485
+ - ▁HIDE
486
+ - ▁UN
487
+ - ▁FORGET
488
+ - ▁SURE
489
+ - ▁CHANGE
490
+ - ▁SMILE
491
+ - ▁PROMISE
492
+ - ▁FOREVER
493
+ - '2'
494
+ - ▁SWEET
495
+ - ▁SAME
496
+ - ▁OOOH
497
+ - ▁PART
498
+ - ▁SOMEBODY
499
+ - NESS
500
+ - ▁BRIGHT
501
+ - ▁HEAVEN
502
+ - ▁DEEP
503
+ - ▁HIGH
504
+ - ▁INSTEAD
505
+ - ▁MOMENT
506
+ - ▁ALONG
507
+ - ▁ALRIGHT
508
+ - ▁SLOW
509
+ - ▁TOMORROW
510
+ - ▁SOUL
511
+ - ▁QU
512
+ - ▁PUSH
513
+ - ▁CHANDELIER
514
+ - ▁LEFT
515
+ - SIDE
516
+ - ▁TOLD
517
+ - ▁KNEW
518
+ - READY
519
+ - ▁LOVING
520
+ - ▁SAW
521
+ - '3'
522
+ - ▁WORK
523
+ - ▁DANCING
524
+ - ▁THREE
525
+ - ▁SAVE
526
+ - ▁SHOOT
527
+ - ▁LEAD
528
+ - ▁SKI
529
+ - ▁WILD
530
+ - ▁WIND
531
+ - ▁WHILE
532
+ - ▁EDGE
533
+ - ▁HAPPY
534
+ - ▁FEAR
535
+ - STUCK
536
+ - ▁MOST
537
+ - ▁LISTEN
538
+ - ▁WOAH
539
+ - ▁FIRST
540
+ - ▁JOLENE
541
+ - ▁VOICE
542
+ - ▁COMP
543
+ - ▁MILLION
544
+ - FUL
545
+ - ▁OOOOOH
546
+ - ▁CAME
547
+ - ▁RISE
548
+ - ▁NEXT
549
+ - ▁COUNT
550
+ - ▁MOUNTAIN
551
+ - ▁ROOM
552
+ - ▁BLUE
553
+ - ▁HIT
554
+ - ▁RAISE
555
+ - J
556
+ - ▁THOUSAND
557
+ - ▁SHAP
558
+ - ▁TREAT
559
+ - ▁DRY
560
+ - ▁FINALLY
561
+ - ▁TITANIUM
562
+ - ▁CARRY
563
+ - ▁TRUTH
564
+ - ▁WATER
565
+ - ▁MORNING
566
+ - TIME
567
+ - ▁BELONG
568
+ - ▁UMA
569
+ - ▁ALIVE
570
+ - ▁ELSE
571
+ - ▁ANGEL
572
+ - ▁BRAND
573
+ - ▁APART
574
+ - ▁EVERYBODY
575
+ - ▁SOUND
576
+ - ▁GUESS
577
+ - ▁PRAY
578
+ - ▁FAITH
579
+ - ▁AFTER
580
+ - ▁THROW
581
+ - ▁TRIED
582
+ - ▁SLEEP
583
+ - ▁FOOL
584
+ - ▁DISCOVERING
585
+ - ▁FUCK
586
+ - ▁TASTE
587
+ - ▁UNDERSTAND
588
+ - ▁SHAME
589
+ - ▁POWER
590
+ - ▁WELCOME
591
+ - ▁FELT
592
+ - ▁SAFE
593
+ - ▁DESERVE
594
+ - ▁GAME
595
+ - ▁SUPERMA
596
+ - ▁SWEAR
597
+ - ▁BETWEEN
598
+ - ▁GLASS
599
+ - ▁CATCH
600
+ - ▁TOGETHER
601
+ - '0'
602
+ - '4'
603
+ - '6'
604
+ - '5'
605
+ - '1'
606
+ - '8'
607
+ - '7'
608
+ - '9'
609
+ - Q
610
+ - <sos/eos>
611
+ init: xavier_uniform
612
+ input_size: null
613
+ ctc_conf:
614
+ dropout_rate: 0.0
615
+ ctc_type: builtin
616
+ reduce: true
617
+ ignore_nan_grad: true
618
+ joint_net_conf: null
619
+ model_conf:
620
+ ctc_weight: 0.3
621
+ lsm_weight: 0.1
622
+ length_normalized_loss: false
623
+ use_preprocessor: true
624
+ token_type: bpe
625
+ bpemodel: data/token_list/bpe_unigram500/bpe.model
626
+ non_linguistic_symbols: null
627
+ cleaner: null
628
+ g2p: null
629
+ speech_volume_normalize: null
630
+ rir_scp: null
631
+ rir_apply_prob: 1.0
632
+ noise_scp: null
633
+ noise_apply_prob: 1.0
634
+ noise_db_range: '13_15'
635
+ frontend: default
636
+ frontend_conf:
637
+ fs: 16k
638
+ specaug: null
639
+ specaug_conf: {}
640
+ normalize: global_mvn
641
+ normalize_conf:
642
+ stats_file: exp/asr_stats_raw_bpe500_sp/train/feats_stats.npz
643
+ preencoder: null
644
+ preencoder_conf: {}
645
+ encoder: transformer
646
+ encoder_conf:
647
+ input_layer: conv2d
648
+ num_blocks: 12
649
+ linear_units: 2048
650
+ dropout_rate: 0.1
651
+ output_size: 256
652
+ attention_heads: 4
653
+ attention_dropout_rate: 0.0
654
+ postencoder: null
655
+ postencoder_conf: {}
656
+ decoder: transformer
657
+ decoder_conf:
658
+ input_layer: embed
659
+ num_blocks: 6
660
+ linear_units: 2048
661
+ dropout_rate: 0.1
662
+ required:
663
+ - output_dir
664
+ - token_list
665
+ version: 0.10.7a1
666
+ distributed: false
exp/asr_train_asr_raw_bpe500_sp/images/acc.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/backward_time.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/cer.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/cer_ctc.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/forward_time.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/gpu_max_cached_mem_GB.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/iter_time.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/loss.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/loss_att.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/loss_ctc.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/optim0_lr0.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/optim_step_time.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/train_time.png ADDED
exp/asr_train_asr_raw_bpe500_sp/images/wer.png ADDED
exp/asr_train_asr_raw_bpe500_sp/valid.acc.ave_10best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bbd3201747c5c17fa0a46ceb3dbdbac72ee0be8cdd09598597b4dc625f4cb48
3
+ size 110126373
exp/lm_train_lm_bpe500/19epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f6ced3992cb3c9f0055c829aa9c8820b61556dc2679da2a279363db8973f472
3
+ size 29685855
exp/lm_train_lm_bpe500/config.yaml ADDED
@@ -0,0 +1,617 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/train_lm.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/lm_train_lm_bpe500
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ unused_parameters: false
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: true
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 20
28
+ patience: 3
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - valid
38
+ - loss
39
+ - min
40
+ keep_nbest_models: 1
41
+ nbest_averaging_interval: 0
42
+ grad_clip: 5.0
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 1
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: false
50
+ log_interval: null
51
+ use_matplotlib: true
52
+ use_tensorboard: true
53
+ use_wandb: false
54
+ wandb_project: null
55
+ wandb_id: null
56
+ wandb_entity: null
57
+ wandb_name: null
58
+ wandb_model_log_interval: -1
59
+ detect_anomaly: false
60
+ pretrain_path: null
61
+ init_param: []
62
+ ignore_init_mismatch: false
63
+ freeze_param: []
64
+ num_iters_per_epoch: null
65
+ batch_size: 64
66
+ valid_batch_size: null
67
+ batch_bins: 1000000
68
+ valid_batch_bins: null
69
+ train_shape_file:
70
+ - exp/lm_stats_bpe500/train/text_shape.bpe
71
+ valid_shape_file:
72
+ - exp/lm_stats_bpe500/valid/text_shape.bpe
73
+ batch_type: folded
74
+ valid_batch_type: null
75
+ fold_length:
76
+ - 150
77
+ sort_in_batch: descending
78
+ sort_batch: descending
79
+ multiple_iterator: false
80
+ chunk_length: 500
81
+ chunk_shift_ratio: 0.5
82
+ num_cache_chunks: 1024
83
+ train_data_path_and_name_and_type:
84
+ - - dump/raw/lm_train.txt
85
+ - text
86
+ - text
87
+ valid_data_path_and_name_and_type:
88
+ - - dump/raw/dev/text
89
+ - text
90
+ - text
91
+ allow_variable_data_keys: false
92
+ max_cache_size: 0.0
93
+ max_cache_fd: 32
94
+ valid_max_cache_size: null
95
+ optim: sgd
96
+ optim_conf: {}
97
+ scheduler: null
98
+ scheduler_conf: {}
99
+ token_list:
100
+ - <blank>
101
+ - <unk>
102
+ - ▁I
103
+ - ''''
104
+ - ▁YOU
105
+ - S
106
+ - T
107
+ - ▁THE
108
+ - M
109
+ - ▁ME
110
+ - ▁A
111
+ - ▁AND
112
+ - ▁TO
113
+ - E
114
+ - A
115
+ - ING
116
+ - D
117
+ - ▁MY
118
+ - ▁
119
+ - O
120
+ - ▁IT
121
+ - I
122
+ - N
123
+ - RE
124
+ - Y
125
+ - ▁BE
126
+ - ▁IN
127
+ - ▁ON
128
+ - ▁LOVE
129
+ - U
130
+ - ▁WE
131
+ - LL
132
+ - H
133
+ - ▁YOUR
134
+ - ▁S
135
+ - IN
136
+ - ▁OF
137
+ - ▁DO
138
+ - ▁THAT
139
+ - ▁ALL
140
+ - L
141
+ - ▁DON
142
+ - ▁OH
143
+ - ▁LIKE
144
+ - ▁KNOW
145
+ - ▁FOR
146
+ - ▁CAN
147
+ - ▁JUST
148
+ - P
149
+ - ▁BUT
150
+ - ED
151
+ - K
152
+ - ▁WHEN
153
+ - ▁SO
154
+ - R
155
+ - ▁GO
156
+ - ▁WHAT
157
+ - ▁C
158
+ - ▁WITH
159
+ - W
160
+ - ▁F
161
+ - C
162
+ - ▁NO
163
+ - ER
164
+ - ▁ONE
165
+ - ▁LET
166
+ - VE
167
+ - ES
168
+ - ▁NOW
169
+ - ▁BABY
170
+ - G
171
+ - ▁GOT
172
+ - ▁COME
173
+ - CAUSE
174
+ - LE
175
+ - B
176
+ - ▁B
177
+ - AR
178
+ - ▁UP
179
+ - ▁'
180
+ - ▁W
181
+ - ▁SEE
182
+ - ▁TIME
183
+ - ▁ARE
184
+ - ▁G
185
+ - ▁LOOK
186
+ - ▁THIS
187
+ - F
188
+ - ▁IS
189
+ - ▁NEVER
190
+ - ▁M
191
+ - ▁P
192
+ - AN
193
+ - ▁WAS
194
+ - ▁WAY
195
+ - ▁IF
196
+ - OR
197
+ - ▁SAY
198
+ - V
199
+ - ▁R
200
+ - ▁T
201
+ - ▁DOWN
202
+ - RA
203
+ - ▁THERE
204
+ - ▁HEART
205
+ - ▁NOT
206
+ - RO
207
+ - ▁WILL
208
+ - ▁OUT
209
+ - CE
210
+ - ▁WANT
211
+ - ▁YEAH
212
+ - ▁HAVE
213
+ - ▁GIVE
214
+ - ▁TOO
215
+ - ▁GONNA
216
+ - ▁HOW
217
+ - ▁NEED
218
+ - ▁GET
219
+ - ▁TAKE
220
+ - ▁EVERY
221
+ - ▁FEEL
222
+ - ▁HE
223
+ - EN
224
+ - ▁FROM
225
+ - ▁HA
226
+ - ▁K
227
+ - ▁SHE
228
+ - 'ON'
229
+ - ▁DI
230
+ - RI
231
+ - ▁ONLY
232
+ - NE
233
+ - ▁WHO
234
+ - ▁AWAY
235
+ - ▁E
236
+ - ▁D
237
+ - ▁LIFE
238
+ - ▁MAKE
239
+ - IC
240
+ - ▁BACK
241
+ - ▁WHERE
242
+ - ▁MADE
243
+ - ▁DAY
244
+ - ▁HERE
245
+ - ▁LO
246
+ - ▁HER
247
+ - ▁AS
248
+ - ▁GOOD
249
+ - ▁WANNA
250
+ - ▁OOH
251
+ - ▁TELL
252
+ - LY
253
+ - TH
254
+ - ▁WON
255
+ - ▁LIGHT
256
+ - ▁KEEP
257
+ - ▁MA
258
+ - ▁LA
259
+ - ▁SH
260
+ - ▁WORLD
261
+ - ▁MORE
262
+ - ▁LI
263
+ - AL
264
+ - ▁COULD
265
+ - ▁GIRL
266
+ - ▁NOTHING
267
+ - ▁EVER
268
+ - ▁THINK
269
+ - IE
270
+ - ▁BY
271
+ - ▁AT
272
+ - ▁TONIGHT
273
+ - ▁THEY
274
+ - ▁CALL
275
+ - ▁HO
276
+ - ▁WOULD
277
+ - IL
278
+ - ▁OUR
279
+ - ▁FALL
280
+ - ▁NIGHT
281
+ - ▁THAN
282
+ - ▁DE
283
+ - ▁SOME
284
+ - ▁WAIT
285
+ - ▁RIGHT
286
+ - ▁RE
287
+ - ▁HALLELUJAH
288
+ - ▁TH
289
+ - NG
290
+ - ▁CO
291
+ - ▁WERE
292
+ - ▁TALK
293
+ - ET
294
+ - ▁BO
295
+ - ▁HOLD
296
+ - UR
297
+ - ▁BEEN
298
+ - ▁US
299
+ - ▁PA
300
+ - VER
301
+ - ▁EYES
302
+ - ▁DREAM
303
+ - ▁SONG
304
+ - ▁SHOULD
305
+ - ▁STILL
306
+ - ▁OVER
307
+ - TA
308
+ - ▁ANYMORE
309
+ - IGHT
310
+ - ▁STAY
311
+ - ▁BETTER
312
+ - LESS
313
+ - ▁THROUGH
314
+ - ▁LITTLE
315
+ - X
316
+ - ▁GONE
317
+ - ▁AIN
318
+ - ▁DA
319
+ - ▁HOLDING
320
+ - ▁HURT
321
+ - ▁TRY
322
+ - ▁FIND
323
+ - Z
324
+ - DE
325
+ - ▁LAST
326
+ - ▁SAID
327
+ - ▁ALWAYS
328
+ - ▁BODY
329
+ - ▁MIND
330
+ - ▁CRY
331
+ - ▁EVEN
332
+ - ▁RUN
333
+ - ▁HOPE
334
+ - ▁WITHOUT
335
+ - ▁MISS
336
+ - ▁ABOUT
337
+ - ▁HAND
338
+ - ▁J
339
+ - ▁AGAIN
340
+ - ▁THOUGH
341
+ - ▁NAH
342
+ - ▁LIVE
343
+ - ▁BA
344
+ - ▁OLD
345
+ - ▁HEAD
346
+ - ▁FIRE
347
+ - ▁MAN
348
+ - ▁SOMETHING
349
+ - ▁WHY
350
+ - THER
351
+ - ▁HOME
352
+ - ▁OR
353
+ - ▁INSIDE
354
+ - ▁NEW
355
+ - ▁HEY
356
+ - TION
357
+ - ▁EVERYTHING
358
+ - ▁HAD
359
+ - ▁SOMETIMES
360
+ - ▁HARD
361
+ - ▁TOUCH
362
+ - ▁HEAR
363
+ - ▁AM
364
+ - ▁MUCH
365
+ - ▁LONG
366
+ - ▁STAR
367
+ - GETTING
368
+ - ▁WALK
369
+ - ▁PEOPLE
370
+ - ▁BEFORE
371
+ - ▁CLOSE
372
+ - ▁TWO
373
+ - ▁FAR
374
+ - ▁SHOW
375
+ - ▁STAND
376
+ - ▁LOSE
377
+ - ▁HELP
378
+ - ▁NAME
379
+ - ▁BOY
380
+ - ▁TRUE
381
+ - ▁PLAY
382
+ - ▁DARK
383
+ - ▁THINGS
384
+ - ▁NA
385
+ - ▁TEAR
386
+ - ▁END
387
+ - ▁NOBODY
388
+ - ▁SEA
389
+ - ▁ROCKABYE
390
+ - ▁BELIEVE
391
+ - ▁BROKE
392
+ - ▁AROUND
393
+ - ▁START
394
+ - ▁KISS
395
+ - ▁FEELING
396
+ - ▁BREAK
397
+ - ▁SOMEONE
398
+ - ▁FRIEND
399
+ - ▁ALONE
400
+ - ▁BEAUTIFUL
401
+ - ▁CRAZY
402
+ - ▁OWN
403
+ - OSE
404
+ - ▁STOP
405
+ - ▁LOST
406
+ - ▁HIM
407
+ - ▁BAD
408
+ - ▁CHANCE
409
+ - ▁REALLY
410
+ - ▁WISH
411
+ - ▁MOVE
412
+ - ▁SKY
413
+ - ▁PLACE
414
+ - AKE
415
+ - ▁LEAVE
416
+ - ▁YA
417
+ - ▁STRONG
418
+ - ▁PUT
419
+ - ▁OPEN
420
+ - ▁WRONG
421
+ - ▁COLD
422
+ - OCK
423
+ - ▁USED
424
+ - ▁FOUND
425
+ - ▁LONELY
426
+ - ▁DANCE
427
+ - EACH
428
+ - ▁ANOTHER
429
+ - ▁SIDE
430
+ - ▁UNDER
431
+ - ▁MATTER
432
+ - ▁THESE
433
+ - ▁CARE
434
+ - ▁MINE
435
+ - ▁SHINE
436
+ - ▁AFRAID
437
+ - ▁TURN
438
+ - ▁PLEASE
439
+ - ▁SUN
440
+ - ▁DIAMOND
441
+ - ▁UNTIL
442
+ - ▁FACE
443
+ - ▁LEARN
444
+ - ▁TRUST
445
+ - ▁WONDER
446
+ - ▁BREATH
447
+ - ATE
448
+ - ▁SORRY
449
+ - ▁HU
450
+ - ▁WATCH
451
+ - ▁LATE
452
+ - ROUND
453
+ - ▁ARMS
454
+ - ▁PERFECT
455
+ - ▁MAYBE
456
+ - ▁PULL
457
+ - ▁REMEMBER
458
+ - ▁FIGHT
459
+ - ▁MYSELF
460
+ - ▁INTO
461
+ - ▁DARLING
462
+ - ▁THUNDER
463
+ - ▁FOLLOW
464
+ - ▁REASON
465
+ - ▁BURN
466
+ - ▁HIS
467
+ - ▁MUST
468
+ - ▁FREE
469
+ - ▁FLASHLIGHT
470
+ - ▁1
471
+ - ▁ENOUGH
472
+ - ▁DRINK
473
+ - ▁WORDS
474
+ - ▁HIDE
475
+ - ▁UN
476
+ - ▁FORGET
477
+ - ▁SURE
478
+ - ▁CHANGE
479
+ - ▁SMILE
480
+ - ▁PROMISE
481
+ - ▁FOREVER
482
+ - '2'
483
+ - ▁SWEET
484
+ - ▁SAME
485
+ - ▁OOOH
486
+ - ▁PART
487
+ - ▁SOMEBODY
488
+ - NESS
489
+ - ▁BRIGHT
490
+ - ▁HEAVEN
491
+ - ▁DEEP
492
+ - ▁HIGH
493
+ - ▁INSTEAD
494
+ - ▁MOMENT
495
+ - ▁ALONG
496
+ - ▁ALRIGHT
497
+ - ▁SLOW
498
+ - ▁TOMORROW
499
+ - ▁SOUL
500
+ - ▁QU
501
+ - ▁PUSH
502
+ - ▁CHANDELIER
503
+ - ▁LEFT
504
+ - SIDE
505
+ - ▁TOLD
506
+ - ▁KNEW
507
+ - READY
508
+ - ▁LOVING
509
+ - ▁SAW
510
+ - '3'
511
+ - ▁WORK
512
+ - ▁DANCING
513
+ - ▁THREE
514
+ - ▁SAVE
515
+ - ▁SHOOT
516
+ - ▁LEAD
517
+ - ▁SKI
518
+ - ▁WILD
519
+ - ▁WIND
520
+ - ▁WHILE
521
+ - ▁EDGE
522
+ - ▁HAPPY
523
+ - ▁FEAR
524
+ - STUCK
525
+ - ▁MOST
526
+ - ▁LISTEN
527
+ - ▁WOAH
528
+ - ▁FIRST
529
+ - ▁JOLENE
530
+ - ▁VOICE
531
+ - ▁COMP
532
+ - ▁MILLION
533
+ - FUL
534
+ - ▁OOOOOH
535
+ - ▁CAME
536
+ - ▁RISE
537
+ - ▁NEXT
538
+ - ▁COUNT
539
+ - ▁MOUNTAIN
540
+ - ▁ROOM
541
+ - ▁BLUE
542
+ - ▁HIT
543
+ - ▁RAISE
544
+ - J
545
+ - ▁THOUSAND
546
+ - ▁SHAP
547
+ - ▁TREAT
548
+ - ▁DRY
549
+ - ▁FINALLY
550
+ - ▁TITANIUM
551
+ - ▁CARRY
552
+ - ▁TRUTH
553
+ - ▁WATER
554
+ - ▁MORNING
555
+ - TIME
556
+ - ▁BELONG
557
+ - ▁UMA
558
+ - ▁ALIVE
559
+ - ▁ELSE
560
+ - ▁ANGEL
561
+ - ▁BRAND
562
+ - ▁APART
563
+ - ▁EVERYBODY
564
+ - ▁SOUND
565
+ - ▁GUESS
566
+ - ▁PRAY
567
+ - ▁FAITH
568
+ - ▁AFTER
569
+ - ▁THROW
570
+ - ▁TRIED
571
+ - ▁SLEEP
572
+ - ▁FOOL
573
+ - ▁DISCOVERING
574
+ - ▁FUCK
575
+ - ▁TASTE
576
+ - ▁UNDERSTAND
577
+ - ▁SHAME
578
+ - ▁POWER
579
+ - ▁WELCOME
580
+ - ▁FELT
581
+ - ▁SAFE
582
+ - ▁DESERVE
583
+ - ▁GAME
584
+ - ▁SUPERMA
585
+ - ▁SWEAR
586
+ - ▁BETWEEN
587
+ - ▁GLASS
588
+ - ▁CATCH
589
+ - ▁TOGETHER
590
+ - '0'
591
+ - '4'
592
+ - '6'
593
+ - '5'
594
+ - '1'
595
+ - '8'
596
+ - '7'
597
+ - '9'
598
+ - Q
599
+ - <sos/eos>
600
+ init: null
601
+ model_conf:
602
+ ignore_id: 0
603
+ use_preprocessor: true
604
+ token_type: bpe
605
+ bpemodel: data/token_list/bpe_unigram500/bpe.model
606
+ non_linguistic_symbols: null
607
+ cleaner: null
608
+ g2p: null
609
+ lm: seq_rnn
610
+ lm_conf:
611
+ nlayers: 2
612
+ unit: 650
613
+ required:
614
+ - output_dir
615
+ - token_list
616
+ version: 0.10.7a1
617
+ distributed: false
exp/lm_train_lm_bpe500/images/backward_time.png ADDED
exp/lm_train_lm_bpe500/images/forward_time.png ADDED
exp/lm_train_lm_bpe500/images/gpu_max_cached_mem_GB.png ADDED
exp/lm_train_lm_bpe500/images/iter_time.png ADDED
exp/lm_train_lm_bpe500/images/loss.png ADDED
exp/lm_train_lm_bpe500/images/optim0_lr0.png ADDED
exp/lm_train_lm_bpe500/images/optim_step_time.png ADDED
exp/lm_train_lm_bpe500/images/train_time.png ADDED
exp/lm_train_lm_bpe500/perplexity_test/ppl ADDED
@@ -0,0 +1 @@
 
 
1
+ 10.403652830281487
meta.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ espnet: 0.10.7a1
2
+ files:
3
+ asr_model_file: exp/asr_train_asr_raw_bpe500_sp/valid.acc.ave_10best.pth
4
+ lm_file: exp/lm_train_lm_bpe500/19epoch.pth
5
+ python: "3.9.7 (default, Sep 16 2021, 13:09:58) \n[GCC 7.5.0]"
6
+ timestamp: 1647750847.447333
7
+ torch: 1.10.1
8
+ yaml_files:
9
+ asr_train_config: exp/asr_train_asr_raw_bpe500_sp/config.yaml
10
+ lm_train_config: exp/lm_train_lm_bpe500/config.yaml