Zengwei commited on
Commit
533e65f
·
1 Parent(s): 0965836

upload files

Browse files
README.md ADDED
@@ -0,0 +1 @@
 
 
1
+ See https://github.com/k2-fsa/icefall/pull/1766 for details
data/lang_bpe_500/bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c53433de083c4a6ad12d034550ef22de68cec62c4f58932a7b6b8b2f1e743fa5
3
+ size 244865
data/lang_bpe_500/tokens.txt ADDED
@@ -0,0 +1,502 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <blk> 0
2
+ <sos/eos> 1
3
+ <unk> 2
4
+ S 3
5
+ ▁THE 4
6
+ ▁A 5
7
+ T 6
8
+ ▁AND 7
9
+ ED 8
10
+ ▁OF 9
11
+ ▁TO 10
12
+ E 11
13
+ D 12
14
+ N 13
15
+ ING 14
16
+ ▁IN 15
17
+ Y 16
18
+ M 17
19
+ C 18
20
+ ▁I 19
21
+ A 20
22
+ P 21
23
+ ▁HE 22
24
+ R 23
25
+ O 24
26
+ L 25
27
+ RE 26
28
+ I 27
29
+ U 28
30
+ ER 29
31
+ ▁IT 30
32
+ LY 31
33
+ ▁THAT 32
34
+ ▁WAS 33
35
+ ▁ 34
36
+ ▁S 35
37
+ AR 36
38
+ ▁BE 37
39
+ F 38
40
+ ▁C 39
41
+ IN 40
42
+ B 41
43
+ ▁FOR 42
44
+ OR 43
45
+ LE 44
46
+ ' 45
47
+ ▁HIS 46
48
+ ▁YOU 47
49
+ AL 48
50
+ ▁RE 49
51
+ V 50
52
+ ▁B 51
53
+ G 52
54
+ RI 53
55
+ ▁E 54
56
+ ▁WITH 55
57
+ ▁T 56
58
+ ▁AS 57
59
+ LL 58
60
+ ▁P 59
61
+ ▁HER 60
62
+ ST 61
63
+ ▁HAD 62
64
+ ▁SO 63
65
+ ▁F 64
66
+ W 65
67
+ CE 66
68
+ ▁IS 67
69
+ ND 68
70
+ ▁NOT 69
71
+ TH 70
72
+ ▁BUT 71
73
+ EN 72
74
+ ▁SHE 73
75
+ ▁ON 74
76
+ VE 75
77
+ ON 76
78
+ SE 77
79
+ ▁DE 78
80
+ UR 79
81
+ ▁G 80
82
+ CH 81
83
+ K 82
84
+ TER 83
85
+ ▁AT 84
86
+ IT 85
87
+ ▁ME 86
88
+ RO 87
89
+ NE 88
90
+ RA 89
91
+ ES 90
92
+ IL 91
93
+ NG 92
94
+ IC 93
95
+ ▁NO 94
96
+ ▁HIM 95
97
+ ENT 96
98
+ IR 97
99
+ ▁WE 98
100
+ H 99
101
+ ▁DO 100
102
+ ▁ALL 101
103
+ ▁HAVE 102
104
+ LO 103
105
+ ▁BY 104
106
+ ▁MY 105
107
+ ▁MO 106
108
+ ▁THIS 107
109
+ LA 108
110
+ ▁ST 109
111
+ ▁WHICH 110
112
+ ▁CON 111
113
+ ▁THEY 112
114
+ CK 113
115
+ TE 114
116
+ ▁SAID 115
117
+ ▁FROM 116
118
+ ▁GO 117
119
+ ▁WHO 118
120
+ ▁TH 119
121
+ ▁OR 120
122
+ ▁D 121
123
+ ▁W 122
124
+ VER 123
125
+ LI 124
126
+ ▁SE 125
127
+ ▁ONE 126
128
+ ▁CA 127
129
+ ▁AN 128
130
+ ▁LA 129
131
+ ▁WERE 130
132
+ EL 131
133
+ ▁HA 132
134
+ ▁MAN 133
135
+ ▁FA 134
136
+ ▁EX 135
137
+ AD 136
138
+ ▁SU 137
139
+ RY 138
140
+ ▁MI 139
141
+ AT 140
142
+ ▁BO 141
143
+ ▁WHEN 142
144
+ AN 143
145
+ THER 144
146
+ PP 145
147
+ ATION 146
148
+ ▁FI 147
149
+ ▁WOULD 148
150
+ ▁PRO 149
151
+ OW 150
152
+ ET 151
153
+ ▁O 152
154
+ ▁THERE 153
155
+ ▁HO 154
156
+ ION 155
157
+ ▁WHAT 156
158
+ ▁FE 157
159
+ ▁PA 158
160
+ US 159
161
+ MENT 160
162
+ ▁MA 161
163
+ UT 162
164
+ ▁OUT 163
165
+ ▁THEIR 164
166
+ ▁IF 165
167
+ ▁LI 166
168
+ ▁K 167
169
+ ▁WILL 168
170
+ ▁ARE 169
171
+ ID 170
172
+ ▁RO 171
173
+ DE 172
174
+ TION 173
175
+ ▁WA 174
176
+ PE 175
177
+ ▁UP 176
178
+ ▁SP 177
179
+ ▁PO 178
180
+ IGHT 179
181
+ ▁UN 180
182
+ RU 181
183
+ ▁LO 182
184
+ AS 183
185
+ OL 184
186
+ ▁LE 185
187
+ ▁BEEN 186
188
+ ▁SH 187
189
+ ▁RA 188
190
+ ▁SEE 189
191
+ KE 190
192
+ UL 191
193
+ TED 192
194
+ ▁SA 193
195
+ UN 194
196
+ UND 195
197
+ ANT 196
198
+ ▁NE 197
199
+ IS 198
200
+ ▁THEM 199
201
+ CI 200
202
+ GE 201
203
+ ▁COULD 202
204
+ ▁DIS 203
205
+ OM 204
206
+ ISH 205
207
+ HE 206
208
+ EST 207
209
+ ▁SOME 208
210
+ ENCE 209
211
+ ITY 210
212
+ IVE 211
213
+ ▁US 212
214
+ ▁MORE 213
215
+ ▁EN 214
216
+ ARD 215
217
+ ATE 216
218
+ ▁YOUR 217
219
+ ▁INTO 218
220
+ ▁KNOW 219
221
+ ▁CO 220
222
+ ANCE 221
223
+ ▁TIME 222
224
+ ▁WI 223
225
+ ▁YE 224
226
+ AGE 225
227
+ ▁NOW 226
228
+ TI 227
229
+ FF 228
230
+ ABLE 229
231
+ ▁VERY 230
232
+ ▁LIKE 231
233
+ AM 232
234
+ HI 233
235
+ Z 234
236
+ ▁OTHER 235
237
+ ▁THAN 236
238
+ ▁LITTLE 237
239
+ ▁DID 238
240
+ ▁LOOK 239
241
+ TY 240
242
+ ERS 241
243
+ ▁CAN 242
244
+ ▁CHA 243
245
+ ▁AR 244
246
+ X 245
247
+ FUL 246
248
+ UGH 247
249
+ ▁BA 248
250
+ ▁DAY 249
251
+ ▁ABOUT 250
252
+ TEN 251
253
+ IM 252
254
+ ▁ANY 253
255
+ ▁PRE 254
256
+ ▁OVER 255
257
+ IES 256
258
+ NESS 257
259
+ ME 258
260
+ BLE 259
261
+ ▁M 260
262
+ ROW 261
263
+ ▁HAS 262
264
+ ▁GREAT 263
265
+ ▁VI 264
266
+ TA 265
267
+ ▁AFTER 266
268
+ PER 267
269
+ ▁AGAIN 268
270
+ HO 269
271
+ SH 270
272
+ ▁UPON 271
273
+ ▁DI 272
274
+ ▁HAND 273
275
+ ▁COM 274
276
+ IST 275
277
+ TURE 276
278
+ ▁STA 277
279
+ ▁THEN 278
280
+ ▁SHOULD 279
281
+ ▁GA 280
282
+ OUS 281
283
+ OUR 282
284
+ ▁WELL 283
285
+ ▁ONLY 284
286
+ MAN 285
287
+ ▁GOOD 286
288
+ ▁TWO 287
289
+ ▁MAR 288
290
+ ▁SAY 289
291
+ ▁HU 290
292
+ TING 291
293
+ ▁OUR 292
294
+ RESS 293
295
+ ▁DOWN 294
296
+ IOUS 295
297
+ ▁BEFORE 296
298
+ ▁DA 297
299
+ ▁NA 298
300
+ QUI 299
301
+ ▁MADE 300
302
+ ▁EVERY 301
303
+ ▁OLD 302
304
+ ▁EVEN 303
305
+ IG 304
306
+ ▁COME 305
307
+ ▁GRA 306
308
+ ▁RI 307
309
+ ▁LONG 308
310
+ OT 309
311
+ SIDE 310
312
+ WARD 311
313
+ ▁FO 312
314
+ ▁WHERE 313
315
+ MO 314
316
+ LESS 315
317
+ ▁SC 316
318
+ ▁MUST 317
319
+ ▁NEVER 318
320
+ ▁HOW 319
321
+ ▁CAME 320
322
+ ▁SUCH 321
323
+ ▁RU 322
324
+ ▁TAKE 323
325
+ ▁WO 324
326
+ ▁CAR 325
327
+ UM 326
328
+ AK 327
329
+ ▁THINK 328
330
+ ▁MUCH 329
331
+ ▁MISTER 330
332
+ ▁MAY 331
333
+ ▁JO 332
334
+ ▁WAY 333
335
+ ▁COMP 334
336
+ ▁THOUGHT 335
337
+ ▁STO 336
338
+ ▁MEN 337
339
+ ▁BACK 338
340
+ ▁DON 339
341
+ J 340
342
+ ▁LET 341
343
+ ▁TRA 342
344
+ ▁FIRST 343
345
+ ▁JUST 344
346
+ ▁VA 345
347
+ ▁OWN 346
348
+ ▁PLA 347
349
+ ▁MAKE 348
350
+ ATED 349
351
+ ▁HIMSELF 350
352
+ ▁WENT 351
353
+ ▁PI 352
354
+ GG 353
355
+ RING 354
356
+ ▁DU 355
357
+ ▁MIGHT 356
358
+ ▁PART 357
359
+ ▁GIVE 358
360
+ ▁IMP 359
361
+ ▁BU 360
362
+ ▁PER 361
363
+ ▁PLACE 362
364
+ ▁HOUSE 363
365
+ ▁THROUGH 364
366
+ IAN 365
367
+ ▁SW 366
368
+ ▁UNDER 367
369
+ QUE 368
370
+ ▁AWAY 369
371
+ ▁LOVE 370
372
+ QUA 371
373
+ ▁LIFE 372
374
+ ▁GET 373
375
+ ▁WITHOUT 374
376
+ ▁PASS 375
377
+ ▁TURN 376
378
+ IGN 377
379
+ ▁HEAD 378
380
+ ▁MOST 379
381
+ ▁THOSE 380
382
+ ▁SHALL 381
383
+ ▁EYES 382
384
+ ▁COL 383
385
+ ▁STILL 384
386
+ ▁NIGHT 385
387
+ ▁NOTHING 386
388
+ ITION 387
389
+ HA 388
390
+ ▁TELL 389
391
+ ▁WORK 390
392
+ ▁LAST 391
393
+ ▁NEW 392
394
+ ▁FACE 393
395
+ ▁HI 394
396
+ ▁WORD 395
397
+ ▁FOUND 396
398
+ ▁COUNT 397
399
+ ▁OB 398
400
+ ▁WHILE 399
401
+ ▁SHA 400
402
+ ▁MEAN 401
403
+ ▁SAW 402
404
+ ▁PEOPLE 403
405
+ ▁FRIEND 404
406
+ ▁THREE 405
407
+ ▁ROOM 406
408
+ ▁SAME 407
409
+ ▁THOUGH 408
410
+ ▁RIGHT 409
411
+ ▁CHILD 410
412
+ ▁FATHER 411
413
+ ▁ANOTHER 412
414
+ ▁HEART 413
415
+ ▁WANT 414
416
+ ▁TOOK 415
417
+ OOK 416
418
+ ▁LIGHT 417
419
+ ▁MISSUS 418
420
+ ▁OPEN 419
421
+ ▁JU 420
422
+ ▁ASKED 421
423
+ PORT 422
424
+ ▁LEFT 423
425
+ ▁JA 424
426
+ ▁WORLD 425
427
+ ▁HOME 426
428
+ ▁WHY 427
429
+ ▁ALWAYS 428
430
+ ▁ANSWER 429
431
+ ▁SEEMED 430
432
+ ▁SOMETHING 431
433
+ ▁GIRL 432
434
+ ▁BECAUSE 433
435
+ ▁NAME 434
436
+ ▁TOLD 435
437
+ ▁NI 436
438
+ ▁HIGH 437
439
+ IZE 438
440
+ ▁WOMAN 439
441
+ ▁FOLLOW 440
442
+ ▁RETURN 441
443
+ ▁KNEW 442
444
+ ▁EACH 443
445
+ ▁KIND 444
446
+ ▁JE 445
447
+ ▁ACT 446
448
+ ▁LU 447
449
+ ▁CERTAIN 448
450
+ ▁YEARS 449
451
+ ▁QUITE 450
452
+ ▁APPEAR 451
453
+ ▁BETTER 452
454
+ ▁HALF 453
455
+ ▁PRESENT 454
456
+ ▁PRINCE 455
457
+ SHIP 456
458
+ ▁ALSO 457
459
+ ▁BEGAN 458
460
+ ▁HAVING 459
461
+ ▁ENOUGH 460
462
+ ▁PERSON 461
463
+ ▁LADY 462
464
+ ▁WHITE 463
465
+ ▁COURSE 464
466
+ ▁VOICE 465
467
+ ▁SPEAK 466
468
+ ▁POWER 467
469
+ ▁MORNING 468
470
+ ▁BETWEEN 469
471
+ ▁AMONG 470
472
+ ▁KEEP 471
473
+ ▁WALK 472
474
+ ▁MATTER 473
475
+ ▁TEA 474
476
+ ▁BELIEVE 475
477
+ ▁SMALL 476
478
+ ▁TALK 477
479
+ ▁FELT 478
480
+ ▁HORSE 479
481
+ ▁MYSELF 480
482
+ ▁SIX 481
483
+ ▁HOWEVER 482
484
+ ▁FULL 483
485
+ ▁HERSELF 484
486
+ ▁POINT 485
487
+ ▁STOOD 486
488
+ ▁HUNDRED 487
489
+ ▁ALMOST 488
490
+ ▁SINCE 489
491
+ ▁LARGE 490
492
+ ▁LEAVE 491
493
+ ▁PERHAPS 492
494
+ ▁DARK 493
495
+ ▁SUDDEN 494
496
+ ▁REPLIED 495
497
+ ▁ANYTHING 496
498
+ ▁WONDER 497
499
+ ▁UNTIL 498
500
+ Q 499
501
+ #0 500
502
+ #1 501
decoding_results/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt ADDED
The diff for this file is too large to render. See raw diff
 
decoding_results/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt ADDED
The diff for this file is too large to render. See raw diff
 
decoding_results/attention-decoder-rescoring-no-ngram/log-decode-epoch-50_avg-20_use-averaged-model-2024-09-21-17-57-57 ADDED
@@ -0,0 +1,251 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-09-21 17:57:57,911 INFO [ctc_decode.py:769] Decoding started
2
+ 2024-09-21 17:57:57,911 INFO [ctc_decode.py:775] Device: cuda:0
3
+ 2024-09-21 17:57:57,911 INFO [ctc_decode.py:776] {'best_train_loss': inf, 'best_valid_loss': inf, 'best_train_epoch': -1, 'best_valid_epoch': -1, 'batch_idx_train': 0, 'log_interval': 50, 'reset_interval': 200, 'valid_interval': 3000, 'feature_dim': 80, 'subsampling_factor': 4, 'ignore_id': -1, 'label_smoothing': 0.1, 'warm_step': 2000, 'env_info': {'k2-version': '1.24.4', 'k2-build-type': 'Release', 'k2-with-cuda': True, 'k2-git-sha1': '44a9d5682af9fd3ef77074777e15278ec6d390eb', 'k2-git-date': 'Wed Sep 27 11:22:55 2023', 'lhotse-version': '1.17.0.dev+git.ccfc5b2c.dirty', 'torch-version': '1.10.0+cu102', 'torch-cuda-available': True, 'torch-cuda-version': '10.2', 'python-version': '3.8', 'icefall-git-branch': 'cr-ctc', 'icefall-git-sha1': 'a6eead6c-clean', 'icefall-git-date': 'Mon Sep 9 10:10:08 2024', 'icefall-path': '/star-zw/workspace/zipformer/icefall_cr_ctc', 'k2-path': '/star-zw/workspace/k2/k2/k2/python/k2/__init__.py', 'lhotse-path': '/star-zw/workspace/lhotse/lhotse/lhotse/__init__.py', 'hostname': 'de-74279-k2-train-2-0904151501-7d58788f57-7cktm', 'IP address': '10.30.14.169'}, 'frame_shift_ms': 10, 'search_beam': 20, 'output_beam': 8, 'min_active_states': 30, 'max_active_states': 10000, 'use_double_scores': True, 'epoch': 50, 'iter': 0, 'avg': 20, 'use_averaged_model': True, 'exp_dir': PosixPath('zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1'), 'bpe_model': 'data/lang_bpe_500/bpe.model', 'lang_dir': PosixPath('data/lang_bpe_500'), 'context_size': 2, 'decoding_method': 'attention-decoder-rescoring-no-ngram', 'num_paths': 100, 'nbest_scale': 1.0, 'hlg_scale': 0.6, 'lm_dir': PosixPath('data/lm'), 'skip_scoring': False, 'num_encoder_layers': '2,2,4,5,4,2', 'downsampling_factor': '1,2,4,8,4,2', 'feedforward_dim': '512,768,1536,2048,1536,768', 'num_heads': '4,4,4,8,4,4', 'encoder_dim': '192,256,512,768,512,256', 'query_head_dim': '32', 'value_head_dim': '12', 'pos_head_dim': '4', 
'pos_dim': 48, 'encoder_unmasked_dim': '192,192,256,320,256,192', 'cnn_module_kernel': '31,31,15,15,15,31', 'decoder_dim': 512, 'joiner_dim': 512, 'attention_decoder_dim': 512, 'attention_decoder_num_layers': 6, 'attention_decoder_attention_dim': 512, 'attention_decoder_num_heads': 8, 'attention_decoder_feedforward_dim': 2048, 'causal': False, 'chunk_size': '16,32,64,-1', 'left_context_frames': '64,128,256,-1', 'use_transducer': False, 'use_ctc': True, 'use_attention_decoder': True, 'use_cr_ctc': True, 'full_libri': True, 'mini_libri': False, 'manifest_dir': PosixPath('data/fbank'), 'max_duration': 200, 'bucketing_sampler': True, 'num_buckets': 30, 'concatenate_cuts': False, 'duration_factor': 1.0, 'gap': 1.0, 'on_the_fly_feats': False, 'shuffle': True, 'drop_last': True, 'return_cuts': True, 'num_workers': 2, 'enable_spec_aug': True, 'spec_aug_time_warp_factor': 80, 'enable_musan': True, 'input_strategy': 'PrecomputedFeatures', 'res_dir': PosixPath('zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram'), 'suffix': 'epoch-50_avg-20_use-averaged-model'}
4
+ 2024-09-21 17:57:58,323 INFO [lexicon.py:168] Loading pre-compiled data/lang_bpe_500/Linv.pt
5
+ 2024-09-21 17:58:03,090 INFO [ctc_decode.py:861] About to create model
6
+ 2024-09-21 17:58:04,386 INFO [ctc_decode.py:928] Calculating the averaged model over epoch range from 30 (excluded) to 50
7
+ 2024-09-21 17:58:28,955 INFO [ctc_decode.py:945] Number of model parameters: 174319650
8
+ 2024-09-21 17:58:28,955 INFO [asr_datamodule.py:467] About to get test-clean cuts
9
+ 2024-09-21 17:58:29,094 INFO [asr_datamodule.py:474] About to get test-other cuts
10
+ 2024-09-21 17:58:32,173 INFO [ctc_decode.py:653] batch 0/?, cuts processed until now is 14
11
+ 2024-09-21 17:58:55,303 INFO [zipformer.py:1858] name=None, attn_weights_entropy = tensor([5.2234, 4.6148, 4.6277, 4.7056], device='cuda:0')
12
+ 2024-09-21 18:01:56,602 INFO [ctc_decode.py:653] batch 100/?, cuts processed until now is 2298
13
+ 2024-09-21 18:02:22,203 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
14
+ 2024-09-21 18:02:22,241 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
15
+ 2024-09-21 18:02:22,277 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
16
+ 2024-09-21 18:02:22,313 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
17
+ 2024-09-21 18:02:22,347 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
18
+ 2024-09-21 18:02:22,383 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
19
+ 2024-09-21 18:02:22,432 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
20
+ 2024-09-21 18:02:22,469 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
21
+ 2024-09-21 18:02:22,505 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
22
+ 2024-09-21 18:02:22,541 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
23
+ 2024-09-21 18:02:22,577 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
24
+ 2024-09-21 18:02:22,610 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
25
+ 2024-09-21 18:02:22,645 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
26
+ 2024-09-21 18:02:22,680 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
27
+ 2024-09-21 18:02:22,713 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
28
+ 2024-09-21 18:02:22,749 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
29
+ 2024-09-21 18:02:22,784 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
30
+ 2024-09-21 18:02:22,819 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
31
+ 2024-09-21 18:02:22,854 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
32
+ 2024-09-21 18:02:22,890 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
33
+ 2024-09-21 18:02:22,924 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
34
+ 2024-09-21 18:02:22,959 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
35
+ 2024-09-21 18:02:22,994 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
36
+ 2024-09-21 18:02:23,028 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
37
+ 2024-09-21 18:02:23,060 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
38
+ 2024-09-21 18:02:23,094 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
39
+ 2024-09-21 18:02:23,129 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
40
+ 2024-09-21 18:02:23,163 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt
41
+ 2024-09-21 18:02:23,262 INFO [utils.py:657] [test-clean_attention_scale_0.01] %WER 2.53% [1329 / 52576, 151 ins, 144 del, 1034 sub ]
42
+ 2024-09-21 18:02:23,476 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
43
+ 2024-09-21 18:02:23,572 INFO [utils.py:657] [test-clean_attention_scale_0.05] %WER 2.48% [1302 / 52576, 149 ins, 133 del, 1020 sub ]
44
+ 2024-09-21 18:02:23,784 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
45
+ 2024-09-21 18:02:23,879 INFO [utils.py:657] [test-clean_attention_scale_0.08] %WER 2.43% [1278 / 52576, 147 ins, 126 del, 1005 sub ]
46
+ 2024-09-21 18:02:24,086 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
47
+ 2024-09-21 18:02:24,425 INFO [utils.py:657] [test-clean_attention_scale_0.1] %WER 2.39% [1259 / 52576, 143 ins, 124 del, 992 sub ]
48
+ 2024-09-21 18:02:24,632 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
49
+ 2024-09-21 18:02:24,724 INFO [utils.py:657] [test-clean_attention_scale_0.3] %WER 2.28% [1197 / 52576, 130 ins, 113 del, 954 sub ]
50
+ 2024-09-21 18:02:24,931 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
51
+ 2024-09-21 18:02:25,030 INFO [utils.py:657] [test-clean_attention_scale_0.5] %WER 2.17% [1143 / 52576, 124 ins, 102 del, 917 sub ]
52
+ 2024-09-21 18:02:25,238 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
53
+ 2024-09-21 18:02:25,332 INFO [utils.py:657] [test-clean_attention_scale_0.6] %WER 2.13% [1119 / 52576, 125 ins, 96 del, 898 sub ]
54
+ 2024-09-21 18:02:25,537 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
55
+ 2024-09-21 18:02:25,629 INFO [utils.py:657] [test-clean_attention_scale_0.7] %WER 2.08% [1096 / 52576, 124 ins, 88 del, 884 sub ]
56
+ 2024-09-21 18:02:25,836 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
57
+ 2024-09-21 18:02:25,933 INFO [utils.py:657] [test-clean_attention_scale_0.9] %WER 2.05% [1078 / 52576, 122 ins, 85 del, 871 sub ]
58
+ 2024-09-21 18:02:26,137 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
59
+ 2024-09-21 18:02:26,229 INFO [utils.py:657] [test-clean_attention_scale_1.0] %WER 2.04% [1073 / 52576, 123 ins, 84 del, 866 sub ]
60
+ 2024-09-21 18:02:26,433 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
61
+ 2024-09-21 18:02:26,524 INFO [utils.py:657] [test-clean_attention_scale_1.1] %WER 2.04% [1070 / 52576, 123 ins, 83 del, 864 sub ]
62
+ 2024-09-21 18:02:26,730 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
63
+ 2024-09-21 18:02:26,824 INFO [utils.py:657] [test-clean_attention_scale_1.2] %WER 2.02% [1060 / 52576, 121 ins, 83 del, 856 sub ]
64
+ 2024-09-21 18:02:27,030 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
65
+ 2024-09-21 18:02:27,123 INFO [utils.py:657] [test-clean_attention_scale_1.3] %WER 2.01% [1055 / 52576, 121 ins, 82 del, 852 sub ]
66
+ 2024-09-21 18:02:27,364 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
67
+ 2024-09-21 18:02:27,456 INFO [utils.py:657] [test-clean_attention_scale_1.5] %WER 2.00% [1052 / 52576, 121 ins, 79 del, 852 sub ]
68
+ 2024-09-21 18:02:27,661 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
69
+ 2024-09-21 18:02:27,752 INFO [utils.py:657] [test-clean_attention_scale_1.7] %WER 1.98% [1040 / 52576, 122 ins, 75 del, 843 sub ]
70
+ 2024-09-21 18:02:27,960 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
71
+ 2024-09-21 18:02:28,052 INFO [utils.py:657] [test-clean_attention_scale_1.9] %WER 1.98% [1039 / 52576, 122 ins, 74 del, 843 sub ]
72
+ 2024-09-21 18:02:28,520 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
73
+ 2024-09-21 18:02:28,613 INFO [utils.py:657] [test-clean_attention_scale_2.0] %WER 1.98% [1039 / 52576, 122 ins, 73 del, 844 sub ]
74
+ 2024-09-21 18:02:28,818 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
75
+ 2024-09-21 18:02:28,910 INFO [utils.py:657] [test-clean_attention_scale_2.1] %WER 1.97% [1037 / 52576, 121 ins, 72 del, 844 sub ]
76
+ 2024-09-21 18:02:29,122 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
77
+ 2024-09-21 18:02:29,214 INFO [utils.py:657] [test-clean_attention_scale_2.2] %WER 1.97% [1037 / 52576, 122 ins, 71 del, 844 sub ]
78
+ 2024-09-21 18:02:29,425 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
79
+ 2024-09-21 18:02:29,523 INFO [utils.py:657] [test-clean_attention_scale_2.3] %WER 1.97% [1037 / 52576, 122 ins, 71 del, 844 sub ]
80
+ 2024-09-21 18:02:29,733 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
81
+ 2024-09-21 18:02:29,836 INFO [utils.py:657] [test-clean_attention_scale_2.5] %WER 1.97% [1035 / 52576, 122 ins, 70 del, 843 sub ]
82
+ 2024-09-21 18:02:30,052 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
83
+ 2024-09-21 18:02:30,144 INFO [utils.py:657] [test-clean_attention_scale_3.0] %WER 1.96% [1033 / 52576, 122 ins, 70 del, 841 sub ]
84
+ 2024-09-21 18:02:30,366 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
85
+ 2024-09-21 18:02:30,461 INFO [utils.py:657] [test-clean_attention_scale_4.0] %WER 1.97% [1037 / 52576, 122 ins, 71 del, 844 sub ]
86
+ 2024-09-21 18:02:30,670 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
87
+ 2024-09-21 18:02:30,770 INFO [utils.py:657] [test-clean_attention_scale_5.0] %WER 1.96% [1030 / 52576, 119 ins, 71 del, 840 sub ]
88
+ 2024-09-21 18:02:30,985 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
89
+ 2024-09-21 18:02:31,077 INFO [utils.py:657] [test-clean_attention_scale_6.0] %WER 1.96% [1028 / 52576, 119 ins, 71 del, 838 sub ]
90
+ 2024-09-21 18:02:31,300 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
91
+ 2024-09-21 18:02:31,395 INFO [utils.py:657] [test-clean_attention_scale_7.0] %WER 1.96% [1030 / 52576, 120 ins, 71 del, 839 sub ]
92
+ 2024-09-21 18:02:31,604 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
93
+ 2024-09-21 18:02:31,698 INFO [utils.py:657] [test-clean_attention_scale_8.0] %WER 1.96% [1030 / 52576, 120 ins, 71 del, 839 sub ]
94
+ 2024-09-21 18:02:31,906 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
95
+ 2024-09-21 18:02:32,241 INFO [utils.py:657] [test-clean_attention_scale_9.0] %WER 1.96% [1031 / 52576, 121 ins, 71 del, 839 sub ]
96
+ 2024-09-21 18:02:32,449 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-clean-epoch-50_avg-20_use-averaged-model.txt
97
+ 2024-09-21 18:02:32,486 INFO [ctc_decode.py:717]
98
+ For test-clean, WER of different settings are:
99
+ attention_scale_3.0 1.96 best for test-clean
100
+ attention_scale_5.0 1.96
101
+ attention_scale_6.0 1.96
102
+ attention_scale_7.0 1.96
103
+ attention_scale_8.0 1.96
104
+ attention_scale_9.0 1.96
105
+ attention_scale_2.1 1.97
106
+ attention_scale_2.2 1.97
107
+ attention_scale_2.3 1.97
108
+ attention_scale_2.5 1.97
109
+ attention_scale_4.0 1.97
110
+ attention_scale_1.7 1.98
111
+ attention_scale_1.9 1.98
112
+ attention_scale_2.0 1.98
113
+ attention_scale_1.5 2.0
114
+ attention_scale_1.3 2.01
115
+ attention_scale_1.2 2.02
116
+ attention_scale_1.0 2.04
117
+ attention_scale_1.1 2.04
118
+ attention_scale_0.9 2.05
119
+ attention_scale_0.7 2.08
120
+ attention_scale_0.6 2.13
121
+ attention_scale_0.5 2.17
122
+ attention_scale_0.3 2.28
123
+ attention_scale_0.1 2.39
124
+ attention_scale_0.08 2.43
125
+ attention_scale_0.05 2.48
126
+ attention_scale_0.01 2.53
127
+
128
+ 2024-09-21 18:02:32,913 INFO [zipformer.py:1858] name=None, attn_weights_entropy = tensor([5.1365, 4.4428, 4.9126, 5.0717], device='cuda:0')
129
+ 2024-09-21 18:02:35,087 INFO [ctc_decode.py:653] batch 0/?, cuts processed until now is 17
130
+ 2024-09-21 18:04:48,388 INFO [zipformer.py:1858] name=None, attn_weights_entropy = tensor([4.7769, 4.1399, 4.5622, 4.7112], device='cuda:0')
131
+ 2024-09-21 18:05:13,242 INFO [zipformer.py:1858] name=None, attn_weights_entropy = tensor([5.8741, 5.7811, 5.1177, 5.4814], device='cuda:0')
132
+ 2024-09-21 18:05:41,706 INFO [zipformer.py:1858] name=None, attn_weights_entropy = tensor([3.8281, 4.7939, 5.1590, 5.1042], device='cuda:0')
133
+ 2024-09-21 18:05:48,184 INFO [zipformer.py:1858] name=None, attn_weights_entropy = tensor([2.5137, 2.8956, 2.5775, 2.2306], device='cuda:0')
134
+ 2024-09-21 18:05:53,840 INFO [zipformer.py:1858] name=None, attn_weights_entropy = tensor([4.7181, 3.8914, 4.0782, 4.2465], device='cuda:0')
135
+ 2024-09-21 18:06:02,472 INFO [ctc_decode.py:653] batch 100/?, cuts processed until now is 2530
136
+ 2024-09-21 18:06:26,746 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
137
+ 2024-09-21 18:06:26,785 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
138
+ 2024-09-21 18:06:26,822 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
139
+ 2024-09-21 18:06:26,856 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
140
+ 2024-09-21 18:06:26,893 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
141
+ 2024-09-21 18:06:26,941 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
142
+ 2024-09-21 18:06:26,989 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
143
+ 2024-09-21 18:06:27,032 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
144
+ 2024-09-21 18:06:27,074 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
145
+ 2024-09-21 18:06:27,110 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
146
+ 2024-09-21 18:06:27,192 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
147
+ 2024-09-21 18:06:27,293 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
148
+ 2024-09-21 18:06:27,328 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
149
+ 2024-09-21 18:06:27,378 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
150
+ 2024-09-21 18:06:27,414 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
151
+ 2024-09-21 18:06:27,499 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
152
+ 2024-09-21 18:06:27,560 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
153
+ 2024-09-21 18:06:27,597 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
154
+ 2024-09-21 18:06:27,632 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
155
+ 2024-09-21 18:06:27,672 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
156
+ 2024-09-21 18:06:27,727 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
157
+ 2024-09-21 18:06:27,763 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
158
+ 2024-09-21 18:06:27,851 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
159
+ 2024-09-21 18:06:27,889 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
160
+ 2024-09-21 18:06:27,934 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
161
+ 2024-09-21 18:06:27,999 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
162
+ 2024-09-21 18:06:28,034 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
163
+ 2024-09-21 18:06:28,113 INFO [ctc_decode.py:674] The transcripts are stored in zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt
164
+ 2024-09-21 18:06:28,232 INFO [utils.py:657] [test-other_attention_scale_0.01] %WER 4.93% [2579 / 52343, 256 ins, 268 del, 2055 sub ]
165
+ 2024-09-21 18:06:28,478 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
166
+ 2024-09-21 18:06:28,582 INFO [utils.py:657] [test-other_attention_scale_0.05] %WER 4.83% [2530 / 52343, 257 ins, 260 del, 2013 sub ]
167
+ 2024-09-21 18:06:28,824 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
168
+ 2024-09-21 18:06:28,931 INFO [utils.py:657] [test-other_attention_scale_0.08] %WER 4.77% [2499 / 52343, 255 ins, 253 del, 1991 sub ]
169
+ 2024-09-21 18:06:29,169 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
170
+ 2024-09-21 18:06:29,284 INFO [utils.py:657] [test-other_attention_scale_0.1] %WER 4.74% [2481 / 52343, 252 ins, 247 del, 1982 sub ]
171
+ 2024-09-21 18:06:29,507 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
172
+ 2024-09-21 18:06:29,612 INFO [utils.py:657] [test-other_attention_scale_0.3] %WER 4.50% [2353 / 52343, 234 ins, 218 del, 1901 sub ]
173
+ 2024-09-21 18:06:29,853 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
174
+ 2024-09-21 18:06:29,956 INFO [utils.py:657] [test-other_attention_scale_0.5] %WER 4.33% [2269 / 52343, 221 ins, 195 del, 1853 sub ]
175
+ 2024-09-21 18:06:30,175 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
176
+ 2024-09-21 18:06:30,275 INFO [utils.py:657] [test-other_attention_scale_0.6] %WER 4.31% [2254 / 52343, 221 ins, 193 del, 1840 sub ]
177
+ 2024-09-21 18:06:30,497 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
178
+ 2024-09-21 18:06:30,600 INFO [utils.py:657] [test-other_attention_scale_0.7] %WER 4.26% [2230 / 52343, 220 ins, 187 del, 1823 sub ]
179
+ 2024-09-21 18:06:30,820 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
180
+ 2024-09-21 18:06:30,920 INFO [utils.py:657] [test-other_attention_scale_0.9] %WER 4.21% [2202 / 52343, 220 ins, 182 del, 1800 sub ]
181
+ 2024-09-21 18:06:31,136 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
182
+ 2024-09-21 18:06:31,239 INFO [utils.py:657] [test-other_attention_scale_1.0] %WER 4.20% [2197 / 52343, 219 ins, 183 del, 1795 sub ]
183
+ 2024-09-21 18:06:31,455 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
184
+ 2024-09-21 18:06:31,837 INFO [utils.py:657] [test-other_attention_scale_1.1] %WER 4.18% [2190 / 52343, 218 ins, 182 del, 1790 sub ]
185
+ 2024-09-21 18:06:32,069 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
186
+ 2024-09-21 18:06:32,171 INFO [utils.py:657] [test-other_attention_scale_1.2] %WER 4.17% [2182 / 52343, 217 ins, 182 del, 1783 sub ]
187
+ 2024-09-21 18:06:32,392 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
188
+ 2024-09-21 18:06:32,493 INFO [utils.py:657] [test-other_attention_scale_1.3] %WER 4.17% [2182 / 52343, 219 ins, 181 del, 1782 sub ]
189
+ 2024-09-21 18:06:32,712 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
190
+ 2024-09-21 18:06:32,812 INFO [utils.py:657] [test-other_attention_scale_1.5] %WER 4.15% [2173 / 52343, 219 ins, 180 del, 1774 sub ]
191
+ 2024-09-21 18:06:33,036 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
192
+ 2024-09-21 18:06:33,135 INFO [utils.py:657] [test-other_attention_scale_1.7] %WER 4.14% [2169 / 52343, 222 ins, 179 del, 1768 sub ]
193
+ 2024-09-21 18:06:33,352 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
194
+ 2024-09-21 18:06:33,452 INFO [utils.py:657] [test-other_attention_scale_1.9] %WER 4.13% [2161 / 52343, 221 ins, 180 del, 1760 sub ]
195
+ 2024-09-21 18:06:33,690 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
196
+ 2024-09-21 18:06:33,797 INFO [utils.py:657] [test-other_attention_scale_2.0] %WER 4.13% [2160 / 52343, 221 ins, 180 del, 1759 sub ]
197
+ 2024-09-21 18:06:34,015 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
198
+ 2024-09-21 18:06:34,114 INFO [utils.py:657] [test-other_attention_scale_2.1] %WER 4.13% [2161 / 52343, 222 ins, 181 del, 1758 sub ]
199
+ 2024-09-21 18:06:34,332 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
200
+ 2024-09-21 18:06:34,431 INFO [utils.py:657] [test-other_attention_scale_2.2] %WER 4.13% [2161 / 52343, 221 ins, 182 del, 1758 sub ]
201
+ 2024-09-21 18:06:34,650 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
202
+ 2024-09-21 18:06:34,750 INFO [utils.py:657] [test-other_attention_scale_2.3] %WER 4.12% [2159 / 52343, 221 ins, 181 del, 1757 sub ]
203
+ 2024-09-21 18:06:34,965 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
204
+ 2024-09-21 18:06:35,065 INFO [utils.py:657] [test-other_attention_scale_2.5] %WER 4.12% [2156 / 52343, 223 ins, 181 del, 1752 sub ]
205
+ 2024-09-21 18:06:35,287 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
206
+ 2024-09-21 18:06:35,389 INFO [utils.py:657] [test-other_attention_scale_3.0] %WER 4.11% [2153 / 52343, 225 ins, 179 del, 1749 sub ]
207
+ 2024-09-21 18:06:35,612 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
208
+ 2024-09-21 18:06:35,711 INFO [utils.py:657] [test-other_attention_scale_4.0] %WER 4.10% [2145 / 52343, 228 ins, 180 del, 1737 sub ]
209
+ 2024-09-21 18:06:35,928 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
210
+ 2024-09-21 18:06:36,276 INFO [utils.py:657] [test-other_attention_scale_5.0] %WER 4.11% [2153 / 52343, 231 ins, 179 del, 1743 sub ]
211
+ 2024-09-21 18:06:36,492 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
212
+ 2024-09-21 18:06:36,591 INFO [utils.py:657] [test-other_attention_scale_6.0] %WER 4.10% [2146 / 52343, 228 ins, 180 del, 1738 sub ]
213
+ 2024-09-21 18:06:36,812 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
214
+ 2024-09-21 18:06:36,913 INFO [utils.py:657] [test-other_attention_scale_7.0] %WER 4.09% [2143 / 52343, 227 ins, 180 del, 1736 sub ]
215
+ 2024-09-21 18:06:37,135 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
216
+ 2024-09-21 18:06:37,234 INFO [utils.py:657] [test-other_attention_scale_8.0] %WER 4.08% [2138 / 52343, 225 ins, 179 del, 1734 sub ]
217
+ 2024-09-21 18:06:37,454 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
218
+ 2024-09-21 18:06:37,554 INFO [utils.py:657] [test-other_attention_scale_9.0] %WER 4.08% [2137 / 52343, 225 ins, 178 del, 1734 sub ]
219
+ 2024-09-21 18:06:37,775 INFO [ctc_decode.py:701] Wrote detailed error stats to zipformer/exp-large-ctc-aed-ctc-loss-scale-0.1-aed-loss-scale-0.9-cr-loss-scale-0.02-time-mask-ratio-2.5-scaled-masked-1/attention-decoder-rescoring-no-ngram/errs-test-other-epoch-50_avg-20_use-averaged-model.txt
220
+ 2024-09-21 18:06:37,782 INFO [ctc_decode.py:717]
221
+ For test-other, WER of different settings are:
222
+ attention_scale_8.0 4.08 best for test-other
223
+ attention_scale_9.0 4.08
224
+ attention_scale_7.0 4.09
225
+ attention_scale_4.0 4.1
226
+ attention_scale_6.0 4.1
227
+ attention_scale_3.0 4.11
228
+ attention_scale_5.0 4.11
229
+ attention_scale_2.3 4.12
230
+ attention_scale_2.5 4.12
231
+ attention_scale_1.9 4.13
232
+ attention_scale_2.0 4.13
233
+ attention_scale_2.1 4.13
234
+ attention_scale_2.2 4.13
235
+ attention_scale_1.7 4.14
236
+ attention_scale_1.5 4.15
237
+ attention_scale_1.2 4.17
238
+ attention_scale_1.3 4.17
239
+ attention_scale_1.1 4.18
240
+ attention_scale_1.0 4.2
241
+ attention_scale_0.9 4.21
242
+ attention_scale_0.7 4.26
243
+ attention_scale_0.6 4.31
244
+ attention_scale_0.5 4.33
245
+ attention_scale_0.3 4.5
246
+ attention_scale_0.1 4.74
247
+ attention_scale_0.08 4.77
248
+ attention_scale_0.05 4.83
249
+ attention_scale_0.01 4.93
250
+
251
+ 2024-09-21 18:06:37,782 INFO [ctc_decode.py:985] Done!
decoding_results/attention-decoder-rescoring-no-ngram/recogs-test-clean-epoch-50_avg-20_use-averaged-model.txt ADDED
The diff for this file is too large to render. See raw diff
 
decoding_results/attention-decoder-rescoring-no-ngram/recogs-test-other-epoch-50_avg-20_use-averaged-model.txt ADDED
The diff for this file is too large to render. See raw diff
 
decoding_results/attention-decoder-rescoring-no-ngram/wer-summary-test-clean-epoch-50_avg-20_use-averaged-model.txt ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ settings WER
2
+ attention_scale_3.0 1.96
3
+ attention_scale_5.0 1.96
4
+ attention_scale_6.0 1.96
5
+ attention_scale_7.0 1.96
6
+ attention_scale_8.0 1.96
7
+ attention_scale_9.0 1.96
8
+ attention_scale_2.1 1.97
9
+ attention_scale_2.2 1.97
10
+ attention_scale_2.3 1.97
11
+ attention_scale_2.5 1.97
12
+ attention_scale_4.0 1.97
13
+ attention_scale_1.7 1.98
14
+ attention_scale_1.9 1.98
15
+ attention_scale_2.0 1.98
16
+ attention_scale_1.5 2.0
17
+ attention_scale_1.3 2.01
18
+ attention_scale_1.2 2.02
19
+ attention_scale_1.0 2.04
20
+ attention_scale_1.1 2.04
21
+ attention_scale_0.9 2.05
22
+ attention_scale_0.7 2.08
23
+ attention_scale_0.6 2.13
24
+ attention_scale_0.5 2.17
25
+ attention_scale_0.3 2.28
26
+ attention_scale_0.1 2.39
27
+ attention_scale_0.08 2.43
28
+ attention_scale_0.05 2.48
29
+ attention_scale_0.01 2.53
decoding_results/attention-decoder-rescoring-no-ngram/wer-summary-test-other-epoch-50_avg-20_use-averaged-model.txt ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ settings WER
2
+ attention_scale_8.0 4.08
3
+ attention_scale_9.0 4.08
4
+ attention_scale_7.0 4.09
5
+ attention_scale_4.0 4.1
6
+ attention_scale_6.0 4.1
7
+ attention_scale_3.0 4.11
8
+ attention_scale_5.0 4.11
9
+ attention_scale_2.3 4.12
10
+ attention_scale_2.5 4.12
11
+ attention_scale_1.9 4.13
12
+ attention_scale_2.0 4.13
13
+ attention_scale_2.1 4.13
14
+ attention_scale_2.2 4.13
15
+ attention_scale_1.7 4.14
16
+ attention_scale_1.5 4.15
17
+ attention_scale_1.2 4.17
18
+ attention_scale_1.3 4.17
19
+ attention_scale_1.1 4.18
20
+ attention_scale_1.0 4.2
21
+ attention_scale_0.9 4.21
22
+ attention_scale_0.7 4.26
23
+ attention_scale_0.6 4.31
24
+ attention_scale_0.5 4.33
25
+ attention_scale_0.3 4.5
26
+ attention_scale_0.1 4.74
27
+ attention_scale_0.08 4.77
28
+ attention_scale_0.05 4.83
29
+ attention_scale_0.01 4.93
exp/decode.sh ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
#!/usr/bin/env bash
#
# Decode with ./zipformer/ctc_decode.py using checkpoint settings
# --epoch 50 --avg 20 and the "attention-decoder-rescoring-no-ngram" method.
#
# Usage: bash exp/decode.sh [extra ctc_decode.py options...]
#
# The Python entry point is referenced by a relative path, so this must be
# launched from the directory that contains zipformer/ (presumably the
# icefall recipe directory -- confirm against your checkout).

# Abort on the first failing command, unset variable, or failed pipeline stage.
set -euo pipefail

# Decoding is pinned to the first GPU only.
export CUDA_VISIBLE_DEVICES=0

# Model-definition flags. The same values appear in exp/train.sh and
# exp/export.sh; NOTE(review): they presumably must match the values used at
# training time for the checkpoint to load -- keep the three scripts in sync.
model_args=(
  --use-cr-ctc 1
  --use-ctc 1
  --use-transducer 0
  --use-attention-decoder 1
  --num-encoder-layers 2,2,4,5,4,2
  --feedforward-dim 512,768,1536,2048,1536,768
  --encoder-dim 192,256,512,768,512,256
  --encoder-unmasked-dim 192,192,256,320,256,192
)

# Any arguments given to this script are forwarded after the defaults; with no
# arguments the command line is identical to the original one.
./zipformer/ctc_decode.py \
  --epoch 50 \
  --avg 20 \
  --exp-dir zipformer/exp-large-cr-ctc-aed/ \
  "${model_args[@]}" \
  --max-duration 200 \
  --decoding-method attention-decoder-rescoring-no-ngram \
  "$@"
exp/epoch-50.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8119c491ec65c20b0439eb6d1a06bd85c6789ac17d345aa5cd11aa9fd01cc2c5
3
+ size 2790384782
exp/export.sh ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
#!/usr/bin/env bash
#
# Run ./zipformer/export.py for the experiment in
# zipformer/exp-large-cr-ctc-aed with --epoch 50 --avg 20.
#
# Usage: bash exp/export.sh [extra export.py options...]
#
# Paths are relative, so this must be launched from the directory that
# contains both zipformer/ and data/lang_bpe_500/tokens.txt.
# NOTE(review): presumably this is what produces exp/pretrained.pt -- confirm
# against export.py.

# Abort on the first failing command, unset variable, or failed pipeline stage.
set -euo pipefail

# Model-definition flags. The same values appear in exp/train.sh and
# exp/decode.sh; NOTE(review): they presumably must match the values used at
# training time for the checkpoint to load -- keep the three scripts in sync.
model_args=(
  --use-cr-ctc 1
  --use-ctc 1
  --use-transducer 0
  --use-attention-decoder 1
  --num-encoder-layers 2,2,4,5,4,2
  --feedforward-dim 512,768,1536,2048,1536,768
  --encoder-dim 192,256,512,768,512,256
  --encoder-unmasked-dim 192,192,256,320,256,192
)

# Any arguments given to this script are forwarded after the defaults; with no
# arguments the command line is identical to the original one.
./zipformer/export.py \
  --exp-dir zipformer/exp-large-cr-ctc-aed \
  "${model_args[@]}" \
  --tokens data/lang_bpe_500/tokens.txt \
  --epoch 50 \
  --avg 20 \
  "$@"
exp/log/log-train-2024-09-16-12-25-21-0 ADDED
The diff for this file is too large to render. See raw diff
 
exp/log/log-train-2024-09-16-12-25-21-1 ADDED
The diff for this file is too large to render. See raw diff
 
exp/pretrained.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:393af324fbda9d0f9126f3909e3adc08ffcce03c29bdf3c344e1fa4256322b77
3
+ size 697818201
exp/tensorboard/events.out.tfevents.1726460721.NGK_zengwei.62835.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42d5ea9552cc6f98c38a1e3b486979efd316da0384259612224252494eef2330
3
+ size 2767319
exp/train.sh ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
#!/usr/bin/env bash
#
# Launch ./zipformer/train.py for 50 epochs on two GPUs, writing to
# zipformer/exp-large-cr-ctc-aed.
#
# Usage: bash exp/train.sh [extra train.py options...]
#
# The Python entry point is referenced by a relative path, so this must be
# launched from the directory that contains zipformer/.

# Abort on the first failing command, unset variable, or failed pipeline stage.
set -euo pipefail

# Two devices are exposed; --world-size below is set to the same count.
export CUDA_VISIBLE_DEVICES="0,1"

# Model-definition flags. The same values appear in exp/decode.sh and
# exp/export.sh; keep the three scripts in sync when changing them.
model_args=(
  --use-cr-ctc 1
  --use-ctc 1
  --use-transducer 0
  --use-attention-decoder 1
  --num-encoder-layers 2,2,4,5,4,2
  --feedforward-dim 512,768,1536,2048,1536,768
  --encoder-dim 192,256,512,768,512,256
  --encoder-unmasked-dim 192,192,256,320,256,192
)

# Loss weights, augmentation switches and data/batch settings for this run.
train_args=(
  --ctc-loss-scale 0.1
  --attention-decoder-loss-scale 0.9
  --enable-spec-aug 0
  --cr-loss-scale 0.02
  --time-mask-ratio 2.5
  --full-libri 1
  --max-duration 1200
  --master-port 12345
)

# for non-streaming model training:
# Any arguments given to this script are forwarded after the defaults; with no
# arguments the command line is identical to the original one.
./zipformer/train.py \
  --world-size 2 \
  --num-epochs 50 \
  --start-epoch 1 \
  --use-fp16 1 \
  --exp-dir zipformer/exp-large-cr-ctc-aed \
  "${model_args[@]}" \
  "${train_args[@]}" \
  "$@"