# File size: 4,484 Bytes

# d301339

# General training options (keys are dumped in alphabetical order).
# NOTE(review): presumably gradients are accumulated over 16 iterations per
# optimizer step — confirm against the trainer.
accum_grad: 16
# NOTE(review): use_adapter is false further down in this file, so this
# adapter choice looks inactive — confirm.
adapter: lora
adapter_conf: {}
allow_multi_rates: false
allow_variable_data_keys: false
aux_ctc_tasks: []
# batch_type is "sorted" with batch_size 4.
# NOTE(review): batch_bins presumably only applies to bin-based batch types —
# confirm before tuning it.
batch_bins: 1000000
batch_size: 4
batch_type: sorted
# A list of three-element lists; this file defines a single entry
# (valid, loss, min).
# NOTE(review): presumably [phase, metric, mode] — confirm.
best_model_criterion:
- - valid
  - loss
  - min
bpemodel: null
# NOTE(review): the chunk_* keys presumably only matter for a chunk-based
# iterator; iterator_type is "sequence" in this file — confirm.
chunk_default_fs: null
chunk_excluded_key_prefixes: []
chunk_length: 500
chunk_shift_ratio: 0.5
cleaner: null
collect_stats: false
create_graph_in_tensorboard: false
# CTC loss settings; ctc_type selects "droctc".
# NOTE(review): presumably a distributionally-robust CTC variant whose
# parameters are the dro_* / step-size keys below — confirm against the
# implementation.
ctc_conf:
  accumulation: false
  agg: mean
  ctc_type: droctc
  # token_list in this file holds exactly six bracketed tags
  # ('[slv]', '[mrj]', '[sot]', '[spa]', '[urd]', '[snd]').
  # NOTE(review): presumably one DRO group per tag — confirm.
  dro_group_count: 6
  dro_q_epsilon: 1.0e-10
  dro_step_size: 0.0001
  # NOTE(review): scheduling is false below, so final_step_size,
  # initial_step_size and warmup_steps are presumably unused — confirm.
  final_step_size: 0.001
  init_strategy: uniform
  initial_step_size: 0.0001
  laplace_smoothing: 0.0
  # Same value as the top-level max_epoch; keep the two in sync.
  max_epoch: 40
  normalize_grad: false
  # Same value as the top-level num_iters_per_epoch; keep the two in sync.
  num_iters_per_epoch: 1200
  running_mean_window: -1
  scheduling: false
  use_running_mean: false
  warmup_steps: 0
# cuDNN is enabled with benchmark mode off and deterministic mode on.
cudnn_benchmark: false
cudnn_deterministic: true
cudnn_enabled: true
# No decoder is configured; model_conf.ctc_weight is 1.0 in this file.
# NOTE(review): presumably a pure-CTC model — confirm.
decoder: null
decoder_conf: {}
detect_anomaly: false
distributed: false
drop_last_iter: false
dry_run: false
duration_batch_length: -1
# A flat three-element list (valid, loss, min); unlike best_model_criterion
# it is not nested.
# NOTE(review): patience is null in this file, so early stopping presumably
# never triggers — confirm.
early_stopping_criterion:
- valid
- loss
- min
# Encoder selection and its hyper-parameters: 2 blocks, 8 attention heads,
# output_size 256, linear_units 1024, and 0.1 for all three dropout rates.
encoder: transformer
encoder_conf:
  attention_dropout_rate: 0.1
  attention_heads: 8
  dropout_rate: 0.1
  # NOTE(review): presumably a 2-D convolutional input layer with 2x time
  # subsampling — confirm against the encoder implementation.
  input_layer: conv2d2
  linear_units: 1024
  normalize_before: true
  num_blocks: 2
  output_size: 256
  positional_dropout_rate: 0.1
exclude_weight_decay: false
exclude_weight_decay_conf: {}
# Two entries: 80000 and 150.
# NOTE(review): presumably one fold length per data stream (speech, text) —
# confirm.
fold_length:
- 80000
- 150
# Empty list: no parameters are listed for freezing.
# NOTE(review): the pretrained s3prl frontend would then presumably be
# trainable — confirm this is intended.
freeze_param: []
# Feature frontend: s3prl with the hf_wav2vec2_custom upstream pointed at
# facebook/mms-300m; downloads go under ./hub.
frontend: s3prl
frontend_conf:
  download_dir: ./hub
  # Nested mapping with the same key name as its parent; this is the part
  # that names the upstream model.
  frontend_conf:
    path_or_url: facebook/mms-300m
    upstream: hf_wav2vec2_custom
  # Loaded as the string "16k", not a number.
  # NOTE(review): presumably parsed by the consumer as 16000 Hz — confirm.
  fs: 16k
  multilayer_feature: true
g2p: null
# NOTE(review): presumably gradient-norm clipping at 5.0 using norm type 2.0
# (L2) — confirm against the trainer.
grad_clip: 5.0
grad_clip_type: 2.0
grad_noise: false
ignore_init_mismatch: false
init: xavier_uniform
# Empty list: no initial parameter files are listed here.
init_param: []
input_size: null
iterator_type: sequence
joint_net_conf: null
keep_nbest_models: 3
log_interval: null
log_level: INFO
max_cache_fd: 32
max_cache_size: 0.0
# The same value is repeated as ctc_conf.max_epoch; keep the two in sync.
max_epoch: 40
model: espnet
# ctc_weight is 1.0 and decoder is null in this file.
# NOTE(review): presumably the loss is CTC only — confirm.
model_conf:
  ctc_weight: 1.0
multiple_iterator: false
multiprocessing_distributed: false
nbest_averaging_interval: 0
ngpu: 1
no_forward_run: false
noise_apply_prob: 1.0
# Must stay quoted: YAML 1.1 loaders read a bare 13_15 as the integer 1315.
noise_db_range: '13_15'
# NOTE(review): noise_scp is null, so noise augmentation is presumably off
# despite noise_apply_prob being 1.0 — confirm.
noise_scp: null
non_linguistic_symbols: ./nlsyms.txt
normalize: utterance_mvn
normalize_conf: {}
num_att_plot: 3
num_cache_chunks: 1024
# The same value is repeated as ctc_conf.num_iters_per_epoch; keep in sync.
num_iters_per_epoch: 1200
num_workers: 4
# Optimizer: adam with lr 0.0001 and weight_decay 1.0e-06.
# NOTE(review): scheduler is null in this file, so the learning rate is
# presumably constant — confirm.
optim: adam
optim_conf:
  lr: 0.0001
  weight_decay: 1.0e-06
# Relative path; it is also listed under "required" in this file.
output_dir: ./inference_results
# No patience value is set.
patience: null
postencoder: null
postencoder_conf: {}
# Linear pre-encoder mapping input_size 1024 to output_size 80.
# NOTE(review): 1024 presumably matches the feature dimension produced by the
# facebook/mms-300m frontend — confirm.
preencoder: linear
preencoder_conf:
  input_size: 1024
  output_size: 80
preprocessor: default
preprocessor_conf: {}
pretrain_path: null
print_config: false
# Keys declared as required; both output_dir and token_list are set in this
# file.
required:
- output_dir
- token_list
# NOTE(review): presumably resumes from an existing checkpoint in output_dir
# when one is present — confirm.
resume: true
rir_apply_prob: 1.0
# NOTE(review): rir_scp is null, so RIR augmentation is presumably off
# despite rir_apply_prob being 1.0 — confirm.
rir_scp: null
save_strategy: all
# No LR scheduler is configured.
scheduler: null
scheduler_conf: {}
seed: 0
sharded_ddp: false
short_noise_thres: 0.5
shuffle_within_batch: false
sort_batch: descending
sort_in_batch: descending
# SpecAugment settings: time warp, frequency masking and time masking are
# all switched on.
specaug: specaug
specaug_conf:
  apply_freq_mask: true
  apply_time_mask: true
  apply_time_warp: true
  # Two frequency masks, each with a width range of [0, 27].
  freq_mask_width_range:
  - 0
  - 27
  num_freq_mask: 2
  # Ten time masks; the width is given as a ratio range [0.0, 0.05].
  # NOTE(review): presumably a ratio of the utterance length — confirm.
  num_time_mask: 10
  time_mask_width_ratio_range:
  - 0.0
  - 0.05
  time_warp_mode: bicubic
  time_warp_window: 5
speech_volume_normalize: null
# Output vocabulary: 179 entries (token_type is "char" in this file).
# It starts with <blank>, <unk>, <space> and ends with <sos/eos>. In between
# are Latin, Arabic-script and Cyrillic letters, punctuation, digits and six
# bracketed tags ('[slv]', '[mrj]', '[sot]', '[spa]', '[urd]', '[snd]').
# Digits are quoted so they load as strings rather than integers; the
# bracketed tags are quoted so they are not parsed as flow sequences.
# NOTE(review): list position presumably defines the token ID, so entries
# must not be reordered, added or removed for an existing checkpoint —
# confirm.
# NOTE(review): look-alike characters with different code points coexist
# (e.g. Latin A and Cyrillic А, Arabic ي and Persian ی); presumably
# intentional for the multilingual data — confirm.
token_list:
- <blank>
- <unk>
- <space>
- E
- A
- O
- N
- S
- I
- ا
- L
- T
- R
- و
- D
- ن
- ر
- ی
- ي
- M
- U
- H
- P
- ک
- م
- C
- А
- Ӹ
- Н
- B
- ت
- س
- ل
- J
- K
- ہ
- Т
- ے
- G
- Ш
- К
- Е
- Л
- Ы
- V
- М
- ج
- Ӓ
- ه
- ب
- د
- О
- Y
- '[slv]'
- Р
- ڪ
- پ
- Z
- '[mrj]'
- F
- گ
- И
- В
- ئ
- Д
- '[sot]'
- ں
- '[spa]'
- W
- Q
- П
- Г
- ف
- ق
- С
- ع
- ش
- Ж
- ز
- ھ
- آ
- Č
- Í
- У
- ح
- '[urd]'
- Š
- ٹ
- چ
- Ь
- ٽ
- '[snd]'
- ڻ
- Й
- ط
- ص
- ٿ
- Ц
- خ
- Ó
- Я
- Á
- É
- Ч
- ۾
- '0'
- Ž
- З
- '1'
- ۽
- –
- ڏ
- Э
- ڊ
- —
- ڈ
- ء
- Ñ
- ڙ
- ِ
- '2'
- ٻ
- Х
- Ӱ
- ظ
- ض
- ث
- ڳ
- ،
- X
- ¡
- غ
- ڑ
- Ӧ
- ذ
- ¿
- '5'
- ڌ
- '3'
- ڀ
- ُ
- '9'
- Ú
- '4'
- '8'
- ۔
- '6'
- ٺ
- Ю
- »
- Б
- «
- ڇ
- ً
- ڃ
- '7'
- ڄ
- ؤ
- ڍ
- Ф
- َ
- ٰ
- ّ
- ڱ
- ”
- ژ
- ڦ
- Ё
- ؛
- ٍ
- Щ
- ؟
- ’
- ‘
- °
- ۃ
- إ
- Ć
- <sos/eos>
# Tokens are characters; token_list nevertheless contains multi-character
# entries such as <space> and the bracketed tags.
token_type: char
# float32 training with use_amp false below.
train_dtype: float32
unused_parameters: true
# Adapter use is off even though "adapter: lora" is set earlier in this file.
use_adapter: false
use_amp: false
use_lang_prompt: false
use_matplotlib: true
use_nlp_prompt: false
use_preprocessor: true
use_tensorboard: true
# Two-element list (valid, loss).
# NOTE(review): scheduler is null in this file, so this criterion is
# presumably unused — confirm.
val_scheduler_criterion:
- valid
- loss
# NOTE(review): the valid_* keys are all null; presumably they fall back to
# the corresponding training values — confirm.
valid_batch_bins: null
valid_batch_size: null
valid_batch_type: null
valid_iterator_type: null
valid_max_cache_size: null
# Quoted so it stays the string '202402' rather than an integer.
version: '202402'
write_collected_feats: false