group-dro_mms_set_4 / config.yaml
Bartelds
Upload checkpoint, sanitized config, and transcripts for group-dro_mms_set_4
d301339
accum_grad: 16
adapter: lora
adapter_conf: {}
allow_multi_rates: false
allow_variable_data_keys: false
aux_ctc_tasks: []
batch_bins: 1000000
batch_size: 4
batch_type: sorted
best_model_criterion:
- - valid
- loss
- min
bpemodel: null
chunk_default_fs: null
chunk_excluded_key_prefixes: []
chunk_length: 500
chunk_shift_ratio: 0.5
cleaner: null
collect_stats: false
create_graph_in_tensorboard: false
ctc_conf:
accumulation: false
agg: mean
ctc_type: droctc
dro_group_count: 6
dro_q_epsilon: 1.0e-10
dro_step_size: 0.0001
final_step_size: 0.001
init_strategy: uniform
initial_step_size: 0.0001
laplace_smoothing: 0.0
max_epoch: 40
normalize_grad: false
num_iters_per_epoch: 1200
running_mean_window: -1
scheduling: false
use_running_mean: false
warmup_steps: 0
cudnn_benchmark: false
cudnn_deterministic: true
cudnn_enabled: true
decoder: null
decoder_conf: {}
detect_anomaly: false
distributed: false
drop_last_iter: false
dry_run: false
duration_batch_length: -1
early_stopping_criterion:
- valid
- loss
- min
encoder: transformer
encoder_conf:
attention_dropout_rate: 0.1
attention_heads: 8
dropout_rate: 0.1
input_layer: conv2d2
linear_units: 1024
normalize_before: true
num_blocks: 2
output_size: 256
positional_dropout_rate: 0.1
exclude_weight_decay: false
exclude_weight_decay_conf: {}
fold_length:
- 80000
- 150
freeze_param: []
frontend: s3prl
frontend_conf:
download_dir: ./hub
frontend_conf:
path_or_url: facebook/mms-300m
upstream: hf_wav2vec2_custom
fs: 16k
multilayer_feature: true
g2p: null
grad_clip: 5.0
grad_clip_type: 2.0
grad_noise: false
ignore_init_mismatch: false
init: xavier_uniform
init_param: []
input_size: null
iterator_type: sequence
joint_net_conf: null
keep_nbest_models: 3
log_interval: null
log_level: INFO
max_cache_fd: 32
max_cache_size: 0.0
max_epoch: 40
model: espnet
model_conf:
ctc_weight: 1.0
multiple_iterator: false
multiprocessing_distributed: false
nbest_averaging_interval: 0
ngpu: 1
no_forward_run: false
noise_apply_prob: 1.0
noise_db_range: '13_15'
noise_scp: null
non_linguistic_symbols: ./nlsyms.txt
normalize: utterance_mvn
normalize_conf: {}
num_att_plot: 3
num_cache_chunks: 1024
num_iters_per_epoch: 1200
num_workers: 4
optim: adam
optim_conf:
lr: 0.0001
weight_decay: 1.0e-06
output_dir: ./inference_results
patience: null
postencoder: null
postencoder_conf: {}
preencoder: linear
preencoder_conf:
input_size: 1024
output_size: 80
preprocessor: default
preprocessor_conf: {}
pretrain_path: null
print_config: false
required:
- output_dir
- token_list
resume: true
rir_apply_prob: 1.0
rir_scp: null
save_strategy: all
scheduler: null
scheduler_conf: {}
seed: 0
sharded_ddp: false
short_noise_thres: 0.5
shuffle_within_batch: false
sort_batch: descending
sort_in_batch: descending
specaug: specaug
specaug_conf:
apply_freq_mask: true
apply_time_mask: true
apply_time_warp: true
freq_mask_width_range:
- 0
- 27
num_freq_mask: 2
num_time_mask: 10
time_mask_width_ratio_range:
- 0.0
- 0.05
time_warp_mode: bicubic
time_warp_window: 5
speech_volume_normalize: null
token_list:
- <blank>
- <unk>
- <space>
- E
- A
- O
- N
- S
- I
- ا
- L
- T
- R
- و
- D
- ن
- ر
- ی
- ي
- M
- U
- H
- P
- ک
- م
- C
- А
- Ӹ
- Н
- B
- ت
- س
- ل
- J
- K
- ہ
- Т
- ے
- G
- Ш
- К
- Е
- Л
- Ы
- V
- М
- ج
- Ӓ
- ه
- ب
- د
- О
- Y
- '[slv]'
- Р
- ڪ
- پ
- Z
- '[mrj]'
- F
- گ
- И
- В
- ئ
- Д
- '[sot]'
- ں
- '[spa]'
- W
- Q
- П
- Г
- ف
- ق
- С
- ع
- ش
- Ж
- ز
- ھ
- آ
- Č
- Í
- У
- ح
- '[urd]'
- Š
- ٹ
- چ
- Ь
- ٽ
- '[snd]'
- ڻ
- Й
- ط
- ص
- ٿ
- Ц
- خ
- Ó
- Я
- Á
- É
- Ч
- ۾
- '0'
- Ž
- З
- '1'
- ۽
-
- ڏ
- Э
- ڊ
-
- ڈ
- ء
- Ñ
- ڙ
- ِ
- '2'
- ٻ
- Х
- Ӱ
- ظ
- ض
- ث
- ڳ
- ،
- X
- ¡
- غ
- ڑ
- Ӧ
- ذ
- ¿
- '5'
- ڌ
- '3'
- ڀ
- ُ
- '9'
- Ú
- '4'
- '8'
- ۔
- '6'
- ٺ
- Ю
- »
- Б
- «
- ڇ
- ً
- ڃ
- '7'
- ڄ
- ؤ
- ڍ
- Ф
- َ
- ٰ
- ّ
- ڱ
-
- ژ
- ڦ
- Ё
- ؛
- ٍ
- Щ
- ؟
-
-
- °
- ۃ
- إ
- Ć
- <sos/eos>
token_type: char
train_dtype: float32
unused_parameters: true
use_adapter: false
use_amp: false
use_lang_prompt: false
use_matplotlib: true
use_nlp_prompt: false
use_preprocessor: true
use_tensorboard: true
val_scheduler_criterion:
- valid
- loss
valid_batch_bins: null
valid_batch_size: null
valid_batch_type: null
valid_iterator_type: null
valid_max_cache_size: null
version: '202402'
write_collected_feats: false