HoneyTian committed on
Commit
68ac03b
·
1 Parent(s): ab39b36
examples/vm_sound_classification/conv2d_classifier.yaml CHANGED
@@ -18,21 +18,21 @@ spec_augment_param:
18
  conv2d_block_param_list:
19
  - batch_norm: true
20
  in_channels: 1
21
- out_channels: 32
22
  kernel_size: 3
23
  stride: 1
24
  dilation: 3
25
  activation: relu
26
  dropout: 0.1
27
- - in_channels: 32
28
- out_channels: 32
29
  kernel_size: 5
30
  stride: 2
31
  dilation: 3
32
  activation: relu
33
  dropout: 0.1
34
- - in_channels: 32
35
- out_channels: 32
36
  kernel_size: 3
37
  stride: 1
38
  dilation: 2
@@ -40,7 +40,7 @@ conv2d_block_param_list:
40
  dropout: 0.1
41
 
42
  cls_head_param:
43
- input_dim: 864
44
  num_layers: 2
45
  hidden_dims:
46
  - 128
 
18
  conv2d_block_param_list:
19
  - batch_norm: true
20
  in_channels: 1
21
+ out_channels: 16
22
  kernel_size: 3
23
  stride: 1
24
  dilation: 3
25
  activation: relu
26
  dropout: 0.1
27
+ - in_channels: 16
28
+ out_channels: 16
29
  kernel_size: 5
30
  stride: 2
31
  dilation: 3
32
  activation: relu
33
  dropout: 0.1
34
+ - in_channels: 16
35
+ out_channels: 16
36
  kernel_size: 3
37
  stride: 1
38
  dilation: 2
 
40
  dropout: 0.1
41
 
42
  cls_head_param:
43
+ input_dim: 432
44
  num_layers: 2
45
  hidden_dims:
46
  - 128
examples/vm_sound_classification/run.sh CHANGED
@@ -12,7 +12,7 @@ sh run.sh --stage 2 --stop_stage 2 --system_version windows --file_folder_name f
12
  E:/Users/tianx/HuggingDatasets/vm_sound_classification/data/wav_finished/id-ID/wav_finished/*/*.wav" \
13
  --label_plan 4
14
 
15
- sh run.sh --stage 0 --stop_stage 5 --system_version centos --file_folder_name file_dir --final_model_name vm_sound_classification2-ch32 \
16
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" --label_plan 2
17
 
18
  "
 
12
  E:/Users/tianx/HuggingDatasets/vm_sound_classification/data/wav_finished/id-ID/wav_finished/*/*.wav" \
13
  --label_plan 4
14
 
15
+ sh run.sh --stage 0 --stop_stage 5 --system_version centos --file_folder_name file_dir --final_model_name vm_sound_classification2-ch16 \
16
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" --label_plan 2
17
 
18
  "