# call-audio-8 / examples /vm_sound_classification /yaml /conv2d-classifier-4-ch32.yaml
# HoneyTian's picture
# first commit
# bfa885e
# raw
# history blame contribute delete
# 752 Bytes
# Model identifier. Presumably the key the project uses to pick the model
# implementation - confirm against the config loader.
model_name: 'cnn_audio_classifier'
# Mel-spectrogram front-end settings.
# NOTE(review): the key names look like torchaudio MelSpectrogram arguments;
# confirm against the code that consumes this mapping.
mel_spectrogram_param:
  sample_rate: 8000
  n_fft: 512
  # Assuming both values are in samples: 200 samples = 25 ms and
  # 80 samples = 10 ms at the 8000 Hz sample rate above.
  win_length: 200
  hop_length: 80
  f_min: 10
  # Stays below the 4000 Hz Nyquist limit of an 8000 Hz signal.
  f_max: 3800
  window_fn: hamming
  n_mels: 80
# Parameters for three 2-D convolution blocks, one mapping per list item.
# Channel counts chain from item to item: 1 -> 32 -> 32 -> 32.
# NOTE(review): presumably the blocks are applied in list order - confirm.
conv2d_block_param_list:
  # Only this first block sets batch_norm; the other two omit the key and
  # get whatever default the consumer applies.
  - batch_norm: true
    in_channels: 1
    out_channels: 32
    kernel_size: 3
    stride: 1
    dilation: 3
    activation: relu
    dropout: 0.1
  # The only block with stride 2.
  - in_channels: 32
    out_channels: 32
    kernel_size: 5
    stride: 2
    dilation: 3
    activation: relu
    dropout: 0.1
  - in_channels: 32
    out_channels: 32
    kernel_size: 3
    stride: 1
    dilation: 2
    activation: relu
    dropout: 0.1
# Classification head settings.
# NOTE(review): 864 = 27 * 32. That matches 32 output channels times a mel
# axis of 80 bins shrunk 80 -> 74 -> 31 -> 27 by the three conv blocks, if
# they use no padding and the time axis is pooled away - confirm against the
# model code before changing n_mels or any conv block.
cls_head_param:
  input_dim: 864
  # Two layers, matching the two hidden_dims entries below.
  num_layers: 2
  hidden_dims:
    - 128
    - 32
  activations: relu
  dropout: 0.1
# Presumably the number of output classes (the file name carries "-4-").
# NOTE(review): indentation was lost in this copy; kept at top level here -
# confirm it is not meant to be nested under cls_head_param.
num_labels: 4