# Scraped page header (not part of the config): Spaces: Running | File size: 747 Bytes | bfa885e
# Name of the model this configuration describes.
model_name: 'cnn_audio_classifier'
# Mel-spectrogram front-end settings. All keys below belong to this mapping.
# NOTE(review): units are not stated in this file. If the consumer follows the
# torchaudio MelSpectrogram convention (lengths in samples, frequencies in Hz),
# then at 8000 Hz win_length 200 = 25 ms, hop_length 80 = 10 ms, and f_max 3800
# sits just under the 4000 Hz Nyquist limit -- confirm against the loader.
mel_spectrogram_param:
  sample_rate: 8000
  n_fft: 512
  win_length: 200
  hop_length: 80
  f_min: 10
  f_max: 3800
  # Passed as a plain string; presumably mapped to a window function by the
  # consumer -- verify the accepted names there.
  window_fn: hamming
  n_mels: 80
# Ordered list of 2-D convolution block settings, one mapping per block.
# Channel counts chain from block to block: 1 -> 4 -> 4 -> 4 (each block's
# in_channels equals the previous block's out_channels).
conv2d_block_param_list:
  # Block 1: the only block that sets batch_norm explicitly.
  - batch_norm: true
    in_channels: 1
    out_channels: 4
    kernel_size: 3
    stride: 1
    dilation: 3
    activation: relu
    dropout: 0.1
  # Block 2: batch_norm is omitted, so whatever default the consumer defines
  # applies -- TODO confirm that default is the intended one.
  - in_channels: 4
    out_channels: 4
    kernel_size: 5
    stride: 2
    dilation: 3
    activation: relu
    dropout: 0.1
  # Block 3: batch_norm omitted as in block 2.
  - in_channels: 4
    out_channels: 4
    kernel_size: 3
    stride: 1
    dilation: 2
    activation: relu
    dropout: 0.1
# Classification head settings.
cls_head_param:
  # NOTE(review): presumably must equal the feature size produced by the
  # convolution stack; that cannot be checked from this file -- confirm.
  input_dim: 108
  num_layers: 2
  # Two entries, matching num_layers above.
  hidden_dims:
    - 128
    - 32
  activations: relu
  dropout: 0.1
  # NOTE(review): the original text had lost all indentation, so placing
  # num_labels inside cls_head_param (rather than at top level) is an
  # assumption -- verify against the code that reads this config.
  num_labels: 3