HoneyTian committed on
Commit
6f7cbba
·
1 Parent(s): e6a1b81
examples/vm_sound_classification/run.sh CHANGED
@@ -20,7 +20,7 @@ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name fi
20
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-ch32 \
21
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
22
  --label_plan 2-voicemail \
23
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
24
 
25
  END
26
 
@@ -37,6 +37,7 @@ final_model_name=final_model_name
37
  filename_patterns="/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav"
38
  label_plan=4
39
  config_file="yaml/conv2d-classifier-2-ch4.yaml"
 
40
  nohup_name=nohup.out
41
 
42
  country=en-US
@@ -130,6 +131,7 @@ if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ]; then
130
  --valid_dataset "${valid_dataset}" \
131
  --serialization_dir "${file_dir}" \
132
  --config_file "${config_file}" \
 
133
 
134
  fi
135
 
 
20
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-ch32 \
21
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
22
  --label_plan 2-voicemail \
23
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml"
24
 
25
  END
26
 
 
37
  filename_patterns="/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav"
38
  label_plan=4
39
  config_file="yaml/conv2d-classifier-2-ch4.yaml"
40
+ pretrained_model=null
41
  nohup_name=nohup.out
42
 
43
  country=en-US
 
131
  --valid_dataset "${valid_dataset}" \
132
  --serialization_dir "${file_dir}" \
133
  --config_file "${config_file}" \
134
+ --pretrained_model "${pretrained_model}" \
135
 
136
  fi
137
 
examples/vm_sound_classification/run_batch.sh CHANGED
@@ -3,80 +3,80 @@
3
 
4
  # sound ch4
5
 
6
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-2-ch4 \
7
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
8
- --label_plan 2 \
9
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
10
-
11
-
12
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-ch4 \
13
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
14
- --label_plan 3 \
15
- --config_file "yaml/conv2d-classifier-3-ch4.yaml"
16
-
17
-
18
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-ch4 \
19
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
20
- --label_plan 4 \
21
- --config_file "yaml/conv2d-classifier-4-ch4.yaml"
22
-
23
-
24
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-8-ch4 \
25
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
26
- --label_plan 8 \
27
- --config_file "yaml/conv2d-classifier-8-ch4.yaml"
28
 
29
 
30
  # sound ch8
31
 
32
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-2-ch8 \
33
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
34
- --label_plan 2 \
35
- --config_file "yaml/conv2d-classifier-2-ch8.yaml"
36
-
37
-
38
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-ch8 \
39
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
40
- --label_plan 3 \
41
- --config_file "yaml/conv2d-classifier-3-ch8.yaml"
42
-
43
-
44
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-ch8 \
45
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
46
- --label_plan 4 \
47
- --config_file "yaml/conv2d-classifier-4-ch8.yaml"
48
-
49
-
50
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-8-ch8 \
51
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
52
- --label_plan 8 \
53
- --config_file "yaml/conv2d-classifier-8-ch8.yaml"
54
 
55
 
56
  # sound ch16
57
 
58
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-2-ch16 \
59
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
60
- --label_plan 2 \
61
- --config_file "yaml/conv2d-classifier-2-ch16.yaml"
62
-
63
-
64
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-ch16 \
65
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
66
- --label_plan 3 \
67
- --config_file "yaml/conv2d-classifier-3-ch16.yaml"
68
-
69
-
70
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-ch16 \
71
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
72
- --label_plan 4 \
73
- --config_file "yaml/conv2d-classifier-4-ch16.yaml"
74
-
75
-
76
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-8-ch16 \
77
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
78
- --label_plan 8 \
79
- --config_file "yaml/conv2d-classifier-8-ch16.yaml"
80
 
81
 
82
  # sound ch32
@@ -99,10 +99,23 @@ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name fi
99
  #--config_file "yaml/conv2d-classifier-4-ch32.yaml"
100
 
101
 
102
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-8-ch32 \
103
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
104
- --label_plan 8 \
105
- --config_file "yaml/conv2d-classifier-8-ch32.yaml"
 
 
 
 
 
 
 
 
 
 
 
 
 
106
 
107
 
108
  # voicemail ch4
@@ -110,57 +123,68 @@ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name fi
110
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-sg-2-ch4 \
111
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-SG/wav_finished/*/*.wav" \
112
  --label_plan 2-voicemail \
113
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
114
 
115
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-us-2-ch4 \
116
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-US/wav_finished/*/*.wav" \
117
  --label_plan 2-voicemail \
118
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
119
 
120
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-mx-2-ch4 \
121
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-MX/wav_finished/*/*.wav" \
122
  --label_plan 2-voicemail \
123
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
124
 
125
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-pe-2-ch4 \
126
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-PE/wav_finished/*/*.wav" \
127
  --label_plan 2-voicemail \
128
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
129
 
130
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-id-id-2-ch4 \
131
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/id-ID/wav_finished/*/*.wav" \
132
  --label_plan 2-voicemail \
133
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
134
 
135
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ja-JP-2-ch4 \
136
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ja-JP/wav_finished/*/*.wav" \
137
  --label_plan 2-voicemail \
138
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
139
 
140
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ko-kr-2-ch4 \
141
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ko-KR/wav_finished/*/*.wav" \
142
  --label_plan 2-voicemail \
143
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
144
 
145
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-ch4 \
146
- #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
147
- #--label_plan 2-voicemail \
148
- #--config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
149
 
150
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-pt-br-2-ch4 \
151
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/pt-BR/wav_finished/*/*.wav" \
152
  --label_plan 2-voicemail \
153
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
154
 
155
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-th-th-2-ch4 \
156
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/th-TH/wav_finished/*/*.wav" \
157
  --label_plan 2-voicemail \
158
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
159
 
160
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-zh-tw-2-ch4 \
161
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/zh-TW/wav_finished/*/*.wav" \
162
  --label_plan 2-voicemail \
163
- --config_file "yaml/conv2d-classifier-2-ch4.yaml"
 
164
 
165
 
166
  # voicemail ch32
@@ -168,54 +192,65 @@ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name fi
168
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-sg-2-ch32 \
169
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-SG/wav_finished/*/*.wav" \
170
  --label_plan 2-voicemail \
171
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
172
 
173
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-us-2-ch32 \
174
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-US/wav_finished/*/*.wav" \
175
  --label_plan 2-voicemail \
176
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
177
 
178
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-mx-2-ch32 \
179
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-MX/wav_finished/*/*.wav" \
180
  --label_plan 2-voicemail \
181
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
182
 
183
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-pe-2-ch32 \
184
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-PE/wav_finished/*/*.wav" \
185
  --label_plan 2-voicemail \
186
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
187
 
188
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-id-id-2-ch32 \
189
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/id-ID/wav_finished/*/*.wav" \
190
  --label_plan 2-voicemail \
191
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
192
 
193
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ja-JP-2-ch32 \
194
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ja-JP/wav_finished/*/*.wav" \
195
  --label_plan 2-voicemail \
196
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
197
 
198
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ko-kr-2-ch32 \
199
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ko-KR/wav_finished/*/*.wav" \
200
  --label_plan 2-voicemail \
201
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
202
 
203
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-ch32 \
204
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
205
  --label_plan 2-voicemail \
206
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
207
 
208
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-pt-br-2-ch32 \
209
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/pt-BR/wav_finished/*/*.wav" \
210
  --label_plan 2-voicemail \
211
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
212
 
213
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-th-th-2-ch32 \
214
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/th-TH/wav_finished/*/*.wav" \
215
  --label_plan 2-voicemail \
216
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
217
 
218
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-zh-tw-2-ch32 \
219
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/zh-TW/wav_finished/*/*.wav" \
220
  --label_plan 2-voicemail \
221
- --config_file "yaml/conv2d-classifier-2-ch32.yaml"
 
 
3
 
4
  # sound ch4
5
 
6
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-2-ch4 \
7
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
8
+ #--label_plan 2 \
9
+ #--config_file "yaml/conv2d-classifier-2-ch4.yaml"
10
+ #
11
+ #
12
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-ch4 \
13
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
14
+ #--label_plan 3 \
15
+ #--config_file "yaml/conv2d-classifier-3-ch4.yaml"
16
+ #
17
+ #
18
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-ch4 \
19
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
20
+ #--label_plan 4 \
21
+ #--config_file "yaml/conv2d-classifier-4-ch4.yaml"
22
+ #
23
+ #
24
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-8-ch4 \
25
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
26
+ #--label_plan 8 \
27
+ #--config_file "yaml/conv2d-classifier-8-ch4.yaml"
28
 
29
 
30
  # sound ch8
31
 
32
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-2-ch8 \
33
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
34
+ #--label_plan 2 \
35
+ #--config_file "yaml/conv2d-classifier-2-ch8.yaml"
36
+ #
37
+ #
38
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-ch8 \
39
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
40
+ #--label_plan 3 \
41
+ #--config_file "yaml/conv2d-classifier-3-ch8.yaml"
42
+ #
43
+ #
44
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-ch8 \
45
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
46
+ #--label_plan 4 \
47
+ #--config_file "yaml/conv2d-classifier-4-ch8.yaml"
48
+ #
49
+ #
50
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-8-ch8 \
51
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
52
+ #--label_plan 8 \
53
+ #--config_file "yaml/conv2d-classifier-8-ch8.yaml"
54
 
55
 
56
  # sound ch16
57
 
58
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-2-ch16 \
59
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
60
+ #--label_plan 2 \
61
+ #--config_file "yaml/conv2d-classifier-2-ch16.yaml"
62
+ #
63
+ #
64
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-ch16 \
65
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
66
+ #--label_plan 3 \
67
+ #--config_file "yaml/conv2d-classifier-3-ch16.yaml"
68
+ #
69
+ #
70
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-ch16 \
71
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
72
+ #--label_plan 4 \
73
+ #--config_file "yaml/conv2d-classifier-4-ch16.yaml"
74
+ #
75
+ #
76
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-8-ch16 \
77
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
78
+ #--label_plan 8 \
79
+ #--config_file "yaml/conv2d-classifier-8-ch16.yaml"
80
 
81
 
82
  # sound ch32
 
99
  #--config_file "yaml/conv2d-classifier-4-ch32.yaml"
100
 
101
 
102
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-8-ch32 \
103
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
104
+ #--label_plan 8 \
105
+ #--config_file "yaml/conv2d-classifier-8-ch32.yaml"
106
+
107
+
108
+ # pretrained voicemail
109
+
110
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-2-ch4 \
111
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
112
+ #--label_plan 2-voicemail \
113
+ #--config_file "yaml/conv2d-classifier-2-ch4.yaml"
114
+ #
115
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-2-ch32 \
116
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
117
+ #--label_plan 2-voicemail \
118
+ #--config_file "yaml/conv2d-classifier-2-ch32.yaml"
119
 
120
 
121
  # voicemail ch4
 
123
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-sg-2-ch4 \
124
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-SG/wav_finished/*/*.wav" \
125
  --label_plan 2-voicemail \
126
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
127
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
128
 
129
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-us-2-ch4 \
130
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-US/wav_finished/*/*.wav" \
131
  --label_plan 2-voicemail \
132
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
133
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
134
 
135
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-mx-2-ch4 \
136
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-MX/wav_finished/*/*.wav" \
137
  --label_plan 2-voicemail \
138
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
139
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
140
 
141
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-pe-2-ch4 \
142
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-PE/wav_finished/*/*.wav" \
143
  --label_plan 2-voicemail \
144
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
145
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
146
 
147
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-id-id-2-ch4 \
148
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/id-ID/wav_finished/*/*.wav" \
149
  --label_plan 2-voicemail \
150
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
151
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
152
 
153
+ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ja-jp-2-ch4 \
154
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ja-JP/wav_finished/*/*.wav" \
155
  --label_plan 2-voicemail \
156
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
157
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
158
 
159
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ko-kr-2-ch4 \
160
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ko-KR/wav_finished/*/*.wav" \
161
  --label_plan 2-voicemail \
162
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
163
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
164
 
165
+ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-ch4 \
166
+ --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
167
+ --label_plan 2-voicemail \
168
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
169
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
170
 
171
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-pt-br-2-ch4 \
172
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/pt-BR/wav_finished/*/*.wav" \
173
  --label_plan 2-voicemail \
174
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
175
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
176
 
177
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-th-th-2-ch4 \
178
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/th-TH/wav_finished/*/*.wav" \
179
  --label_plan 2-voicemail \
180
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
181
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
182
 
183
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-zh-tw-2-ch4 \
184
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/zh-TW/wav_finished/*/*.wav" \
185
  --label_plan 2-voicemail \
186
+ --config_file "yaml/conv2d-classifier-2-ch4.yaml" \
187
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch4.zip"
188
 
189
 
190
  # voicemail ch32
 
192
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-sg-2-ch32 \
193
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-SG/wav_finished/*/*.wav" \
194
  --label_plan 2-voicemail \
195
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
196
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
197
 
198
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-us-2-ch32 \
199
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-US/wav_finished/*/*.wav" \
200
  --label_plan 2-voicemail \
201
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
202
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
203
 
204
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-mx-2-ch32 \
205
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-MX/wav_finished/*/*.wav" \
206
  --label_plan 2-voicemail \
207
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
208
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
209
 
210
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-pe-2-ch32 \
211
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-PE/wav_finished/*/*.wav" \
212
  --label_plan 2-voicemail \
213
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
214
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
215
 
216
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-id-id-2-ch32 \
217
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/id-ID/wav_finished/*/*.wav" \
218
  --label_plan 2-voicemail \
219
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
220
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
221
 
222
+ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ja-jp-2-ch32 \
223
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ja-JP/wav_finished/*/*.wav" \
224
  --label_plan 2-voicemail \
225
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
226
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
227
 
228
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ko-kr-2-ch32 \
229
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ko-KR/wav_finished/*/*.wav" \
230
  --label_plan 2-voicemail \
231
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
232
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
233
 
234
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-ch32 \
235
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
236
  --label_plan 2-voicemail \
237
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
238
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
239
 
240
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-pt-br-2-ch32 \
241
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/pt-BR/wav_finished/*/*.wav" \
242
  --label_plan 2-voicemail \
243
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
244
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
245
 
246
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-th-th-2-ch32 \
247
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/th-TH/wav_finished/*/*.wav" \
248
  --label_plan 2-voicemail \
249
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
250
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
251
 
252
  sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-zh-tw-2-ch32 \
253
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/zh-TW/wav_finished/*/*.wav" \
254
  --label_plan 2-voicemail \
255
+ --config_file "yaml/conv2d-classifier-2-ch32.yaml" \
256
+ --pretrained_model "/data/tianxing/PycharmProjects/vm_sound_classification/trained_models/voicemail-2-ch32.zip"
examples/vm_sound_classification/step_1_prepare_data.py CHANGED
@@ -19,7 +19,6 @@ from tqdm import tqdm
19
  def get_args():
20
  parser = argparse.ArgumentParser()
21
  parser.add_argument("--file_dir", default="./", type=str)
22
- parser.add_argument("--task", default="default", type=str)
23
  parser.add_argument("--filename_patterns", type=str)
24
 
25
  parser.add_argument("--train_dataset", default="train.xlsx", type=str)
 
19
  def get_args():
20
  parser = argparse.ArgumentParser()
21
  parser.add_argument("--file_dir", default="./", type=str)
 
22
  parser.add_argument("--filename_patterns", type=str)
23
 
24
  parser.add_argument("--train_dataset", default="train.xlsx", type=str)
examples/vm_sound_classification/step_3_train_model.py CHANGED
@@ -11,7 +11,9 @@ from pathlib import Path
11
  import random
12
  import sys
13
  import shutil
 
14
  from typing import List
 
15
 
16
  pwd = os.path.abspath(os.path.dirname(__file__))
17
  sys.path.append(os.path.join(pwd, "../../"))
@@ -21,6 +23,7 @@ import torch
21
  from torch.utils.data.dataloader import DataLoader
22
  from tqdm import tqdm
23
 
 
24
  from toolbox.torch.modules.loss import FocalLoss, HingeLoss, HingeLinear
25
  from toolbox.torch.training.metrics.categorical_accuracy import CategoricalAccuracy
26
  from toolbox.torch.utils.data.vocabulary import Vocabulary
@@ -46,6 +49,12 @@ def get_args():
46
  parser.add_argument("--seed", default=0, type=int)
47
 
48
  parser.add_argument("--config_file", default="conv2d_classifier.yaml", type=str)
 
 
 
 
 
 
49
 
50
  args = parser.parse_args()
51
  return args
@@ -175,6 +184,23 @@ def main():
175
  model = WaveClassifierPretrainedModel(
176
  config=config,
177
  )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
178
  model.to(device)
179
  model.train()
180
 
 
11
  import random
12
  import sys
13
  import shutil
14
+ import tempfile
15
  from typing import List
16
+ import zipfile
17
 
18
  pwd = os.path.abspath(os.path.dirname(__file__))
19
  sys.path.append(os.path.join(pwd, "../../"))
 
23
  from torch.utils.data.dataloader import DataLoader
24
  from tqdm import tqdm
25
 
26
+ from project_settings import project_path
27
  from toolbox.torch.modules.loss import FocalLoss, HingeLoss, HingeLinear
28
  from toolbox.torch.training.metrics.categorical_accuracy import CategoricalAccuracy
29
  from toolbox.torch.utils.data.vocabulary import Vocabulary
 
49
  parser.add_argument("--seed", default=0, type=int)
50
 
51
  parser.add_argument("--config_file", default="conv2d_classifier.yaml", type=str)
52
+ parser.add_argument(
53
+ "--pretrained_model",
54
+ # default=(project_path / "trained_models/voicemail-en-sg-2-ch4.zip").as_posix(),
55
+ default="null",
56
+ type=str
57
+ )
58
 
59
  args = parser.parse_args()
60
  return args
 
184
  model = WaveClassifierPretrainedModel(
185
  config=config,
186
  )
187
+
188
+ if args.pretrained_model is not None and os.path.exists(args.pretrained_model):
189
+ logger.info(f"load pretrained model state dict from: {args.pretrained_model}")
190
+ with zipfile.ZipFile(args.pretrained_model, "r") as f_zip:
191
+ out_root = Path(tempfile.gettempdir()) / "vm_sound_classification"
192
+ # print(out_root.as_posix())
193
+ if out_root.exists():
194
+ shutil.rmtree(out_root.as_posix())
195
+ out_root.mkdir(parents=True, exist_ok=True)
196
+ f_zip.extractall(path=out_root)
197
+
198
+ tgt_path = out_root / os.path.basename(args.pretrained_model)
199
+ model_pt_file = tgt_path / "model.pt"
200
+ with open(model_pt_file, "r") as f:
201
+ state_dict = torch.load(f, map_location="cpu")
202
+ model.load_state_dict(state_dict=state_dict)
203
+
204
  model.to(device)
205
  model.train()
206