HoneyTian committed on
Commit
2664dbf
·
1 Parent(s): f0e8674
examples/sound_classification_by_cnn/run_batch_l3.sh CHANGED
@@ -9,10 +9,10 @@
9
  #--config_file "yaml/conv2d-classifier-2-l3-ch4.yaml"
10
 
11
 
12
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-l3-ch4-cnn \
13
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
14
- --label_plan 3 \
15
- --config_file "yaml/conv2d-classifier-3-l3-ch4.yaml"
16
 
17
 
18
  #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-l3-ch4-cnn \
@@ -87,10 +87,10 @@ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name fi
87
  #--config_file "yaml/conv2d-classifier-2-l3-ch32.yaml"
88
 
89
 
90
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-l3-ch32-cnn \
91
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
92
- --label_plan 3 \
93
- --config_file "yaml/conv2d-classifier-3-l3-ch32.yaml"
94
 
95
 
96
  #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-l3-ch32-cnn \
@@ -122,20 +122,20 @@ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name fi
122
  #--label_plan 2-voicemail \
123
  #--config_file "yaml/conv2d-classifier-2-l3-ch16.yaml"
124
 
125
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-2-l3-ch32-cnn \
126
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
127
- --label_plan 2-voicemail \
128
- --config_file "yaml/conv2d-classifier-2-l3-ch32.yaml"
129
 
130
 
131
  # voicemail ch4
132
 
133
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-ph-2-l3-ch4-cnn \
134
- #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-PH/wav_finished/*/*.wav" \
135
- #--label_plan 2-voicemail \
136
- #--config_file "yaml/conv2d-classifier-2-l3-ch4.yaml" \
137
- #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-ch4-cnn.zip"
138
- #
139
  #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-sg-2-l3-ch4-cnn \
140
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-SG/wav_finished/*/*.wav" \
141
  #--label_plan 2-voicemail \
@@ -148,11 +148,11 @@ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name fi
148
  #--config_file "yaml/conv2d-classifier-2-l3-ch4.yaml" \
149
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-ch4-cnn.zip"
150
 
151
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-mx-2-l3-ch4-cnn \
152
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-MX/wav_finished/*/*.wav" \
153
- --label_plan 2-voicemail \
154
- --config_file "yaml/conv2d-classifier-2-l3-ch4.yaml" \
155
- --pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-ch4-cnn.zip"
156
  #
157
  #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-pe-2-l3-ch4-cnn \
158
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-PE/wav_finished/*/*.wav" \
@@ -250,11 +250,11 @@ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name fi
250
  #--config_file "yaml/conv2d-classifier-2-l3-ch32.yaml" \
251
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-ch32-cnn.zip"
252
 
253
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-mx-2-l3-ch32-cnn \
254
- --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-MX/wav_finished/*/*.wav" \
255
- --label_plan 2-voicemail \
256
- --config_file "yaml/conv2d-classifier-2-l3-ch32.yaml" \
257
- --pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-ch32-cnn.zip"
258
 
259
  #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-pe-2-l3-ch32-cnn \
260
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-PE/wav_finished/*/*.wav" \
 
9
  #--config_file "yaml/conv2d-classifier-2-l3-ch4.yaml"
10
 
11
 
12
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-l3-ch4-cnn \
13
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
14
+ #--label_plan 3 \
15
+ #--config_file "yaml/conv2d-classifier-3-l3-ch4.yaml"
16
 
17
 
18
  #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-l3-ch4-cnn \
 
87
  #--config_file "yaml/conv2d-classifier-2-l3-ch32.yaml"
88
 
89
 
90
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-l3-ch32-cnn \
91
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
92
+ #--label_plan 3 \
93
+ #--config_file "yaml/conv2d-classifier-3-l3-ch32.yaml"
94
 
95
 
96
  #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-l3-ch32-cnn \
 
122
  #--label_plan 2-voicemail \
123
  #--config_file "yaml/conv2d-classifier-2-l3-ch16.yaml"
124
 
125
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-2-l3-ch32-cnn \
126
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
127
+ #--label_plan 2-voicemail \
128
+ #--config_file "yaml/conv2d-classifier-2-l3-ch32.yaml"
129
 
130
 
131
  # voicemail ch4
132
 
133
+ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-ph-2-l3-ch4-cnn \
134
+ --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-PH/wav_finished/*/*.wav" \
135
+ --label_plan 2-voicemail \
136
+ --config_file "yaml/conv2d-classifier-2-l3-ch4.yaml" \
137
+ --pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-ch4-cnn.zip"
138
+
139
  #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-sg-2-l3-ch4-cnn \
140
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-SG/wav_finished/*/*.wav" \
141
  #--label_plan 2-voicemail \
 
148
  #--config_file "yaml/conv2d-classifier-2-l3-ch4.yaml" \
149
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-ch4-cnn.zip"
150
 
151
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-mx-2-l3-ch4-cnn \
152
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-MX/wav_finished/*/*.wav" \
153
+ #--label_plan 2-voicemail \
154
+ #--config_file "yaml/conv2d-classifier-2-l3-ch4.yaml" \
155
+ #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-ch4-cnn.zip"
156
  #
157
  #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-pe-2-l3-ch4-cnn \
158
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-PE/wav_finished/*/*.wav" \
 
250
  #--config_file "yaml/conv2d-classifier-2-l3-ch32.yaml" \
251
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-ch32-cnn.zip"
252
 
253
+ #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-mx-2-l3-ch32-cnn \
254
+ #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-MX/wav_finished/*/*.wav" \
255
+ #--label_plan 2-voicemail \
256
+ #--config_file "yaml/conv2d-classifier-2-l3-ch32.yaml" \
257
+ #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-ch32-cnn.zip"
258
 
259
  #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-pe-2-l3-ch32-cnn \
260
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-PE/wav_finished/*/*.wav" \
examples/sound_classification_by_lstm/run.sh CHANGED
@@ -12,17 +12,17 @@ sh run.sh --stage 2 --stop_stage 2 --system_version windows --file_folder_name f
12
  E:/Users/tianx/HuggingDatasets/cc_audio_8/data/wav_finished/id-ID/wav_finished/*/*.wav" \
13
  --label_plan 4
14
 
15
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-ch32-lstm \
16
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
17
  --label_plan 3 \
18
  --config_file "yaml/lstm_classifier-3-ch64.yaml"
19
 
20
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-ch32-lstm \
21
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
22
  --label_plan 2-voicemail \
23
  --config_file "yaml/lstm_classifier-2-ch64.yaml"
24
 
25
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-ch64-lstm \
26
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
27
  --label_plan 2-voicemail \
28
  --config_file "yaml/lstm-classifier-2-ch64.yaml"
@@ -90,6 +90,7 @@ dataset="${file_dir}/dataset.xlsx"
90
  train_dataset="${file_dir}/train.xlsx"
91
  valid_dataset="${file_dir}/valid.xlsx"
92
  evaluation_file="${file_dir}/evaluation.xlsx"
 
93
  vocabulary_dir="${file_dir}/vocabulary"
94
 
95
  $verbose && echo "system_version: ${system_version}"
@@ -142,7 +143,7 @@ fi
142
 
143
 
144
  if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ]; then
145
- $verbose && echo "stage 3: test model"
146
  cd "${work_dir}" || exit 1
147
  python3 step_4_evaluation_model.py \
148
  --dataset "${dataset}" \
@@ -170,7 +171,22 @@ fi
170
 
171
 
172
  if [ ${stage} -le 5 ] && [ ${stop_stage} -ge 5 ]; then
173
- $verbose && echo "stage 5: collect files"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
174
  cd "${work_dir}" || exit 1
175
 
176
  mkdir -p ${final_model_dir}
@@ -178,7 +194,8 @@ if [ ${stage} -le 5 ] && [ ${stop_stage} -ge 5 ]; then
178
  cp "${file_dir}/best"/* "${final_model_dir}"
179
  cp -r "${file_dir}/vocabulary" "${final_model_dir}"
180
 
181
- cp "${file_dir}/evaluation.xlsx" "${final_model_dir}/evaluation.xlsx"
 
182
 
183
  cp "${file_dir}/model.onnx" "${final_model_dir}/model.onnx"
184
 
@@ -200,8 +217,8 @@ if [ ${stage} -le 5 ] && [ ${stop_stage} -ge 5 ]; then
200
  fi
201
 
202
 
203
- if [ ${stage} -le 6 ] && [ ${stop_stage} -ge 6 ]; then
204
- $verbose && echo "stage 6: clear file_dir"
205
  cd "${work_dir}" || exit 1
206
 
207
  rm -rf "${file_dir}";
 
12
  E:/Users/tianx/HuggingDatasets/cc_audio_8/data/wav_finished/id-ID/wav_finished/*/*.wav" \
13
  --label_plan 4
14
 
15
+ sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name sound-3-ch32-lstm \
16
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
17
  --label_plan 3 \
18
  --config_file "yaml/lstm_classifier-3-ch64.yaml"
19
 
20
+ sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-ch32-lstm \
21
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
22
  --label_plan 2-voicemail \
23
  --config_file "yaml/lstm_classifier-2-ch64.yaml"
24
 
25
+ sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-ch64-lstm \
26
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
27
  --label_plan 2-voicemail \
28
  --config_file "yaml/lstm-classifier-2-ch64.yaml"
 
90
  train_dataset="${file_dir}/train.xlsx"
91
  valid_dataset="${file_dir}/valid.xlsx"
92
  evaluation_file="${file_dir}/evaluation.xlsx"
93
+ evaluation_onnx_file="${file_dir}/evaluation-onnx.xlsx"
94
  vocabulary_dir="${file_dir}/vocabulary"
95
 
96
  $verbose && echo "system_version: ${system_version}"
 
143
 
144
 
145
  if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ]; then
146
+ $verbose && echo "stage 3: evaluate model"
147
  cd "${work_dir}" || exit 1
148
  python3 step_4_evaluation_model.py \
149
  --dataset "${dataset}" \
 
171
 
172
 
173
  if [ ${stage} -le 5 ] && [ ${stop_stage} -ge 5 ]; then
174
+ $verbose && echo "stage 5: evaluate onnx model"
175
+ cd "${work_dir}" || exit 1
176
+
177
+ python3 step_9_evaluation_onnx_model.py \
178
+ --model_file "null" \
179
+ --dataset "${evaluation_file}" \
180
+ --vocabulary_dir "${vocabulary_dir}" \
181
+ --model_dir "${file_dir}/best" \
182
+ --onnx_model_file "${file_dir}/model.onnx" \
183
+ --output_file "${evaluation_onnx_file}" \
184
+
185
+ fi
186
+
187
+
188
+ if [ ${stage} -le 6 ] && [ ${stop_stage} -ge 6 ]; then
189
+ $verbose && echo "stage 6: collect files"
190
  cd "${work_dir}" || exit 1
191
 
192
  mkdir -p ${final_model_dir}
 
194
  cp "${file_dir}/best"/* "${final_model_dir}"
195
  cp -r "${file_dir}/vocabulary" "${final_model_dir}"
196
 
197
+ cp "${evaluation_file}" "${final_model_dir}/evaluation.xlsx"
198
+ cp "${evaluation_onnx_file}" "${final_model_dir}/evaluation-onnx.xlsx"
199
 
200
  cp "${file_dir}/model.onnx" "${final_model_dir}/model.onnx"
201
 
 
217
  fi
218
 
219
 
220
+ if [ ${stage} -le 7 ] && [ ${stop_stage} -ge 7 ]; then
221
+ $verbose && echo "stage 7: clear file_dir"
222
  cd "${work_dir}" || exit 1
223
 
224
  rm -rf "${file_dir}";
examples/sound_classification_by_lstm/run_batch.sh CHANGED
@@ -3,22 +3,22 @@
3
 
4
  # sound ch64
5
 
6
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-2-l3-ch64-lstm \
7
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
8
  #--label_plan 2 \
9
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml"
10
  #
11
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-3-l3-ch64-lstm \
12
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
13
  #--label_plan 3 \
14
  #--config_file "yaml/lstm-classifier-3-l3-ch64.yaml"
15
  #
16
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-4-l3-ch64-lstm \
17
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
18
  #--label_plan 4 \
19
  #--config_file "yaml/lstm-classifier-4-l3-ch64.yaml"
20
  #
21
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name sound-8-l3-ch64-lstm \
22
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
23
  #--label_plan 8 \
24
  #--config_file "yaml/lstm-classifier-8-l3-ch64.yaml"
@@ -26,7 +26,7 @@
26
 
27
  # pretrained voicemail
28
 
29
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-2-l3-ch64-lstm \
30
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
31
  --label_plan 2-voicemail \
32
  --config_file "yaml/lstm-classifier-2-l3-ch64.yaml"
@@ -34,79 +34,79 @@ sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name fi
34
 
35
  # voicemail ch64
36
 
37
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-ph-2-l3-ch64-lstm \
38
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-PH/wav_finished/*/*.wav" \
39
  #--label_plan 2-voicemail \
40
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
41
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
42
  #
43
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-sg-2-l3-ch64-lstm \
44
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-SG/wav_finished/*/*.wav" \
45
  #--label_plan 2-voicemail \
46
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
47
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
48
  #
49
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-us-2-l3-ch64-lstm \
50
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-US/wav_finished/*/*.wav" \
51
  #--label_plan 2-voicemail \
52
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
53
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
54
 
55
- sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-mx-2-l3-ch64-lstm \
56
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-MX/wav_finished/*/*.wav" \
57
  --label_plan 2-voicemail \
58
  --config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
59
  --pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
60
 
61
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-pe-2-l3-ch64-lstm \
62
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-PE/wav_finished/*/*.wav" \
63
  #--label_plan 2-voicemail \
64
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
65
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
66
  #
67
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-fi-fi-2-l3-ch64-lstm \
68
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/fi-FI/wav_finished/*/*.wav" \
69
  #--label_plan 2-voicemail \
70
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
71
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
72
  #
73
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-id-id-2-l3-ch64-lstm \
74
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/id-ID/wav_finished/*/*.wav" \
75
  #--label_plan 2-voicemail \
76
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
77
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
78
  #
79
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ja-jp-2-l3-ch64-lstm \
80
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ja-JP/wav_finished/*/*.wav" \
81
  #--label_plan 2-voicemail \
82
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
83
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
84
  #
85
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ko-kr-2-l3-ch64-lstm \
86
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ko-KR/wav_finished/*/*.wav" \
87
  #--label_plan 2-voicemail \
88
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
89
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
90
  #
91
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-l3-ch64-lstm \
92
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
93
  #--label_plan 2-voicemail \
94
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
95
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
96
  #
97
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-pt-br-2-l3-ch64-lstm \
98
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/pt-BR/wav_finished/*/*.wav" \
99
  #--label_plan 2-voicemail \
100
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
101
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
102
  #
103
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-th-th-2-l3-ch64-lstm \
104
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/th-TH/wav_finished/*/*.wav" \
105
  #--label_plan 2-voicemail \
106
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
107
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
108
  #
109
- #sh run.sh --stage 0 --stop_stage 6 --system_version centos --file_folder_name file_dir --final_model_name voicemail-zh-tw-2-l3-ch64-lstm \
110
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/zh-TW/wav_finished/*/*.wav" \
111
  #--label_plan 2-voicemail \
112
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
 
3
 
4
  # sound ch64
5
 
6
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name sound-2-l3-ch64-lstm \
7
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
8
  #--label_plan 2 \
9
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml"
10
  #
11
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name sound-3-l3-ch64-lstm \
12
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
13
  #--label_plan 3 \
14
  #--config_file "yaml/lstm-classifier-3-l3-ch64.yaml"
15
  #
16
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name sound-4-l3-ch64-lstm \
17
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
18
  #--label_plan 4 \
19
  #--config_file "yaml/lstm-classifier-4-l3-ch64.yaml"
20
  #
21
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name sound-8-l3-ch64-lstm \
22
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
23
  #--label_plan 8 \
24
  #--config_file "yaml/lstm-classifier-8-l3-ch64.yaml"
 
26
 
27
  # pretrained voicemail
28
 
29
+ sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-2-l3-ch64-lstm \
30
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/*/wav_finished/*/*.wav" \
31
  --label_plan 2-voicemail \
32
  --config_file "yaml/lstm-classifier-2-l3-ch64.yaml"
 
34
 
35
  # voicemail ch64
36
 
37
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-ph-2-l3-ch64-lstm \
38
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-PH/wav_finished/*/*.wav" \
39
  #--label_plan 2-voicemail \
40
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
41
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
42
  #
43
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-sg-2-l3-ch64-lstm \
44
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-SG/wav_finished/*/*.wav" \
45
  #--label_plan 2-voicemail \
46
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
47
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
48
  #
49
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-en-us-2-l3-ch64-lstm \
50
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/en-US/wav_finished/*/*.wav" \
51
  #--label_plan 2-voicemail \
52
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
53
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
54
 
55
+ sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-mx-2-l3-ch64-lstm \
56
  --filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-MX/wav_finished/*/*.wav" \
57
  --label_plan 2-voicemail \
58
  --config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
59
  --pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
60
 
61
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-es-pe-2-l3-ch64-lstm \
62
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/es-PE/wav_finished/*/*.wav" \
63
  #--label_plan 2-voicemail \
64
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
65
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
66
  #
67
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-fi-fi-2-l3-ch64-lstm \
68
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/fi-FI/wav_finished/*/*.wav" \
69
  #--label_plan 2-voicemail \
70
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
71
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
72
  #
73
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-id-id-2-l3-ch64-lstm \
74
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/id-ID/wav_finished/*/*.wav" \
75
  #--label_plan 2-voicemail \
76
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
77
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
78
  #
79
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ja-jp-2-l3-ch64-lstm \
80
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ja-JP/wav_finished/*/*.wav" \
81
  #--label_plan 2-voicemail \
82
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
83
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
84
  #
85
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ko-kr-2-l3-ch64-lstm \
86
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ko-KR/wav_finished/*/*.wav" \
87
  #--label_plan 2-voicemail \
88
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
89
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
90
  #
91
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-ms-my-2-l3-ch64-lstm \
92
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/ms-MY/wav_finished/*/*.wav" \
93
  #--label_plan 2-voicemail \
94
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
95
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
96
  #
97
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-pt-br-2-l3-ch64-lstm \
98
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/pt-BR/wav_finished/*/*.wav" \
99
  #--label_plan 2-voicemail \
100
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
101
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
102
  #
103
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-th-th-2-l3-ch64-lstm \
104
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/th-TH/wav_finished/*/*.wav" \
105
  #--label_plan 2-voicemail \
106
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
107
  #--pretrained_model "/data/tianxing/PycharmProjects/cc_audio_8/trained_models/voicemail-2-l3-ch64-lstm.zip"
108
  #
109
+ #sh run.sh --stage 0 --stop_stage 7 --system_version centos --file_folder_name file_dir --final_model_name voicemail-zh-tw-2-l3-ch64-lstm \
110
  #--filename_patterns "/data/tianxing/PycharmProjects/datasets/voicemail/zh-TW/wav_finished/*/*.wav" \
111
  #--label_plan 2-voicemail \
112
  #--config_file "yaml/lstm-classifier-2-l3-ch64.yaml" \
examples/sound_classification_by_lstm/step_9_evaluation_onnx_model.py CHANGED
@@ -33,13 +33,19 @@ def get_args():
33
  parser = argparse.ArgumentParser()
34
  parser.add_argument(
35
  "--model_file",
36
- # default=(project_path / "trained_models/cc_audio_8.zip").as_posix(),
37
- default=(project_path / "trained_models/voicemail-ms-my-2-ch64-lstm.zip").as_posix(),
38
  type=str
39
  )
 
 
 
 
40
  parser.add_argument("--output_file", default="evaluation_onnx.xlsx", type=str)
41
  parser.add_argument("--device", default="cpu", type=str)
42
 
 
 
43
  args = parser.parse_args()
44
  return args
45
 
@@ -47,23 +53,29 @@ def get_args():
47
  def main():
48
  args = get_args()
49
 
50
- model_file = Path(args.model_file)
51
 
52
  device = torch.device(args.device)
53
 
54
- with zipfile.ZipFile(model_file, "r") as f_zip:
55
- out_root = Path(tempfile.gettempdir()) / "cc_audio_8"
56
- print(out_root.as_posix())
57
- if out_root.exists():
58
- shutil.rmtree(out_root.as_posix())
59
- out_root.mkdir(parents=True, exist_ok=True)
60
- f_zip.extractall(path=out_root)
61
-
62
- tgt_path = out_root / model_file.stem
63
- config_file = tgt_path / "config.yaml"
64
- onnx_model_file = tgt_path / "model.onnx"
65
- vocab_path = tgt_path / "vocabulary"
66
- evaluation_file = tgt_path / "evaluation.xlsx"
 
 
 
 
 
 
67
 
68
  config = WaveClassifierConfig.from_pretrained(config_file.as_posix())
69
  ort_session = ort.InferenceSession(onnx_model_file.as_posix())
@@ -87,8 +99,12 @@ def main():
87
  total_correct = 0
88
  total_examples = 0
89
 
 
90
  progress_bar = tqdm(total=len(df), desc="Evaluation ONNX")
91
  for i, row in df.iterrows():
 
 
 
92
  row = dict(row)
93
  filename = row["filename"]
94
  ground_true = row["labels"]
@@ -158,6 +174,7 @@ def main():
158
  row_[f"onnx_correct_{idx}"] = correct
159
 
160
  result.append(row_)
 
161
 
162
  total_examples += 1
163
  total_correct += row_["onnx_correct_3"]
 
33
  parser = argparse.ArgumentParser()
34
  parser.add_argument(
35
  "--model_file",
36
+ default="null",
37
+ # default=(project_path / "trained_models/voicemail-ms-my-2-ch64-lstm.zip").as_posix(),
38
  type=str
39
  )
40
+ parser.add_argument("--dataset", default="evaluation.xlsx", type=str)
41
+ parser.add_argument("--vocabulary_dir", default="vocabulary", type=str)
42
+ parser.add_argument("--model_dir", default="best", type=str)
43
+ parser.add_argument("--onnx_model_file", default="model.onnx", type=str)
44
  parser.add_argument("--output_file", default="evaluation_onnx.xlsx", type=str)
45
  parser.add_argument("--device", default="cpu", type=str)
46
 
47
+ parser.add_argument("--max_count", default=10000, type=int)
48
+
49
  args = parser.parse_args()
50
  return args
51
 
 
53
  def main():
54
  args = get_args()
55
 
56
+ model_dir = Path(args.model_dir)
57
 
58
  device = torch.device(args.device)
59
 
60
+ if args.model_file != "null":
61
+ model_file = Path(args.model_file)
62
+ with zipfile.ZipFile(model_file.as_posix(), "r") as f_zip:
63
+ out_root = Path(tempfile.gettempdir()) / "cc_audio_8"
64
+ # print(out_root.as_posix())
65
+ if out_root.exists():
66
+ shutil.rmtree(out_root.as_posix())
67
+ out_root.mkdir(parents=True, exist_ok=True)
68
+ f_zip.extractall(path=out_root)
69
+ tgt_path = out_root / model_file.stem
70
+ config_file = tgt_path / "config.yaml"
71
+ onnx_model_file = tgt_path / "model.onnx"
72
+ vocab_path = tgt_path / "vocabulary"
73
+ evaluation_file = tgt_path / "evaluation.xlsx"
74
+ else:
75
+ config_file = model_dir / "config.yaml"
76
+ onnx_model_file = args.onnx_model_file
77
+ vocab_path = args.vocabulary_dir
78
+ evaluation_file = args.dataset
79
 
80
  config = WaveClassifierConfig.from_pretrained(config_file.as_posix())
81
  ort_session = ort.InferenceSession(onnx_model_file.as_posix())
 
99
  total_correct = 0
100
  total_examples = 0
101
 
102
+ count = 0
103
  progress_bar = tqdm(total=len(df), desc="Evaluation ONNX")
104
  for i, row in df.iterrows():
105
+ if count >= args.max_count:
106
+ break
107
+
108
  row = dict(row)
109
  filename = row["filename"]
110
  ground_true = row["labels"]
 
174
  row_[f"onnx_correct_{idx}"] = correct
175
 
176
  result.append(row_)
177
+ count += 1
178
 
179
  total_examples += 1
180
  total_correct += row_["onnx_correct_3"]