Skip to content

Commit 095343a

Browse files
committed
[update] perf kws & melotts & vad model setup.
1 parent 801d692 commit 095343a

6 files changed

Lines changed: 15 additions & 12 deletions

File tree

projects/llm_framework/main_kws/mode_sherpa-onnx-kws-zipformer-gigaspeech-3.3M-2024-01-01.json

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -13,9 +13,9 @@
1313
"kws.bool"
1414
],
1515
"mode_param":{
16-
"model_config.transducer.encoder":"encoder-epoch-12-avg-2-chunk-16-left-64.int8.onnx",
17-
"model_config.transducer.decoder":"decoder-epoch-12-avg-2-chunk-16-left-64.onnx",
18-
"model_config.transducer.joiner":"joiner-epoch-12-avg-2-chunk-16-left-64.int8.onnx",
16+
"model_config.transducer.encoder":"encoder-epoch-12-avg-2-chunk-16-left-64.int8.ort",
17+
"model_config.transducer.decoder":"decoder-epoch-12-avg-2-chunk-16-left-64.ort",
18+
"model_config.transducer.joiner":"joiner-epoch-12-avg-2-chunk-16-left-64.int8.ort",
1919
"model_config.tokens":"tokens.txt",
2020
"model_config.modeling_unit":"cjkchar",
2121
"keywords_file":"keywords.txt",

projects/llm_framework/main_kws/mode_sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01.json

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -12,10 +12,10 @@
1212
"output_type":[
1313
"kws.bool"
1414
],
15-
"mode_param":{
16-
"model_config.transducer.encoder":"encoder-epoch-12-avg-2-chunk-16-left-64.int8.onnx",
17-
"model_config.transducer.decoder":"decoder-epoch-12-avg-2-chunk-16-left-64.onnx",
18-
"model_config.transducer.joiner":"joiner-epoch-12-avg-2-chunk-16-left-64.int8.onnx",
15+
"mode_param": {
16+
"model_config.transducer.encoder":"encoder-epoch-12-avg-2-chunk-16-left-64.int8.ort",
17+
"model_config.transducer.decoder":"decoder-epoch-12-avg-2-chunk-16-left-64.ort",
18+
"model_config.transducer.joiner":"joiner-epoch-12-avg-2-chunk-16-left-64.int8.ort",
1919
"model_config.tokens":"tokens.txt",
2020
"model_config.modeling_unit":"cjkchar",
2121
"keywords_file":"keywords.txt",

projects/llm_framework/main_melotts/SConstruct

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -26,6 +26,9 @@ REQUIREMENTS += ['onnxruntime', 'samplerate']
2626
INCLUDE += [ADir('../include')]
2727
INCLUDE += [ADir('src/runner'), ADir('../include/onnxruntime/core/session')]
2828

29+
LINK_SEARCH_PATH += [ADir('../static_lib/sherpa/onnx')]
30+
LDFLAGS += ['-l:libcargs.a', '-l:libonnxruntime.a']
31+
2932
STATIC_FILES += Glob('mode_*.json')
3033

3134
env['COMPONENTS'].append({'target':'llm_melotts',

projects/llm_framework/main_melotts/mode_melotts-zh-cn.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@
1212
"sys.play.0_1"
1313
],
1414
"mode_param": {
15-
"encoder": "encoder.onnx",
15+
"encoder": "encoder.ort",
1616
"decoder": "decoder.axmodel",
1717
"gbin": "g.bin",
1818
"tokens": "tokens.txt",

projects/llm_framework/main_vad/mode_silero-vad-model.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@
1212
"vad.bool"
1313
],
1414
"mode_param": {
15-
"silero_vad.model": "silero_vad.onnx"
15+
"silero_vad.model": "silero_vad.ort"
1616
},
1717
"mode_param_bak": {
1818
"silero_vad.threshold": 0.5,

projects/llm_framework/tools/llm_pack.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -289,14 +289,14 @@ def create_bin_deb(package_name, version, src_folder, revision = 'm5stack1'):
289289
create_data_deb('llm-audio-zh-cn', data_version, src_folder, revision)
290290
create_data_deb('llm-sherpa-ncnn-streaming-zipformer-20M-2023-02-17', data_version, src_folder, revision)
291291
create_data_deb('llm-sherpa-ncnn-streaming-zipformer-zh-14M-2023-02-23', data_version, src_folder, revision)
292-
create_data_deb('llm-sherpa-onnx-kws-zipformer-gigaspeech-3.3M-2024-01-01', data_version, src_folder, revision)
293-
create_data_deb('llm-sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01', data_version, src_folder, revision)
292+
create_data_deb('llm-sherpa-onnx-kws-zipformer-gigaspeech-3.3M-2024-01-01', '0.3', src_folder, revision)
293+
create_data_deb('llm-sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01', '0.3', src_folder, revision)
294294
# create_data_deb('llm-qwen2-0.5B-prefill-20e', data_version, src_folder, revision)
295295
# create_data_deb('llm-qwen2-1.5B-prefill-20e', data_version, src_folder, revision)
296296
create_data_deb('llm-qwen2.5-0.5B-prefill-20e', data_version, src_folder, revision)
297297
create_data_deb('llm-single-speaker-english-fast', data_version, src_folder, revision)
298298
create_data_deb('llm-single-speaker-fast', data_version, src_folder, revision)
299-
create_data_deb('llm-melotts-zh-cn', data_version, src_folder, revision)
299+
create_data_deb('llm-melotts-zh-cn', '0.3', src_folder, revision)
300300
create_data_deb('llm-yolo11n', data_version, src_folder, revision)
301301
create_data_deb('llm-yolo11n-pose', data_version, src_folder, revision)
302302
create_data_deb('llm-yolo11n-seg', data_version, src_folder, revision)

0 commit comments

Comments
 (0)