Fangjun Kuang
Committed by GitHub

Upload new sense-voice models (#2580)

@@ -156,6 +156,27 @@ jobs: @@ -156,6 +156,27 @@ jobs:
156 ls -lh *.tar.bz2 156 ls -lh *.tar.bz2
157 done 157 done
158 158
  159 + - name: sense-voice
  160 + if: false
  161 + shell: bash
  162 + run: |
  163 + git lfs install
  164 + d=sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2025-09-09
  165 + f=sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09
  166 + git clone https://huggingface.co/csukuangfj/$d
  167 + git clone https://huggingface.co/csukuangfj/$f
  168 +
  169 + rm -rf $d/.git
  170 + rm -rf $f/.gi*
  171 +
  172 + rm -rf $d/.gitattributes
  173 + rm -rf $f/.gitattributes
  174 +
  175 + tar cjfv $d.tar.bz2 $d
  176 + tar cjfv $f.tar.bz2 $f
  177 +
  178 + ls -lh *.tar.bz2
  179 +
159 - name: Vietnamese (zipformer) 180 - name: Vietnamese (zipformer)
160 if: false 181 if: false
161 shell: bash 182 shell: bash
@@ -117,7 +117,7 @@ def get_2nd_models(): @@ -117,7 +117,7 @@ def get_2nd_models():
117 model_name="sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17", 117 model_name="sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17",
118 idx=15, 118 idx=15,
119 lang="zh_en_ko_ja_yue", 119 lang="zh_en_ko_ja_yue",
120 - short_name="sense_voice", 120 + short_name="sense_voice_2024_07_17_int8",
121 cmd=""" 121 cmd="""
122 pushd $model_name 122 pushd $model_name
123 123
@@ -175,6 +175,23 @@ def get_2nd_models(): @@ -175,6 +175,23 @@ def get_2nd_models():
175 popd 175 popd
176 """, 176 """,
177 ), 177 ),
  178 + Model(
  179 + model_name="sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09",
  180 + idx=41,
  181 + lang="zh_en_ko_ja_yue",
  182 + short_name="sense_voice_2025_09_09_int8",
  183 + cmd="""
  184 + pushd $model_name
  185 +
  186 + rm -rfv test_wavs
  187 + rm -fv model.onnx
  188 + rm -fv *.py
  189 +
  190 + ls -lh
  191 +
  192 + popd
  193 + """,
  194 + ),
178 ] 195 ]
179 return models 196 return models
180 197
@@ -380,6 +397,7 @@ def get_models(): @@ -380,6 +397,7 @@ def get_models():
380 "sherpa-onnx-paraformer-zh-2023-09-14", 397 "sherpa-onnx-paraformer-zh-2023-09-14",
381 "icefall-asr-zipformer-wenetspeech-20230615", 398 "icefall-asr-zipformer-wenetspeech-20230615",
382 "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17", 399 "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17",
  400 + "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09",
383 "sherpa-onnx-dolphin-base-ctc-multi-lang-int8-2025-04-02", 401 "sherpa-onnx-dolphin-base-ctc-multi-lang-int8-2025-04-02",
384 ] 402 ]
385 for first_m in first_zh: 403 for first_m in first_zh:
@@ -403,6 +421,10 @@ def get_models(): @@ -403,6 +421,10 @@ def get_models():
403 "sherpa-onnx-streaming-zipformer-en-20M-2023-02-17", 421 "sherpa-onnx-streaming-zipformer-en-20M-2023-02-17",
404 "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17", 422 "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17",
405 ), 423 ),
  424 + (
  425 + "sherpa-onnx-streaming-zipformer-en-20M-2023-02-17",
  426 + "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09",
  427 + ),
406 ] 428 ]
407 models = [] 429 models = []
408 for f, s in combinations: 430 for f, s in combinations:
@@ -99,7 +99,7 @@ def get_models(): @@ -99,7 +99,7 @@ def get_models():
99 idx=15, 99 idx=15,
100 lang="zh_en_ko_ja_yue", 100 lang="zh_en_ko_ja_yue",
101 lang2="中英粤日韩", 101 lang2="中英粤日韩",
102 - short_name="sense_voice", 102 + short_name="sense_voice_2024_07_17_int8",
103 use_hr=True, 103 use_hr=True,
104 cmd=""" 104 cmd="""
105 pushd $model_name 105 pushd $model_name
@@ -697,6 +697,23 @@ def get_models(): @@ -697,6 +697,23 @@ def get_models():
697 popd 697 popd
698 """, 698 """,
699 ), 699 ),
  700 + Model(
  701 + model_name="sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09",
  702 + idx=41,
  703 + lang="zh_en_ko_ja_yue",
  704 + lang2="中英粤日韩",
  705 + short_name="sense_voice_2025_09_09_int8",
  706 + use_hr=True,
  707 + cmd="""
  708 + pushd $model_name
  709 +
  710 + rm -rfv test_wavs
  711 +
  712 + ls -lh
  713 +
  714 + popd
  715 + """,
  716 + ),
700 ] 717 ]
701 return models 718 return models
702 719
@@ -695,6 +695,16 @@ fun getOfflineModelConfig(type: Int): OfflineModelConfig? { @@ -695,6 +695,16 @@ fun getOfflineModelConfig(type: Int): OfflineModelConfig? {
695 modelType = "nemo_transducer", 695 modelType = "nemo_transducer",
696 ) 696 )
697 } 697 }
  698 +
  699 + 41 -> {
  700 + val modelDir = "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09"
  701 + return OfflineModelConfig(
  702 + senseVoice = OfflineSenseVoiceModelConfig(
  703 + model = "$modelDir/model.int8.onnx",
  704 + ),
  705 + tokens = "$modelDir/tokens.txt",
  706 + )
  707 + }
698 } 708 }
699 return null 709 return null
700 } 710 }