正在显示 4 个修改的文件，包含 72 行增加和 2 行删除
| @@ -156,6 +156,27 @@ jobs: | @@ -156,6 +156,27 @@ jobs: | ||
| 156 | ls -lh *.tar.bz2 | 156 | ls -lh *.tar.bz2 |
| 157 | done | 157 | done |
| 158 | 158 | ||
| 159 | + - name: sense-voice | ||
| 160 | + if: false | ||
| 161 | + shell: bash | ||
| 162 | + run: | | ||
| 163 | + git lfs install | ||
| 164 | + d=sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2025-09-09 | ||
| 165 | + f=sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09 | ||
| 166 | + git clone https://huggingface.co/csukuangfj/$d | ||
| 167 | + git clone https://huggingface.co/csukuangfj/$f | ||
| 168 | + | ||
| 169 | + rm -rf $d/.git | ||
| 170 | + rm -rf $f/.gi* | ||
| 171 | + | ||
| 172 | + rm -rf $d/.gitattributes | ||
| 173 | + rm -rf $f/.gitattributes | ||
| 174 | + | ||
| 175 | + tar cjfv $d.tar.bz2 $d | ||
| 176 | + tar cjfv $f.tar.bz2 $f | ||
| 177 | + | ||
| 178 | + ls -lh *.tar.bz2 | ||
| 179 | + | ||
| 159 | - name: Vietnamese (zipformer) | 180 | - name: Vietnamese (zipformer) |
| 160 | if: false | 181 | if: false |
| 161 | shell: bash | 182 | shell: bash |
| @@ -117,7 +117,7 @@ def get_2nd_models(): | @@ -117,7 +117,7 @@ def get_2nd_models(): | ||
| 117 | model_name="sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17", | 117 | model_name="sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17", |
| 118 | idx=15, | 118 | idx=15, |
| 119 | lang="zh_en_ko_ja_yue", | 119 | lang="zh_en_ko_ja_yue", |
| 120 | - short_name="sense_voice", | 120 | + short_name="sense_voice_2024_07_17_int8", |
| 121 | cmd=""" | 121 | cmd=""" |
| 122 | pushd $model_name | 122 | pushd $model_name |
| 123 | 123 | ||
| @@ -175,6 +175,23 @@ def get_2nd_models(): | @@ -175,6 +175,23 @@ def get_2nd_models(): | ||
| 175 | popd | 175 | popd |
| 176 | """, | 176 | """, |
| 177 | ), | 177 | ), |
| 178 | + Model( | ||
| 179 | + model_name="sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09", | ||
| 180 | + idx=41, | ||
| 181 | + lang="zh_en_ko_ja_yue", | ||
| 182 | + short_name="sense_voice_2025_09_09_int8", | ||
| 183 | + cmd=""" | ||
| 184 | + pushd $model_name | ||
| 185 | + | ||
| 186 | + rm -rfv test_wavs | ||
| 187 | + rm -fv model.onnx | ||
| 188 | + rm -fv *.py | ||
| 189 | + | ||
| 190 | + ls -lh | ||
| 191 | + | ||
| 192 | + popd | ||
| 193 | + """, | ||
| 194 | + ), | ||
| 178 | ] | 195 | ] |
| 179 | return models | 196 | return models |
| 180 | 197 | ||
| @@ -380,6 +397,7 @@ def get_models(): | @@ -380,6 +397,7 @@ def get_models(): | ||
| 380 | "sherpa-onnx-paraformer-zh-2023-09-14", | 397 | "sherpa-onnx-paraformer-zh-2023-09-14", |
| 381 | "icefall-asr-zipformer-wenetspeech-20230615", | 398 | "icefall-asr-zipformer-wenetspeech-20230615", |
| 382 | "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17", | 399 | "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17", |
| 400 | + "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09", | ||
| 383 | "sherpa-onnx-dolphin-base-ctc-multi-lang-int8-2025-04-02", | 401 | "sherpa-onnx-dolphin-base-ctc-multi-lang-int8-2025-04-02", |
| 384 | ] | 402 | ] |
| 385 | for first_m in first_zh: | 403 | for first_m in first_zh: |
| @@ -403,6 +421,10 @@ def get_models(): | @@ -403,6 +421,10 @@ def get_models(): | ||
| 403 | "sherpa-onnx-streaming-zipformer-en-20M-2023-02-17", | 421 | "sherpa-onnx-streaming-zipformer-en-20M-2023-02-17", |
| 404 | "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17", | 422 | "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-2024-07-17", |
| 405 | ), | 423 | ), |
| 424 | + ( | ||
| 425 | + "sherpa-onnx-streaming-zipformer-en-20M-2023-02-17", | ||
| 426 | + "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09", | ||
| 427 | + ), | ||
| 406 | ] | 428 | ] |
| 407 | models = [] | 429 | models = [] |
| 408 | for f, s in combinations: | 430 | for f, s in combinations: |
| @@ -99,7 +99,7 @@ def get_models(): | @@ -99,7 +99,7 @@ def get_models(): | ||
| 99 | idx=15, | 99 | idx=15, |
| 100 | lang="zh_en_ko_ja_yue", | 100 | lang="zh_en_ko_ja_yue", |
| 101 | lang2="中英粤日韩", | 101 | lang2="中英粤日韩", |
| 102 | - short_name="sense_voice", | 102 | + short_name="sense_voice_2024_07_17_int8", |
| 103 | use_hr=True, | 103 | use_hr=True, |
| 104 | cmd=""" | 104 | cmd=""" |
| 105 | pushd $model_name | 105 | pushd $model_name |
| @@ -697,6 +697,23 @@ def get_models(): | @@ -697,6 +697,23 @@ def get_models(): | ||
| 697 | popd | 697 | popd |
| 698 | """, | 698 | """, |
| 699 | ), | 699 | ), |
| 700 | + Model( | ||
| 701 | + model_name="sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09", | ||
| 702 | + idx=41, | ||
| 703 | + lang="zh_en_ko_ja_yue", | ||
| 704 | + lang2="中英粤日韩", | ||
| 705 | + short_name="sense_voice_2025_09_09_int8", | ||
| 706 | + use_hr=True, | ||
| 707 | + cmd=""" | ||
| 708 | + pushd $model_name | ||
| 709 | + | ||
| 710 | + rm -rfv test_wavs | ||
| 711 | + | ||
| 712 | + ls -lh | ||
| 713 | + | ||
| 714 | + popd | ||
| 715 | + """, | ||
| 716 | + ), | ||
| 700 | ] | 717 | ] |
| 701 | return models | 718 | return models |
| 702 | 719 |
| @@ -695,6 +695,16 @@ fun getOfflineModelConfig(type: Int): OfflineModelConfig? { | @@ -695,6 +695,16 @@ fun getOfflineModelConfig(type: Int): OfflineModelConfig? { | ||
| 695 | modelType = "nemo_transducer", | 695 | modelType = "nemo_transducer", |
| 696 | ) | 696 | ) |
| 697 | } | 697 | } |
| 698 | + | ||
| 699 | + 41 -> { | ||
| 700 | + val modelDir = "sherpa-onnx-sense-voice-zh-en-ja-ko-yue-int8-2025-09-09" | ||
| 701 | + return OfflineModelConfig( | ||
| 702 | + senseVoice = OfflineSenseVoiceModelConfig( | ||
| 703 | + model = "$modelDir/model.int8.onnx", | ||
| 704 | + ), | ||
| 705 | + tokens = "$modelDir/tokens.txt", | ||
| 706 | + ) | ||
| 707 | + } | ||
| 698 | } | 708 | } |
| 699 | return null | 709 | return null |
| 700 | } | 710 | } |
-
请注册或登录后发表评论