Committed by
GitHub
speaker-identification-with-vad-non-streaming-asr.py: Add missing support for sense_voice. (#1884)
正在显示
1 个修改的文件
包含
16 行增加
和
0 行删除
| @@ -185,6 +185,13 @@ def register_non_streaming_asr_model_args(parser): | @@ -185,6 +185,13 @@ def register_non_streaming_asr_model_args(parser): | ||
| 185 | help="Feature dimension. Must match the one expected by the model", | 185 | help="Feature dimension. Must match the one expected by the model", |
| 186 | ) | 186 | ) |
| 187 | 187 | ||
| 188 | + parser.add_argument( | ||
| 189 | + "--sense-voice", | ||
| 190 | + default="", | ||
| 191 | + type=str, | ||
| 192 | + help="Path to sense voice model", | ||
| 193 | + ) | ||
| 194 | + | ||
| 188 | 195 | ||
| 189 | def get_args(): | 196 | def get_args(): |
| 190 | parser = argparse.ArgumentParser( | 197 | parser = argparse.ArgumentParser( |
| @@ -317,6 +324,15 @@ def create_recognizer(args) -> sherpa_onnx.OfflineRecognizer: | @@ -317,6 +324,15 @@ def create_recognizer(args) -> sherpa_onnx.OfflineRecognizer: | ||
| 317 | task=args.whisper_task, | 324 | task=args.whisper_task, |
| 318 | tail_paddings=args.whisper_tail_paddings, | 325 | tail_paddings=args.whisper_tail_paddings, |
| 319 | ) | 326 | ) |
| 327 | + elif args.sense_voice: | ||
| 328 | + assert_file_exists(args.sense_voice) | ||
| 329 | + recognizer = sherpa_onnx.OfflineRecognizer.from_sense_voice( | ||
| 330 | + model=args.sense_voice, | ||
| 331 | + tokens=args.tokens, | ||
| 332 | + num_threads=args.num_threads, | ||
| 333 | + use_itn=True, | ||
| 334 | + debug=args.debug, | ||
| 335 | + ) | ||
| 320 | else: | 336 | else: |
| 321 | raise ValueError("Please specify at least one model") | 337 | raise ValueError("Please specify at least one model") |
| 322 | 338 |
-
请 注册 或 登录 后发表评论