luffy
Committed by GitHub

speaker-identification-with-vad-non-streaming-asr.py: add missing support for sense_voice (#1884)

@@ -185,6 +185,13 @@ def register_non_streaming_asr_model_args(parser): @@ -185,6 +185,13 @@ def register_non_streaming_asr_model_args(parser):
185 help="Feature dimension. Must match the one expected by the model", 185 help="Feature dimension. Must match the one expected by the model",
186 ) 186 )
187 187
  188 + parser.add_argument(
  189 + "--sense-voice",
  190 + default="",
  191 + type=str,
  192 + help="Path to sense voice model",
  193 + )
  194 +
188 195
189 def get_args(): 196 def get_args():
190 parser = argparse.ArgumentParser( 197 parser = argparse.ArgumentParser(
@@ -317,6 +324,15 @@ def create_recognizer(args) -> sherpa_onnx.OfflineRecognizer: @@ -317,6 +324,15 @@ def create_recognizer(args) -> sherpa_onnx.OfflineRecognizer:
317 task=args.whisper_task, 324 task=args.whisper_task,
318 tail_paddings=args.whisper_tail_paddings, 325 tail_paddings=args.whisper_tail_paddings,
319 ) 326 )
  327 + elif args.sense_voice:
  328 + assert_file_exists(args.sense_voice)
  329 + recognizer = sherpa_onnx.OfflineRecognizer.from_sense_voice(
  330 + model=args.sense_voice,
  331 + tokens=args.tokens,
  332 + num_threads=args.num_threads,
  333 + use_itn=True,
  334 + debug=args.debug,
  335 + )
320 else: 336 else:
321 raise ValueError("Please specify at least one model") 337 raise ValueError("Please specify at least one model")
322 338