Fangjun Kuang
Committed by GitHub

Build Android APK for Thai (#1036)

@@ -24,5 +24,6 @@ dotnet run -c Release \ @@ -24,5 +24,6 @@ dotnet run -c Release \
24 --encoder ./sherpa-onnx-streaming-zipformer-bilingual-zh-en-2023-02-20/encoder-epoch-99-avg-1.int8.onnx \ 24 --encoder ./sherpa-onnx-streaming-zipformer-bilingual-zh-en-2023-02-20/encoder-epoch-99-avg-1.int8.onnx \
25 --decoder ./sherpa-onnx-streaming-zipformer-bilingual-zh-en-2023-02-20/decoder-epoch-99-avg-1.int8.onnx \ 25 --decoder ./sherpa-onnx-streaming-zipformer-bilingual-zh-en-2023-02-20/decoder-epoch-99-avg-1.int8.onnx \
26 --joiner ./sherpa-onnx-streaming-zipformer-bilingual-zh-en-2023-02-20/joiner-epoch-99-avg-1.int8.onnx \ 26 --joiner ./sherpa-onnx-streaming-zipformer-bilingual-zh-en-2023-02-20/joiner-epoch-99-avg-1.int8.onnx \
  27 + --rule-fsts ./itn_zh_number.fst \
27 --decoding-method greedy_search \ 28 --decoding-method greedy_search \
28 --files ./itn-zh-number.wav 29 --files ./itn-zh-number.wav
@@ -55,13 +55,13 @@ def get_models(): @@ -55,13 +55,13 @@ def get_models():
55 short_name="whisper_tiny", 55 short_name="whisper_tiny",
56 cmd=""" 56 cmd="""
57 pushd $model_name 57 pushd $model_name
58 - rm -v tiny.en-encoder.onnx  
59 - rm -v tiny.en-decoder.onnx 58 + rm -fv tiny.en-encoder.onnx
  59 + rm -fv tiny.en-decoder.onnx
60 rm -rf test_wavs 60 rm -rf test_wavs
61 - rm -v *.py  
62 - rm -v requirements.txt  
63 - rm -v .gitignore  
64 - rm -v README.md 61 + rm -fv *.py
  62 + rm -fv requirements.txt
  63 + rm -fv .gitignore
  64 + rm -fv README.md
65 65
66 ls -lh 66 ls -lh
67 67
@@ -80,7 +80,7 @@ def get_models(): @@ -80,7 +80,7 @@ def get_models():
80 fi 80 fi
81 pushd $model_name 81 pushd $model_name
82 82
83 - rm -v README.md 83 + rm -fv README.md
84 rm -rfv test_wavs 84 rm -rfv test_wavs
85 rm model.onnx 85 rm model.onnx
86 86
@@ -102,7 +102,7 @@ def get_models(): @@ -102,7 +102,7 @@ def get_models():
102 pushd $model_name 102 pushd $model_name
103 103
104 rm -rfv test_wavs 104 rm -rfv test_wavs
105 - rm -v README.md 105 + rm -fv README.md
106 mv -v data/lang_char/tokens.txt ./ 106 mv -v data/lang_char/tokens.txt ./
107 rm -rfv data/lang_char 107 rm -rfv data/lang_char
108 108
@@ -196,6 +196,27 @@ def get_models(): @@ -196,6 +196,27 @@ def get_models():
196 popd 196 popd
197 """, 197 """,
198 ), 198 ),
  199 + Model(
  200 + model_name="sherpa-onnx-zipformer-thai-2024-06-20",
  201 + idx=12,
  202 + lang="th",
  203 + short_name="zipformer",
  204 + cmd="""
  205 + pushd $model_name
  206 +
  207 + rm -rfv test_wavs
  208 + rm -fv README.md
  209 + rm -fv bpe.model
  210 +
  211 + rm encoder-epoch-12-avg-5.onnx
  212 + rm decoder-epoch-12-avg-5.int8.onnx
  213 + rm joiner-epoch-12-avg-5.onnx
  214 +
  215 + ls -lh
  216 +
  217 + popd
  218 + """,
  219 + ),
199 ] 220 ]
200 return models 221 return models
201 222
@@ -284,6 +284,19 @@ fun getOfflineModelConfig(type: Int): OfflineModelConfig? { @@ -284,6 +284,19 @@ fun getOfflineModelConfig(type: Int): OfflineModelConfig? {
284 modelType = "tele_speech", 284 modelType = "tele_speech",
285 ) 285 )
286 } 286 }
  287 +
  288 + 12 -> {
  289 + val modelDir = "sherpa-onnx-zipformer-thai-2024-06-20"
  290 + return OfflineModelConfig(
  291 + transducer = OfflineTransducerModelConfig(
  292 + encoder = "$modelDir/encoder-epoch-12-avg-5.int8.onnx",
  293 + decoder = "$modelDir/decoder-epoch-12-avg-5.onnx",
  294 + joiner = "$modelDir/joiner-epoch-12-avg-5.int8.onnx",
  295 + ),
  296 + tokens = "$modelDir/tokens.txt",
  297 + modelType = "zipformer2",
  298 + )
  299 + }
287 } 300 }
288 return null 301 return null
289 } 302 }