Toggle navigation
Toggle navigation
此项目
正在载入...
Sign in
xuning
/
sherpaonnx
转到一个项目
Toggle navigation
项目
群组
代码片段
帮助
Toggle navigation pinning
Project
Activity
Repository
Pipelines
Graphs
Issues
0
Merge Requests
0
Wiki
Network
Create a new issue
Builds
Commits
Authored by
Fangjun Kuang
2024-12-24 16:56:49 +0800
Browse Files
Options
Browse Files
Download
Email Patches
Plain Diff
Committed by
GitHub
2024-12-24 16:56:49 +0800
Commit
08d771337baad95717e1ebb68a468568f2505fe2
08d77133
1 parent
fe3265aa
Add a byte-level BPE Chinese+English non-streaming zipformer model (#1645)
显示空白字符变更
内嵌
并排对比
正在显示
5 个修改的文件
包含
127 行增加
和
0 行删除
.github/scripts/test-python.sh
.github/workflows/add-new-asr-models.yaml
harmony-os/SherpaOnnxVadAsr/entry/src/main/ets/pages/NonStreamingAsrModels.ets
scripts/apk/generate-vad-asr-apk-script.py
sherpa-onnx/kotlin-api/OfflineRecognizer.kt
.github/scripts/test-python.sh
查看文件 @
08d7713
...
...
@@ -8,6 +8,27 @@ log() {
echo
-e
"
$(
date
'+%Y-%m-%d %H:%M:%S'
)
(
${
fname
}
:
${
BASH_LINENO
[0]
}
:
${
FUNCNAME
[1]
}
)
$*
"
}
# Smoke test: non-streaming zipformer transducer (byte-level BPE, Chinese+English).
# Fetches the released model archive, unpacks it, decodes the three bundled
# test wavs with greedy search, and finally removes the unpacked directory.
log "test offline zipformer (byte-level bpe, Chinese+English)"

# The archive name and the directory it unpacks to share this stem.
repo=sherpa-onnx-zipformer-zh-en-2023-11-22

curl -SL -O "https://github.com/k2-fsa/sherpa-onnx/releases/download/asr-models/${repo}.tar.bz2"
tar xvf "${repo}.tar.bz2"
rm "${repo}.tar.bz2"

# int8 encoder/joiner are used together with the regular (non-int8) decoder.
./python-api-examples/offline-decode-files.py \
  --tokens="${repo}/tokens.txt" \
  --encoder="${repo}/encoder-epoch-34-avg-19.int8.onnx" \
  --decoder="${repo}/decoder-epoch-34-avg-19.onnx" \
  --joiner="${repo}/joiner-epoch-34-avg-19.int8.onnx" \
  --num-threads=2 \
  --decoding-method=greedy_search \
  --debug=true \
  "${repo}/test_wavs/0.wav" \
  "${repo}/test_wavs/1.wav" \
  "${repo}/test_wavs/2.wav"

# Remove the unpacked model directory once decoding is done.
rm -rf "${repo}"
log
"test offline Moonshine"
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/asr-models/sherpa-onnx-moonshine-tiny-en-int8.tar.bz2
...
...
.github/workflows/add-new-asr-models.yaml
0 → 100644
查看文件 @
08d7713
# Manually triggered workflow that packages an ASR model downloaded from
# Hugging Face into a .tar.bz2 archive and uploads it to the "asr-models"
# release of k2-fsa/sherpa-onnx.
name: add-new-asr-models

on:
  # push:
  #   branches:
  #     - new-asr-models

  workflow_dispatch:

# Only one run per ref; a newer run cancels the one in progress.
concurrency:
  group: add-new-asr-models-${{ github.ref }}
  cancel-in-progress: true

jobs:
  add-new-asr-models:
    runs-on: ${{ matrix.os }}
    name: New asr models
    strategy:
      fail-fast: false
      matrix:
        os:
          - ubuntu-latest

    steps:
      - uses: actions/checkout@v4
        with:
          fetch-depth: 0

      # Collect tokens, bbpe model, fp32 + int8 ONNX files and three test wavs
      # into one directory, then archive it under the release name.
      - name: Download icefall-asr-zipformer-multi-zh-en-2023-11-22
        shell: bash
        run: |
          d=sherpa-onnx-zipformer-zh-en-2023-11-22
          mkdir $d
          pushd $d
          wget -q https://huggingface.co/zrjin/icefall-asr-zipformer-multi-zh-en-2023-11-22/resolve/main/data/lang_bbpe_2000/tokens.txt
          wget -q https://huggingface.co/zrjin/icefall-asr-zipformer-multi-zh-en-2023-11-22/resolve/main/data/lang_bbpe_2000/bbpe.model
          wget -q https://huggingface.co/zrjin/icefall-asr-zipformer-multi-zh-en-2023-11-22/resolve/main/exp/decoder-epoch-34-avg-19.onnx
          wget -q https://huggingface.co/zrjin/icefall-asr-zipformer-multi-zh-en-2023-11-22/resolve/main/exp/encoder-epoch-34-avg-19.int8.onnx
          wget -q https://huggingface.co/zrjin/icefall-asr-zipformer-multi-zh-en-2023-11-22/resolve/main/exp/encoder-epoch-34-avg-19.onnx
          wget -q https://huggingface.co/zrjin/icefall-asr-zipformer-multi-zh-en-2023-11-22/resolve/main/exp/joiner-epoch-34-avg-19.int8.onnx
          wget -q https://huggingface.co/zrjin/icefall-asr-zipformer-multi-zh-en-2023-11-22/resolve/main/exp/joiner-epoch-34-avg-19.onnx

          mkdir test_wavs
          cd test_wavs
          wget -O 0.wav -q https://huggingface.co/zrjin/icefall-asr-zipformer-multi-zh-en-2023-11-22/resolve/main/test_wavs/_1634_210_2577_1_1525157964032_3712259_29.wav
          wget -O 1.wav -q https://huggingface.co/zrjin/icefall-asr-zipformer-multi-zh-en-2023-11-22/resolve/main/test_wavs/_1634_210_2577_1_1525157964032_3712259_55.wav
          wget -O 2.wav -q https://huggingface.co/zrjin/icefall-asr-zipformer-multi-zh-en-2023-11-22/resolve/main/test_wavs/_1634_210_2577_1_1525157964032_3712259_75.wav

          popd

          tar cvjf $d.tar.bz2 $d
          ls -lh $d
          rm -rf $d

      # Upload every archive produced above, replacing same-named assets.
      - name: Release
        uses: svenstaro/upload-release-action@v2
        with:
          file_glob: true
          file: ./*.tar.bz2
          overwrite: true
          repo_name: k2-fsa/sherpa-onnx
          repo_token: ${{ secrets.UPLOAD_GH_SHERPA_ONNX_TOKEN }}
          tag: asr-models
...
...
harmony-os/SherpaOnnxVadAsr/entry/src/main/ets/pages/NonStreamingAsrModels.ets
查看文件 @
08d7713
...
...
@@ -229,6 +229,18 @@ export function getOfflineModelConfig(type: number): OfflineModelConfig {
break;
}
case 23: {
const modelDir = "sherpa-onnx-zipformer-zh-en-2023-11-22";
c.transducer.encoder = `${modelDir}/encoder-epoch-34-avg-19.int8.onnx`;
c.transducer.decoder = `${modelDir}/decoder-epoch-34-avg-19.onnx`;
c.transducer.joiner = `${modelDir}/joiner-epoch-34-avg-19.int8.onnx`;
c.tokens = `${modelDir}/tokens.txt`;
c.modelType = "transducer";
break;
}
default: {
console.log(`Please specify a supported type. Given type ${type}`);
}
...
...
scripts/apk/generate-vad-asr-apk-script.py
查看文件 @
08d7713
...
...
@@ -423,6 +423,26 @@ def get_models():
popd
"""
,
),
Model
(
model_name
=
"sherpa-onnx-zipformer-zh-en-2023-11-22"
,
idx
=
23
,
lang
=
"zh_en"
,
lang2
=
"Chinese,English"
,
short_name
=
"zipformer"
,
cmd
=
"""
pushd $model_name
rm -rfv test_wavs
rm -fv encoder-epoch-34-avg-19.onnx
rm -fv joiner-epoch-34-avg-19.onnx
rm -fv bbpe.model
ls -lh
popd
"""
,
),
]
return
models
...
...
sherpa-onnx/kotlin-api/OfflineRecognizer.kt
查看文件 @
08d7713
...
...
@@ -451,6 +451,19 @@ fun getOfflineModelConfig(type: Int): OfflineModelConfig? {
tokens = "$modelDir/tokens.txt",
)
}
23 -> {
val modelDir = "sherpa-onnx-zipformer-zh-en-2023-11-22"
return OfflineModelConfig(
transducer = OfflineTransducerModelConfig(
encoder = "$modelDir/encoder-epoch-34-avg-19.int8.onnx",
decoder = "$modelDir/decoder-epoch-34-avg-19.onnx",
joiner = "$modelDir/joiner-epoch-34-avg-19.int8.onnx",
),
tokens = "$modelDir/tokens.txt",
modelType = "transducer",
)
}
}
return null
}
...
...
请
注册
或
登录
后发表评论