run-whisper.sh
1.3 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
#!/usr/bin/env bash
set -ex
dart pub get
if [ ! -f ./sherpa-onnx-whisper-tiny/tiny-encoder.int8.onnx ]; then
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/asr-models/sherpa-onnx-whisper-tiny.tar.bz2
tar xvf sherpa-onnx-whisper-tiny.tar.bz2
rm sherpa-onnx-whisper-tiny.tar.bz2
fi
# Download test WAV files
waves=(
# ar-arabic.wav
# bg-bulgarian.wav
# cs-czech.wav
# da-danish.wav
# de-german.wav
# el-greek.wav
en-english.wav
es-spanish.wav
# fa-persian.wav
# fi-finnish.wav
# fr-french.wav
# hi-hindi.wav
# hr-croatian.wav
# id-indonesian.wav
# it-italian.wav
# ja-japanese.wav
# ko-korean.wav
# nl-dutch.wav
# no-norwegian.wav
# pl-polish.wav
# pt-portuguese.wav
# ro-romanian.wav
ru-russian.wav
# sk-slovak.wav
# sv-swedish.wav
# ta-tamil.wav
# tl-tagalog.wav
# tr-turkish.wav
# uk-ukrainian.wav
zh-chinese.wav
)
for wav in ${waves[@]}; do
if [ ! -f ./$wav ]; then
echo "Downloading $wav"
curl -SL -O https://hf-mirror.com/spaces/k2-fsa/spoken-language-identification/resolve/main/test_wavs/$wav
fi
echo "Testing $wav"
dart run \
./bin/spoken_language_identification.dart \
--encoder ./sherpa-onnx-whisper-tiny/tiny-encoder.int8.onnx \
--decoder ./sherpa-onnx-whisper-tiny/tiny-decoder.int8.onnx \
--wav ./$wav
echo "----------------------------------------"
done