Program.cs
3.5 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
// Copyright (c) 2024 Xiaomi Corporation
//
// This file shows how to do keyword spotting with sherpa-onnx.
//
// 1. Download a model from
// https://github.com/k2-fsa/sherpa-onnx/releases/tag/kws-models
//
// wget https://github.com/k2-fsa/sherpa-onnx/releases/download/kws-models/sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01.tar.bz2
// tar xvf sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01.tar.bz2
//
// 2. Now run it
//
// dotnet run
using SherpaOnnx;
/// <summary>
/// Console demo that runs a sherpa-onnx keyword spotter over one test wave
/// file three times: with the keywords file only, with one extra keyword,
/// and with two extra keywords.
/// </summary>
class KeywordSpotterDemo
{
    // Directory produced by extracting the model archive named in the file header.
    private const string ModelDir = "./sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01";

    static void Main(string[] args)
    {
        var config = new KeywordSpotterConfig();
        config.FeatConfig.SampleRate = 16000;
        config.FeatConfig.FeatureDim = 80;

        config.ModelConfig.Transducer.Encoder = ModelDir + "/encoder-epoch-12-avg-2-chunk-16-left-64.onnx";
        config.ModelConfig.Transducer.Decoder = ModelDir + "/decoder-epoch-12-avg-2-chunk-16-left-64.onnx";
        config.ModelConfig.Transducer.Joiner = ModelDir + "/joiner-epoch-12-avg-2-chunk-16-left-64.onnx";
        config.ModelConfig.Tokens = ModelDir + "/tokens.txt";
        config.ModelConfig.Provider = "cpu";
        config.ModelConfig.NumThreads = 1;
        config.ModelConfig.Debug = 1;
        config.KeywordsFile = ModelDir + "/test_wavs/test_keywords.txt";

        var kws = new KeywordSpotter(config);

        var filename = ModelDir + "/test_wavs/3.wav";
        var waveReader = new WaveReader(filename);

        // 0.3 seconds of zero-valued samples appended after the real audio
        // (presumably so the trailing frames of the utterance get decoded).
        float[] tailPadding = new float[(int)(waveReader.SampleRate * 0.3)];

        SpotKeywords(kws, waveReader, tailPadding,
            "----------Use pre-defined keywords----------");

        SpotKeywords(kws, waveReader, tailPadding,
            "----------Use pre-defined keywords + add a new keyword----------",
            "y ǎn y uán @演员");

        // Note keywords are separated by /
        SpotKeywords(kws, waveReader, tailPadding,
            "----------Use pre-defined keywords + add 2 new keywords----------",
            "y ǎn y uán @演员/zh ī m íng @知名");
    }

    /// <summary>
    /// Prints <paramref name="banner"/>, creates a fresh stream, feeds it the
    /// whole wave followed by the tail padding, and prints every keyword the
    /// spotter reports while decoding.
    /// </summary>
    /// <param name="kws">The keyword spotter to decode with.</param>
    /// <param name="waveReader">Source of the sample rate and audio samples.</param>
    /// <param name="tailPadding">Extra samples appended after the audio.</param>
    /// <param name="banner">Heading line written before decoding starts.</param>
    /// <param name="extraKeywords">
    /// Additional keywords passed to <c>CreateStream</c>, separated by '/'.
    /// When empty, the parameterless <c>CreateStream()</c> is used instead.
    /// </param>
    private static void SpotKeywords(
        KeywordSpotter kws,
        WaveReader waveReader,
        float[] tailPadding,
        string banner,
        string extraKeywords = "")
    {
        Console.WriteLine(banner);

        var stream = extraKeywords.Length == 0
            ? kws.CreateStream()
            : kws.CreateStream(extraKeywords);

        stream.AcceptWaveform(waveReader.SampleRate, waveReader.Samples);
        stream.AcceptWaveform(waveReader.SampleRate, tailPadding);
        stream.InputFinished();

        while (kws.IsReady(stream))
        {
            kws.Decode(stream);

            var result = kws.GetResult(stream);
            if (!string.IsNullOrEmpty(result.Keyword))
            {
                // Remember to call Reset() right after detecting a keyword
                kws.Reset(stream);
                Console.WriteLine($"Detected: {result.Keyword}");
            }
        }
    }
}