Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
snakers4
GitHub Repository: snakers4/silero-vad
Path: blob/master/examples/go/cmd/main.go
1181 views
1
package main
2
3
import (
4
"log"
5
"os"
6
7
"github.com/streamer45/silero-vad-go/speech"
8
9
"github.com/go-audio/wav"
10
)
11
12
func main() {
13
sd, err := speech.NewDetector(speech.DetectorConfig{
14
ModelPath: "../../src/silero_vad/data/silero_vad.onnx",
15
SampleRate: 16000,
16
Threshold: 0.5,
17
MinSilenceDurationMs: 100,
18
SpeechPadMs: 30,
19
})
20
if err != nil {
21
log.Fatalf("failed to create speech detector: %s", err)
22
}
23
24
if len(os.Args) != 2 {
25
log.Fatalf("invalid arguments provided: expecting one file path")
26
}
27
28
f, err := os.Open(os.Args[1])
29
if err != nil {
30
log.Fatalf("failed to open sample audio file: %s", err)
31
}
32
defer f.Close()
33
34
dec := wav.NewDecoder(f)
35
36
if ok := dec.IsValidFile(); !ok {
37
log.Fatalf("invalid WAV file")
38
}
39
40
buf, err := dec.FullPCMBuffer()
41
if err != nil {
42
log.Fatalf("failed to get PCM buffer")
43
}
44
45
pcmBuf := buf.AsFloat32Buffer()
46
47
segments, err := sd.Detect(pcmBuf.Data)
48
if err != nil {
49
log.Fatalf("Detect failed: %s", err)
50
}
51
52
for _, s := range segments {
53
log.Printf("speech starts at %0.2fs", s.SpeechStartAt)
54
if s.SpeechEndAt > 0 {
55
log.Printf("speech ends at %0.2fs", s.SpeechEndAt)
56
}
57
}
58
59
err = sd.Destroy()
60
if err != nil {
61
log.Fatalf("failed to destroy detector: %s", err)
62
}
63
}
64
65