mirror of
https://github.com/ggerganov/whisper.cpp.git
synced 2025-01-05 04:04:09 +00:00
86a277f78d
* run `go mod tidy` before building examples Running `make examples` after cloning the repository gives the following error: ``` ... [100%] Built target whisper gmake[3]: Leaving directory '/tmp/exp/whisper.cpp/bindings/go/build' gmake[2]: Leaving directory '/tmp/exp/whisper.cpp/bindings/go/build' gmake[1]: Leaving directory '/tmp/exp/whisper.cpp/bindings/go/build' Build example go-model-download Build example go-whisper examples/go-whisper/process.go:11:2: missing go.sum entry for module providing package github.com/go-audio/wav (imported by github.com/ggerganov/whisper.cpp/bindings/go/examples/go-whisper); to add: go get github.com/ggerganov/whisper.cpp/bindings/go/examples/go-whisper make: *** [Makefile:26: examples/go-whisper] Error 1 ``` * remove executable bit from various files
81 lines
1.7 KiB
Go
81 lines
1.7 KiB
Go
package main
|
|
|
|
import (
|
|
"fmt"
|
|
"io"
|
|
"os"
|
|
"time"
|
|
|
|
// Package imports
|
|
whisper "github.com/ggerganov/whisper.cpp/bindings/go/pkg/whisper"
|
|
wav "github.com/go-audio/wav"
|
|
)
|
|
|
|
func Process(model whisper.Model, path string, lang string, speedup, tokens bool) error {
|
|
var data []float32
|
|
|
|
// Create processing context
|
|
context, err := model.NewContext()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// Open the file
|
|
fh, err := os.Open(path)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer fh.Close()
|
|
|
|
// Decode the WAV file
|
|
dec := wav.NewDecoder(fh)
|
|
if buf, err := dec.FullPCMBuffer(); err != nil {
|
|
return err
|
|
} else if dec.SampleRate != whisper.SampleRate {
|
|
return fmt.Errorf("unsupported sample rate: %d", dec.SampleRate)
|
|
} else if dec.NumChans != 1 {
|
|
return fmt.Errorf("unsupported number of channels: %d", dec.NumChans)
|
|
} else {
|
|
data = buf.AsFloat32Buffer().Data
|
|
}
|
|
|
|
// Set the parameters
|
|
var cb whisper.SegmentCallback
|
|
if lang != "" {
|
|
if err := context.SetLanguage(lang); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
if speedup {
|
|
context.SetSpeedup(true)
|
|
}
|
|
if tokens {
|
|
cb = func(segment whisper.Segment) {
|
|
fmt.Printf("%02d [%6s->%6s] ", segment.Num, segment.Start.Truncate(time.Millisecond), segment.End.Truncate(time.Millisecond))
|
|
for _, token := range segment.Tokens {
|
|
fmt.Printf("%q ", token.Text)
|
|
}
|
|
fmt.Println("")
|
|
}
|
|
}
|
|
|
|
// Process the data
|
|
if err := context.Process(data, cb); err != nil {
|
|
return err
|
|
}
|
|
|
|
// Print out the results
|
|
for {
|
|
segment, err := context.NextSegment()
|
|
if err == io.EOF {
|
|
break
|
|
} else if err != nil {
|
|
return err
|
|
}
|
|
fmt.Printf("[%6s->%6s] %s\n", segment.Start.Truncate(time.Millisecond), segment.End.Truncate(time.Millisecond), segment.Text)
|
|
}
|
|
|
|
// Return success
|
|
return nil
|
|
}
|