whisper.cpp

Running

djojoz commited on Oct 15, 2023

Commit

8e7b807

unverified ·

1 Parent(s): d676563

binding : Expose the audio_ctx param through the Go binding (#1368)

* expose the audio_ctx param through the go binding

* expose the audio_ctx param to the go binding context

Files changed (3) hide show

bindings/go/params.go CHANGED Viewed

@@ -118,6 +118,11 @@ func (p *Params) SetMaxTokensPerSegment(n int) {
 	p.max_tokens = C.int(n)
 }
 ///////////////////////////////////////////////////////////////////////////////
 // PRIVATE METHODS
@@ -141,6 +146,7 @@ func (p *Params) String() string {
 	str += fmt.Sprintf(" n_max_text_ctx=%d", p.n_max_text_ctx)
 	str += fmt.Sprintf(" offset_ms=%d", p.offset_ms)
 	str += fmt.Sprintf(" duration_ms=%d", p.duration_ms)
 	if p.translate {
 		str += " translate"
 	}

 	p.max_tokens = C.int(n)
 }
+// Set audio encoder context
+func (p *Params) SetAudioCtx(n int) {
+	p.audio_ctx = C.int(n)
+}
 ///////////////////////////////////////////////////////////////////////////////
 // PRIVATE METHODS
 	str += fmt.Sprintf(" n_max_text_ctx=%d", p.n_max_text_ctx)
 	str += fmt.Sprintf(" offset_ms=%d", p.offset_ms)
 	str += fmt.Sprintf(" duration_ms=%d", p.duration_ms)
+	str += fmt.Sprintf(" audio_ctx=%d", p.audio_ctx)
 	if p.translate {
 		str += " translate"
 	}

bindings/go/pkg/whisper/context.go CHANGED Viewed

@@ -82,7 +82,7 @@ func (context *context) SetSpeedup(v bool) {
 }
 func (context *context) SetSplitOnWord(v bool) {
-        context.params.SetSplitOnWord(v)
 }
 // Set number of threads to use
@@ -125,6 +125,11 @@ func (context *context) SetMaxTokensPerSegment(n uint) {
 	context.params.SetMaxTokensPerSegment(int(n))
 }
 // ResetTimings resets the mode timings. Should be called before processing
 func (context *context) ResetTimings() {
 	context.model.ctx.Whisper_reset_timings()

 }
 func (context *context) SetSplitOnWord(v bool) {
+	context.params.SetSplitOnWord(v)
 }
 // Set number of threads to use
 	context.params.SetMaxTokensPerSegment(int(n))
 }
+// Set audio encoder context
+func (context *context) SetAudioCtx(n uint) {
+	context.params.SetAudioCtx(int(n))
+}
 // ResetTimings resets the mode timings. Should be called before processing
 func (context *context) ResetTimings() {
 	context.model.ctx.Whisper_reset_timings()

bindings/go/pkg/whisper/interface.go CHANGED Viewed

@@ -48,6 +48,7 @@ type Context interface {
 	SetMaxSegmentLength(uint)     // Set max segment length in characters
 	SetTokenTimestamps(bool)      // Set token timestamps flag
 	SetMaxTokensPerSegment(uint)  // Set max tokens per segment (0 = no limit)
 	// Process mono audio data and return any errors.
 	// If defined, newly generated segments are passed to the

 	SetMaxSegmentLength(uint)     // Set max segment length in characters
 	SetTokenTimestamps(bool)      // Set token timestamps flag
 	SetMaxTokensPerSegment(uint)  // Set max tokens per segment (0 = no limit)
+	SetAudioCtx(uint)             // Set audio encoder context
 	// Process mono audio data and return any errors.
 	// If defined, newly generated segments are passed to the