Fix bug with speech duration calculation (#484)

Shubhrakanti · web-flow · commit b2536642a131 · 2025-06-26T11:53:52.000-07:00
diff --git a/.changeset/tall-months-doubt.md b/.changeset/tall-months-doubt.md
@@ -0,0 +1,5 @@
+---
+'@livekit/agents-plugin-silero': patch
+---
+
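+Fix speech and silence duration calculation in the Silero VAD stream (accumulate the window duration instead of the inference duration, and copy only the consumed samples into the speech buffer); also change the default `minSilenceDuration` from 250 to 550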
diff --git a/plugins/silero/src/vad.ts b/plugins/silero/src/vad.ts
@@ -35,9 +35,9 @@ export interface VADOptions {
 
 const defaultVADOptions: VADOptions = {
   minSpeechDuration: 50,
-  minSilenceDuration: 250,
+  minSilenceDuration: 550,
   prefixPaddingDuration: 500,
-  maxBufferedSpeech: 60000,
+  maxBufferedSpeech: 60000, // 60 seconds
   activationThreshold: 0.5,
   sampleRate: 16000,
   forceCPU: true,
@@ -227,7 +227,7 @@ export class VADStream extends baseStream {
 
           // copy the inference window to the speech buffer
           const availableSpace = this.#speechBuffer.length - speechBufferIndex;
-          const toCopyBuffer = Math.min(this.#model.windowSizeSamples, availableSpace);
+          const toCopyBuffer = Math.min(toCopyInt, availableSpace);
           if (toCopyBuffer > 0) {
             this.#speechBuffer.set(inputFrame.data.subarray(0, toCopyBuffer), speechBufferIndex);
             speechBufferIndex += toCopyBuffer;
@@ -250,9 +250,9 @@ export class VADStream extends baseStream {
           }
 
           if (pubSpeaking) {
-            pubSpeechDuration += inferenceDuration;
+            pubSpeechDuration += windowDuration;
           } else {
-            pubSilenceDuration += inferenceDuration;
+            pubSilenceDuration += windowDuration;
           }
 
           this.queue.put({

-Original file line number
+Diff line change
@@ @@ -0,0 +1,5 @@ @@
 +---
 +'@livekit/agents-plugin-silero': patch
 +---
++
 +bugfix with speech duration calculation