diff --git a/silero-vad.ipynb b/silero-vad.ipynb index f2d3fa2..d9c62e8 100644 --- a/silero-vad.ipynb +++ b/silero-vad.ipynb @@ -138,7 +138,10 @@ "\n", "window_size_samples = 1536 # number of samples in a single audio chunk\n", "for i in range(0, len(wav), window_size_samples):\n", - " speech_dict = vad_iterator(wav[i: i+ window_size_samples], return_seconds=True)\n", + " chunk = wav[i: i+ window_size_samples]\n", + " if len(chunk) < window_size_samples:\n", + " break\n", + " speech_dict = vad_iterator(chunk, return_seconds=True)\n", " if speech_dict:\n", " print(speech_dict, end=' ')\n", "vad_iterator.reset_states() # reset model states after each audio" @@ -158,7 +161,10 @@ "speech_probs = []\n", "window_size_samples = 1536\n", "for i in range(0, len(wav), window_size_samples):\n", - " speech_prob = model(wav[i: i+ window_size_samples], SAMPLING_RATE).item()\n", + " chunk = wav[i: i+ window_size_samples]\n", + " if len(chunk) < window_size_samples:\n", + " break\n", + " speech_prob = model(chunk, SAMPLING_RATE).item()\n", " speech_probs.append(speech_prob)\n", "vad_iterator.reset_states() # reset model states after each audio\n", "\n",