From 6e6da04e7af6207e526bf87fd8c5111f42199a04 Mon Sep 17 00:00:00 2001 From: adamnsandle Date: Wed, 9 Oct 2024 08:49:39 +0000 Subject: [PATCH 1/2] fix pyaudio streaming example --- examples/pyaudio-streaming/README.md | 2 + .../pyaudio-streaming-examples.ipynb | 76 ++++++++++++------- 2 files changed, 52 insertions(+), 26 deletions(-) diff --git a/examples/pyaudio-streaming/README.md b/examples/pyaudio-streaming/README.md index 33e4760..c83bb78 100644 --- a/examples/pyaudio-streaming/README.md +++ b/examples/pyaudio-streaming/README.md @@ -7,6 +7,8 @@ It has been designed as a low-level example for binary real-time streaming using Currently, the notebook consits of two examples: - One that records audio of a predefined length from the microphone, process it with Silero-VAD, and plots it afterwards. - The other one plots the speech probabilities in real-time (using jupyterplot) and records the audio until you press enter. + + This example does not work in google colab! For local usage only. ## Example Video for the Real-Time Visualization diff --git a/examples/pyaudio-streaming/pyaudio-streaming-examples.ipynb b/examples/pyaudio-streaming/pyaudio-streaming-examples.ipynb index 94c8240..e4f6ff3 100644 --- a/examples/pyaudio-streaming/pyaudio-streaming-examples.ipynb +++ b/examples/pyaudio-streaming/pyaudio-streaming-examples.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "markdown", - "id": "62a0cccb", + "id": "b3e57018", "metadata": {}, "source": [ "# Pyaudio Microphone Streaming Examples\n", @@ -12,12 +12,14 @@ "I created it as an example on how binary data from a stream could be feed into Silero VAD.\n", "\n", "\n", - "Has been tested on Ubuntu 21.04 (x86). After you installed the dependencies below, no additional setup is required." + "Has been tested on Ubuntu 21.04 (x86). After you installed the dependencies below, no additional setup is required.\n", + "\n", + "This notebook does not work in google colab! For local usage only." ] }, { "cell_type": "markdown", - "id": "64cbe1eb", + "id": "fceba3a7", "metadata": {}, "source": [ "## Dependencies\n", @@ -26,9 +28,14 @@ }, { "cell_type": "code", - "execution_count": null, - "id": "57bc2aac", - "metadata": {}, + "execution_count": 1, + "id": "efe93780", + "metadata": { + "ExecuteTime": { + "end_time": "2024-10-09T08:47:34.056898Z", + "start_time": "2024-10-09T08:47:34.053418Z" + } + }, "outputs": [], "source": [ "#!pip install numpy==2.0.2\n", @@ -36,12 +43,12 @@ "#!pip install matplotlib==3.9.2\n", "#!pip install torchaudio==2.4.1\n", "#!pip install soundfile==0.12.1\n", - "#!pip install pyaudio==0.2.11" + "#!apt install python3-pyaudio (linux) or pip install pyaudio (windows)" ] }, { "cell_type": "markdown", - "id": "110de761", + "id": "8bfc4a6f", "metadata": {}, "source": [ "## Imports" @@ -49,10 +56,27 @@ }, { "cell_type": "code", - "execution_count": null, - "id": "5a647d8d", - "metadata": {}, - "outputs": [], + "execution_count": 2, + "id": "adb0a385", + "metadata": { + "ExecuteTime": { + "end_time": "2024-10-09T08:47:39.005032Z", + "start_time": "2024-10-09T08:47:36.489952Z" + } + }, + "outputs": [ + { + "ename": "ModuleNotFoundError", + "evalue": "No module named 'pyaudio'", + "output_type": "error", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mModuleNotFoundError\u001b[0m Traceback (most recent call last)", + "Cell \u001b[0;32mIn[2], line 8\u001b[0m\n\u001b[1;32m 6\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mmatplotlib\u001b[39;00m\n\u001b[1;32m 7\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mmatplotlib\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01mpylab\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m \u001b[38;5;21;01mplt\u001b[39;00m\n\u001b[0;32m----> 8\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mpyaudio\u001b[39;00m\n", + "\u001b[0;31mModuleNotFoundError\u001b[0m: No module named 'pyaudio'" + ] + } + ], "source": [ "import io\n", "import numpy as np\n", @@ -67,7 +91,7 @@ { "cell_type": "code", "execution_count": null, - "id": "725d7066", + "id": "cff8154c", "metadata": {}, "outputs": [], "source": [ @@ -79,7 +103,7 @@ { "cell_type": "code", "execution_count": null, - "id": "1c0b2ea7", + "id": "b7251534", "metadata": {}, "outputs": [], "source": [ @@ -92,7 +116,7 @@ }, { "cell_type": "markdown", - "id": "f9112603", + "id": "bea37012", "metadata": {}, "source": [ "### Helper Methods" @@ -101,7 +125,7 @@ { "cell_type": "code", "execution_count": null, - "id": "5abc6330", + "id": "cfc5e492", "metadata": {}, "outputs": [], "source": [ @@ -124,7 +148,7 @@ }, { "cell_type": "markdown", - "id": "5124095e", + "id": "e893068b", "metadata": {}, "source": [ "## Pyaudio Set-up" @@ -133,7 +157,7 @@ { "cell_type": "code", "execution_count": null, - "id": "a845356e", + "id": "1463d9e7", "metadata": {}, "outputs": [], "source": [ @@ -147,7 +171,7 @@ }, { "cell_type": "markdown", - "id": "0b910c99", + "id": "3f44a55a", "metadata": {}, "source": [ "## Simple Example\n", @@ -157,7 +181,7 @@ { "cell_type": "code", "execution_count": null, - "id": "9d3d2c10", + "id": "b363165c", "metadata": {}, "outputs": [], "source": [ @@ -167,7 +191,7 @@ { "cell_type": "code", "execution_count": null, - "id": "3cb44a4a", + "id": "3a7a187c", "metadata": {}, "outputs": [], "source": [ @@ -207,7 +231,7 @@ }, { "cell_type": "markdown", - "id": "a3dda982", + "id": "1b4fc36a", "metadata": {}, "source": [ "## Real Time Visualization\n", @@ -220,7 +244,7 @@ { "cell_type": "code", "execution_count": null, - "id": "05ef4100", + "id": "f398cf2d", "metadata": {}, "outputs": [], "source": [ @@ -230,7 +254,7 @@ { "cell_type": "code", "execution_count": null, - "id": "d1d4cdd6", + "id": "d5e26840", "metadata": {}, "outputs": [], "source": [ @@ -287,7 +311,7 @@ { "cell_type": "code", "execution_count": null, - "id": "1e398009", + "id": "9f348860", "metadata": {}, "outputs": [], "source": [ @@ -311,7 +335,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.9.10" + "version": "3.10.14" }, "toc": { "base_numbering": 1, From 001d57d6ff799d9fc112902501142f5ff22f344e Mon Sep 17 00:00:00 2001 From: adamnsandle Date: Wed, 9 Oct 2024 09:26:39 +0000 Subject: [PATCH 2/2] fx dependencies --- .../pyaudio-streaming-examples.ipynb | 44 +++++++++---------- 1 file changed, 22 insertions(+), 22 deletions(-) diff --git a/examples/pyaudio-streaming/pyaudio-streaming-examples.ipynb b/examples/pyaudio-streaming/pyaudio-streaming-examples.ipynb index e4f6ff3..4a577d4 100644 --- a/examples/pyaudio-streaming/pyaudio-streaming-examples.ipynb +++ b/examples/pyaudio-streaming/pyaudio-streaming-examples.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "markdown", - "id": "b3e57018", + "id": "76aa55ba", "metadata": {}, "source": [ "# Pyaudio Microphone Streaming Examples\n", @@ -19,7 +19,7 @@ }, { "cell_type": "markdown", - "id": "fceba3a7", + "id": "4a4e15c2", "metadata": {}, "source": [ "## Dependencies\n", @@ -29,7 +29,7 @@ { "cell_type": "code", "execution_count": 1, - "id": "efe93780", + "id": "24205cce", "metadata": { "ExecuteTime": { "end_time": "2024-10-09T08:47:34.056898Z", @@ -38,17 +38,17 @@ }, "outputs": [], "source": [ - "#!pip install numpy==2.0.2\n", - "#!pip install torch==2.4.1\n", - "#!pip install matplotlib==3.9.2\n", - "#!pip install torchaudio==2.4.1\n", + "#!pip install numpy>=1.24.0\n", + "#!pip install torch>=1.12.0\n", + "#!pip install matplotlib>=3.6.0\n", + "#!pip install torchaudio>=0.12.0\n", "#!pip install soundfile==0.12.1\n", "#!apt install python3-pyaudio (linux) or pip install pyaudio (windows)" ] }, { "cell_type": "markdown", - "id": "8bfc4a6f", + "id": "cd22818f", "metadata": {}, "source": [ "## Imports" @@ -57,7 +57,7 @@ { "cell_type": "code", "execution_count": 2, - "id": "adb0a385", + "id": "994d7f3a", "metadata": { "ExecuteTime": { "end_time": "2024-10-09T08:47:39.005032Z", @@ -91,7 +91,7 @@ { "cell_type": "code", "execution_count": null, - "id": "cff8154c", + "id": "ac5c52f7", "metadata": {}, "outputs": [], "source": [ @@ -103,7 +103,7 @@ { "cell_type": "code", "execution_count": null, - "id": "b7251534", + "id": "ad5919dc", "metadata": {}, "outputs": [], "source": [ @@ -116,7 +116,7 @@ }, { "cell_type": "markdown", - "id": "bea37012", + "id": "784d1ab6", "metadata": {}, "source": [ "### Helper Methods" @@ -125,7 +125,7 @@ { "cell_type": "code", "execution_count": null, - "id": "cfc5e492", + "id": "af4bca64", "metadata": {}, "outputs": [], "source": [ @@ -148,7 +148,7 @@ }, { "cell_type": "markdown", - "id": "e893068b", + "id": "ca13e514", "metadata": {}, "source": [ "## Pyaudio Set-up" @@ -157,7 +157,7 @@ { "cell_type": "code", "execution_count": null, - "id": "1463d9e7", + "id": "75f99022", "metadata": {}, "outputs": [], "source": [ @@ -171,7 +171,7 @@ }, { "cell_type": "markdown", - "id": "3f44a55a", + "id": "4da7d2ef", "metadata": {}, "source": [ "## Simple Example\n", @@ -181,7 +181,7 @@ { "cell_type": "code", "execution_count": null, - "id": "b363165c", + "id": "6fe77661", "metadata": {}, "outputs": [], "source": [ @@ -191,7 +191,7 @@ { "cell_type": "code", "execution_count": null, - "id": "3a7a187c", + "id": "23f4da3e", "metadata": {}, "outputs": [], "source": [ @@ -231,7 +231,7 @@ }, { "cell_type": "markdown", - "id": "1b4fc36a", + "id": "fd243e8f", "metadata": {}, "source": [ "## Real Time Visualization\n", @@ -244,7 +244,7 @@ { "cell_type": "code", "execution_count": null, - "id": "f398cf2d", + "id": "d36980c2", "metadata": {}, "outputs": [], "source": [ @@ -254,7 +254,7 @@ { "cell_type": "code", "execution_count": null, - "id": "d5e26840", + "id": "5607b616", "metadata": {}, "outputs": [], "source": [ @@ -311,7 +311,7 @@ { "cell_type": "code", "execution_count": null, - "id": "9f348860", + "id": "dc4f0108", "metadata": {}, "outputs": [], "source": [