Merge pull request #719 from snakers4/adamnsandle

Adamnsandle
fx workflow
2026-02-04 09:29:22 +08:00 · 2025-11-06 11:25:49 +03:00 · 2025-11-06 08:18:46 +00:00 · 2025-11-06 08:04:02 +00:00 · 2025-11-06 07:49:44 +00:00 · 2025-11-06 07:36:38 +00:00
6 changed files with 11 additions and 3 deletions
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -24,6 +24,7 @@ jobs:
      run: |
        python -m pip install --upgrade pip
        pip install build hatchling pytest soundfile
+        pip install .[test]

    - name: Build package
      run: python -m build --wheel --outdir dist
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -3,7 +3,7 @@ requires = ["hatchling"]
 build-backend = "hatchling.build"
 [project]
 name = "silero-vad"
-version = "6.1.0"
+version = "6.2.0"
 authors = [
  {name="Silero Team", email="hello@silero.ai"},
 ]
@@ -37,3 +37,10 @@ dependencies = [
 [project.urls]
 Homepage = "https://github.com/snakers4/silero-vad"
 Issues = "https://github.com/snakers4/silero-vad/issues"
+
+[project.optional-dependencies]
+test = [
+    "pytest",
+    "soundfile",
+    "torch<2.9",
+]
--- a/src/silero_vad/data/silero_vad.jit
+++ b/src/silero_vad/data/silero_vad.jit
--- a/src/silero_vad/data/silero_vad.onnx
+++ b/src/silero_vad/data/silero_vad.onnx
--- a/src/silero_vad/data/silero_vad_16k_op15.onnx
+++ b/src/silero_vad/data/silero_vad_16k_op15.onnx
--- a/src/silero_vad/utils_vad.py
+++ b/src/silero_vad/utils_vad.py
@@ -223,7 +223,7 @@ def get_speech_timestamps(audio: torch.Tensor,
                          progress_tracking_callback: Callable[[float], None] = None,
                          neg_threshold: float = None,
                          window_size_samples: int = 512,
-                          min_silence_at_max_speech: float = 98,
+                          min_silence_at_max_speech: int = 98,
                          use_max_poss_sil_at_max_speech: bool = True):

    """
@@ -272,7 +272,7 @@ def get_speech_timestamps(audio: torch.Tensor,
    neg_threshold: float (default = threshold - 0.15)
        Negative threshold (noise or exit threshold). If model's current state is SPEECH, values BELOW this value are considered as NON-SPEECH.

-    min_silence_at_max_speech: float (default - 98ms)
+    min_silence_at_max_speech: int (default - 98ms)
        Minimum silence duration in ms which is used to avoid abrupt cuts when max_speech_duration_s is reached

    use_max_poss_sil_at_max_speech: bool (default - True)
Author	SHA1	Message	Date
Dimitrii Voronin	be95df9152	Merge pull request #719 from snakers4/adamnsandle Adamnsandle	2025-11-06 11:25:49 +03:00
adamnsandle	ec56fe50a5	fx workflow	2025-11-06 08:18:46 +00:00
adamnsandle	dea5980320	fx workflow	2025-11-06 08:04:02 +00:00
adamnsandle	90d9ce7695	fx workflow	2025-11-06 07:49:44 +00:00
adamnsandle	c56dbb11ac	Merge branch 'master' of github.com:snakers4/silero-vad into adamnsandle	2025-11-06 07:36:38 +00:00
adamnsandle	9b686893ad	fx test workflow	2025-11-06 07:36:23 +00:00
Dimitrii Voronin	6979fbd535	Merge pull request #717 from snakers4/adamnsandle v6.2.0 release	2025-11-06 10:28:00 +03:00
adamnsandle	1cff663de5	fix version to 6.2.0	2025-11-06 07:27:07 +00:00
adamnsandle	bfdc019302	add v6.2 model	2025-11-06 07:23:43 +00:00
Alexander Veysov	c0c0ffa0c5	Merge pull request #714 from Purfview/patch-4 Fix type hint for min_silence_at_max_speech (float -> int)	2025-11-05 08:44:00 +03:00
Purfview	556a442942	Fix type hint for min_silence_at_max_speech (float -> int)	2025-11-04 08:30:01 +00:00