mirror of
https://github.com/snakers4/silero-vad.git
synced 2026-02-04 09:29:22 +08:00
Compare commits
11 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
| | be95df9152 | | |
| | ec56fe50a5 | | |
| | dea5980320 | | |
| | 90d9ce7695 | | |
| | c56dbb11ac | | |
| | 9b686893ad | | |
| | 6979fbd535 | | |
| | 1cff663de5 | | |
| | bfdc019302 | | |
| | c0c0ffa0c5 | | |
| | 556a442942 | | |
1
.github/workflows/test.yml
vendored
1
.github/workflows/test.yml
vendored
```diff
@@ -24,6 +24,7 @@ jobs:
 run: |
 python -m pip install --upgrade pip
 pip install build hatchling pytest soundfile
+pip install .[test]
 
 - name: Build package
 run: python -m build --wheel --outdir dist
```
```diff
@@ -3,7 +3,7 @@ requires = ["hatchling"]
 build-backend = "hatchling.build"
 [project]
 name = "silero-vad"
-version = "6.1.0"
+version = "6.2.0"
 authors = [
 {name="Silero Team", email="hello@silero.ai"},
 ]
```
```diff
@@ -37,3 +37,10 @@ dependencies = [
 [project.urls]
 Homepage = "https://github.com/snakers4/silero-vad"
 Issues = "https://github.com/snakers4/silero-vad/issues"
+
+[project.optional-dependencies]
+test = [
+"pytest",
+"soundfile",
+"torch<2.9",
+]
```
Binary file not shown.
Binary file not shown.
Binary file not shown.
```diff
@@ -223,7 +223,7 @@ def get_speech_timestamps(audio: torch.Tensor,
 progress_tracking_callback: Callable[[float], None] = None,
 neg_threshold: float = None,
 window_size_samples: int = 512,
-min_silence_at_max_speech: float = 98,
+min_silence_at_max_speech: int = 98,
 use_max_poss_sil_at_max_speech: bool = True):
 
 """
```
```diff
@@ -272,7 +272,7 @@ def get_speech_timestamps(audio: torch.Tensor,
 neg_threshold: float (default = threshold - 0.15)
 Negative threshold (noise or exit threshold). If model's current state is SPEECH, values BELOW this value are considered as NON-SPEECH.
 
-min_silence_at_max_speech: float (default - 98ms)
+min_silence_at_max_speech: int (default - 98ms)
 Minimum silence duration in ms which is used to avoid abrupt cuts when max_speech_duration_s is reached
 
 use_max_poss_sil_at_max_speech: bool (default - True)
```
Reference in New Issue
Block a user