mirror of
https://github.com/snakers4/silero-vad.git
synced 2026-02-05 18:09:22 +08:00
get rid of soundfile dependency
This commit is contained in:
16
utils_vad.py
16
utils_vad.py
@@ -1,15 +1,9 @@
|
|||||||
import torch
|
import torch
|
||||||
import torchaudio
|
import torchaudio
|
||||||
from typing import List
|
from typing import List
|
||||||
from itertools import repeat
|
|
||||||
from collections import deque
|
|
||||||
import torch.nn.functional as F
|
import torch.nn.functional as F
|
||||||
import warnings
|
import warnings
|
||||||
|
|
||||||
|
|
||||||
torchaudio.set_audio_backend("soundfile") # switch backend
|
|
||||||
|
|
||||||
|
|
||||||
languages = ['ru', 'en', 'de', 'es']
|
languages = ['ru', 'en', 'de', 'es']
|
||||||
|
|
||||||
|
|
||||||
@@ -32,20 +26,20 @@ def read_audio(path: str,
|
|||||||
if wav.size(0) > 1:
|
if wav.size(0) > 1:
|
||||||
wav = wav.mean(dim=0, keepdim=True)
|
wav = wav.mean(dim=0, keepdim=True)
|
||||||
|
|
||||||
if sr != target_sr:
|
if sr != sampling_rate:
|
||||||
transform = torchaudio.transforms.Resample(orig_freq=sr,
|
transform = torchaudio.transforms.Resample(orig_freq=sr,
|
||||||
new_freq=target_sr)
|
new_freq=sampling_rate)
|
||||||
wav = transform(wav)
|
wav = transform(wav)
|
||||||
sr = target_sr
|
sr = sampling_rate
|
||||||
|
|
||||||
assert sr == target_sr
|
assert sr == sampling_rate
|
||||||
return wav.squeeze(0)
|
return wav.squeeze(0)
|
||||||
|
|
||||||
|
|
||||||
def save_audio(path: str,
|
def save_audio(path: str,
|
||||||
tensor: torch.Tensor,
|
tensor: torch.Tensor,
|
||||||
sampling_rate: int = 16000):
|
sampling_rate: int = 16000):
|
||||||
torchaudio.save(path, tensor.unsqueeze(0), sr)
|
torchaudio.save(path, tensor.unsqueeze(0), sampling_rate)
|
||||||
|
|
||||||
|
|
||||||
def init_jit_model(model_path: str,
|
def init_jit_model(model_path: str,
|
||||||
|
|||||||
Reference in New Issue
Block a user