add c++ inference based on libtorch

2026-02-05 01:49:22 +08:00 · 2024-11-22 00:10:13 +00:00
parent 93b9782f28
commit 05e380c1de
6 changed files with 683 additions and 0 deletions
--- a/examples/cpp_libtorch/main.cc
+++ b/examples/cpp_libtorch/main.cc
@@ -0,0 +1,51 @@
+#include <iostream>
+#include "silero_torch.h"
+#include "wav.h"
+
+int main(int argc, char* argv[]) {
+
+	if(argc != 3){
+		std::cerr<<"Usage : "<<argv[0]<<" <wav.path> threshold"<<std::endl;
+		std::cerr<<"Usage : "<<argv[0]<<" sample.wav 0.38"<<std::endl;
+		return 1;
+	}
+
+	std::string wav_path = argv[1];
+	float threshold = std::stof(argv[2]);
+
+
+	//Load Model
+	std::string model_path = "../../src/silero_vad/data/silero_vad.jit";
+	silero::VadIterator vad(model_path);
+        vad.threshold=threshold;
+        vad.min_speech_duration_ms=255;
+        vad.max_duration_merge_ms=300;
+        vad.print_as_samples=true;	//if true, it prints time-stamp with sample numbers.
+					//(Default:false)
+
+	// Read wav
+	wav::WavReader wav_reader(wav_path); 
+	std::vector<float> input_wav(wav_reader.num_samples());
+
+	for (int i = 0; i < wav_reader.num_samples(); i++)
+	{
+		input_wav[i] = static_cast<float>(*(wav_reader.data() + i));
+	}
+
+	vad.SpeechProbs(input_wav);
+
+	std::vector<silero::Interval> speeches = vad.GetSpeechTimestamps();
+	for(const auto& speech : speeches){
+		if(vad.print_as_samples){
+			std::cout<<"{'start': "<<static_cast<int>(speech.start)<<", 'end': "<<static_cast<int>(speech.end)<<"}"<<std::endl;
+		}
+		else{
+			std::cout<<"{'start': "<<speech.start<<", 'end': "<<speech.end<<"}"<<std::endl;
+		}
+	}	
+
+
+	return 0;
+	}
+
+