Add runtime support for wespeaker models (#516)
This commit is contained in:
74
sherpa-onnx/csrc/speaker-embedding-extractor.cc
Normal file
74
sherpa-onnx/csrc/speaker-embedding-extractor.cc
Normal file
@@ -0,0 +1,74 @@
|
||||
// sherpa-onnx/csrc/speaker-embedding-extractor.cc
|
||||
//
|
||||
// Copyright (c) 2023 Xiaomi Corporation
|
||||
|
||||
#include "sherpa-onnx/csrc/speaker-embedding-extractor.h"
|
||||
|
||||
#include <vector>
|
||||
|
||||
#include "sherpa-onnx/csrc/file-utils.h"
|
||||
#include "sherpa-onnx/csrc/macros.h"
|
||||
#include "sherpa-onnx/csrc/speaker-embedding-extractor-impl.h"
|
||||
|
||||
namespace sherpa_onnx {
|
||||
|
||||
// Registers every field of this config with the given option parser.
//
// @param po  Parser that receives the options. It is dereferenced
//            unconditionally, so it must not be null.
void SpeakerEmbeddingExtractorConfig::Register(ParseOptions *po) {
  ParseOptions &opts = *po;

  // Location of the model.
  opts.Register("model", &model, "Path to the speaker embedding model.");

  // Runtime knobs.
  opts.Register("num-threads", &num_threads,
                "Number of threads to run the neural network");
  opts.Register("debug", &debug,
                "true to print model information while loading it.");
  opts.Register("provider", &provider,
                "Specify a provider to use: cpu, cuda, coreml");
}
|
||||
|
||||
bool SpeakerEmbeddingExtractorConfig::Validate() const {
|
||||
if (model.empty()) {
|
||||
SHERPA_ONNX_LOGE("Please provide --speaker-embedding-model");
|
||||
return false;
|
||||
}
|
||||
|
||||
if (!FileExists(model)) {
|
||||
SHERPA_ONNX_LOGE("--speaker-embedding-model: %s does not exist",
|
||||
model.c_str());
|
||||
return false;
|
||||
}
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
// Builds a single-line, human-readable description of this config in the
// form SpeakerEmbeddingExtractorConfig(model="...", num_threads=..., ...).
//
// @return The formatted description.
std::string SpeakerEmbeddingExtractorConfig::ToString() const {
  // The boolean is spelled True/False rather than streamed as 1/0.
  const char *debug_text = debug ? "True" : "False";

  std::ostringstream out;
  out << "SpeakerEmbeddingExtractorConfig("
      << "model=\"" << model << "\", "
      << "num_threads=" << num_threads << ", "
      << "debug=" << debug_text << ", "
      << "provider=\"" << provider << "\")";
  return out.str();
}
|
||||
|
||||
// Constructs the extractor by asking SpeakerEmbeddingExtractorImpl::Create()
// for an implementation that matches `config`; all other members of this
// class forward to that implementation.
//
// @param config  Configuration handed to the implementation factory.
SpeakerEmbeddingExtractor::SpeakerEmbeddingExtractor(
    const SpeakerEmbeddingExtractorConfig &config)
    : impl_(SpeakerEmbeddingExtractorImpl::Create(config)) {
}
|
||||
|
||||
// Defaulted destructor, defined in this translation unit where
// speaker-embedding-extractor-impl.h is included.
// NOTE(review): presumably kept out of the header so that impl_ is destroyed
// where the implementation type is complete -- confirm against the header.
SpeakerEmbeddingExtractor::~SpeakerEmbeddingExtractor() = default;
|
||||
|
||||
// Returns the value reported by the implementation's Dim().
int32_t SpeakerEmbeddingExtractor::Dim() const {
  return impl_->Dim();
}
|
||||
|
||||
std::unique_ptr<OnlineStream> SpeakerEmbeddingExtractor::CreateStream() const {
|
||||
return impl_->CreateStream();
|
||||
}
|
||||
|
||||
// Forwards the readiness query for stream `s` to the implementation.
//
// @param s  Stream to query; passed through unchanged.
// @return Whatever the implementation's IsReady(s) returns.
bool SpeakerEmbeddingExtractor::IsReady(OnlineStream *s) const {
  const bool ready = impl_->IsReady(s);
  return ready;
}
|
||||
|
||||
// Forwards the computation for stream `s` to the implementation.
//
// @param s  Stream to process; passed through unchanged.
// @return The float vector produced by the implementation's Compute(s).
std::vector<float> SpeakerEmbeddingExtractor::Compute(
    OnlineStream *s) const {
  return impl_->Compute(s);
}
|
||||
|
||||
} // namespace sherpa_onnx
|
||||
Reference in New Issue
Block a user