Support exporting models to onnx from 3D-Speaker (#522)

This commit is contained in:
Fangjun Kuang
2024-01-10 21:09:45 +08:00
committed by GitHub
parent 55266918c8
commit 07e2b9a36d
10 changed files with 442 additions and 14 deletions

View File

@@ -27,7 +27,7 @@ class SpeakerEmbeddingExtractorWeSpeakerImpl
FeatureExtractorConfig feat_config;
auto meta_data = model_.GetMetaData();
feat_config.sampling_rate = meta_data.sample_rate;
feat_config.normalize_samples = meta_data.normalize_features;
feat_config.normalize_samples = meta_data.normalize_samples;
return std::make_unique<OnlineStream>(feat_config);
}

View File

@@ -12,7 +12,7 @@ namespace sherpa_onnx {
// Plain aggregate holding the metadata values of a WeSpeaker
// speaker-embedding extractor model. Integer fields default to 0 and
// `language` defaults to an empty string.
// NOTE(review): presumably filled in by the model loader through the
// SHERPA_ONNX_READ_META_DATA* macros -- confirm against the Impl class.
struct SpeakerEmbeddingExtractorWeSpeakerModelMetaData {
// Looked up under the metadata key "output_dim" by the loader.
int32_t output_dim = 0;
// Looked up under the key "sample_rate"; the extractor copies it into
// FeatureExtractorConfig::sampling_rate when creating a stream.
int32_t sample_rate = 0;
// NOTE(review): this listing shows both normalize_features and
// normalize_samples. The other code visible here reads only
// normalize_samples, so normalize_features looks like the pre-rename
// line of a diff -- confirm before relying on it.
int32_t normalize_features = 0;
// Looked up under the key "normalize_samples"; the extractor copies it into
// FeatureExtractorConfig::normalize_samples when creating a stream.
int32_t normalize_samples = 0;
// Looked up under the key "language" via the string variant of the macro.
std::string language;
};

View File

@@ -61,8 +61,8 @@ class SpeakerEmbeddingExtractorWeSpeakerModel::Impl {
Ort::AllocatorWithDefaultOptions allocator; // used in the macro below
SHERPA_ONNX_READ_META_DATA(meta_data_.output_dim, "output_dim");
SHERPA_ONNX_READ_META_DATA(meta_data_.sample_rate, "sample_rate");
SHERPA_ONNX_READ_META_DATA(meta_data_.normalize_features,
"normalize_features");
SHERPA_ONNX_READ_META_DATA(meta_data_.normalize_samples,
"normalize_samples");
SHERPA_ONNX_READ_META_DATA_STR(meta_data_.language, "language");
std::string framework;