Add C++ runtime for speaker verification models from NeMo (#527)

This commit is contained in:
Fangjun Kuang
2024-01-13 21:42:09 +08:00
committed by GitHub
parent 68a525a024
commit 2024e96639
20 changed files with 405 additions and 24 deletions

View File

@@ -28,6 +28,14 @@ struct FeatureExtractorConfig {
// If false, we will multiply the inputs by 32768
bool normalize_samples = true;
// NOTE(review): presumably controls how frames at the edges of the input
// are handled (Kaldi-style snip_edges) -- confirm against the feature
// extractor implementation, which is not visible here.
bool snip_edges = false;
float frame_shift_ms = 10.0f; // in milliseconds.
float frame_length_ms = 25.0f; // in milliseconds.
// NOTE(review): presumably the lower cutoff frequency of the mel
// filterbank, in Hz -- unit and usage are not shown here; confirm.
int32_t low_freq = 20;
// NOTE(review): presumably selects librosa-compatible feature computation;
// the code that consumes this flag is not visible here -- confirm.
bool is_librosa = false;
bool remove_dc_offset = true; // Subtract mean of wave before FFT.
// Name of the analysis window; the default is "povey".
// NOTE(review): the set of accepted names is not shown here -- confirm
// against the code that consumes this field.
std::string window_type = "povey"; // e.g. Hamming window
// Returns a std::string and does not modify this object (const).
// NOTE(review): presumably a human-readable dump of the fields above; the
// definition is not visible here.
std::string ToString() const;
// Takes a ParseOptions pointer.
// NOTE(review): presumably registers (some of) these fields as
// command-line options on `po`; the definition is not visible here.
void Register(ParseOptions *po);