Add C++ runtime for speaker verification models from NeMo (#527)

2024-01-13 21:42:09 +08:00
parent 68a525a024
commit 2024e96639
20 changed files with 405 additions and 24 deletions
--- a/sherpa-onnx/csrc/features.h
+++ b/sherpa-onnx/csrc/features.h
@@ -28,6 +28,14 @@ struct FeatureExtractorConfig {
  // If false, we will multiply the inputs by 32768
  bool normalize_samples = true;

+  bool snip_edges = false;
+  float frame_shift_ms = 10.0f;   // in milliseconds.
+  float frame_length_ms = 25.0f;  // in milliseconds.
+  int32_t low_freq = 20;
+  bool is_librosa = false;
+  bool remove_dc_offset = true;       // Subtract mean of wave before FFT.
+  std::string window_type = "povey";  // Window function name, e.g. Hamming
+
  std::string ToString() const;

  void Register(ParseOptions *po);