This repository has been archived on 2025-08-26. You can view files and clone it, but cannot push or open issues or pull requests.
Files
enginex-mr_series-sherpa-onnx/sherpa-onnx/csrc/features.cc

124 lines
3.3 KiB
C++
Raw Normal View History

2023-02-19 19:36:03 +08:00
// sherpa-onnx/csrc/features.cc
2023-02-18 21:35:15 +08:00
//
// Copyright (c) 2023 Xiaomi Corporation
#include "sherpa-onnx/csrc/features.h"
#include <algorithm>
#include <memory>
2023-02-19 09:57:56 +08:00
#include <mutex> // NOLINT
2023-02-19 12:45:38 +08:00
#include <sstream>
2023-02-18 21:35:15 +08:00
#include <vector>
2023-02-19 09:57:56 +08:00
#include "kaldi-native-fbank/csrc/online-feature.h"
2023-02-18 21:35:15 +08:00
namespace sherpa_onnx {
2023-02-19 12:45:38 +08:00
// Returns a human-readable description of this config in the form
// "FeatureExtractorConfig(sampling_rate=<rate>, feature_dim=<dim>)".
std::string FeatureExtractorConfig::ToString() const {
  std::ostringstream out;
  out << "FeatureExtractorConfig("
      << "sampling_rate=" << sampling_rate << ", "
      << "feature_dim=" << feature_dim << ")";
  return out.str();
}
2023-02-19 09:57:56 +08:00
// Private implementation of FeatureExtractor.
//
// Owns a knf::OnlineFbank together with the options used to build it.
// Every member function that touches fbank_ holds mutex_ for the whole
// operation, so calls on one Impl from several threads are serialized.
class FeatureExtractor::Impl {
 public:
  // Builds the fbank computer from `config`.
  //
  // Only the sampling rate and the number of mel bins come from `config`;
  // dithering is disabled and snip_edges is turned off unconditionally.
  explicit Impl(const FeatureExtractorConfig &config) {
    opts_.frame_opts.dither = 0;
    opts_.frame_opts.snip_edges = false;
    opts_.frame_opts.samp_freq = config.sampling_rate;

    // cache 100 seconds of feature frames, which is more than enough
    // for real needs
    opts_.frame_opts.max_feature_vectors = 100 * 100;

    opts_.mel_opts.num_bins = config.feature_dim;

    fbank_ = std::make_unique<knf::OnlineFbank>(opts_);
  }

  // Passes `n` samples starting at `waveform` to the fbank computer.
  void AcceptWaveform(float sampling_rate, const float *waveform, int32_t n) {
    std::lock_guard<std::mutex> lock(mutex_);
    fbank_->AcceptWaveform(sampling_rate, waveform, n);
  }

  // Tells the fbank computer that no more samples will arrive.
  void InputFinished() {
    std::lock_guard<std::mutex> lock(mutex_);
    fbank_->InputFinished();
  }

  // Returns the number of frames the fbank computer reports as ready.
  int32_t NumFramesReady() const {
    std::lock_guard<std::mutex> lock(mutex_);
    return fbank_->NumFramesReady();
  }

  // Forwards to knf::OnlineFbank::IsLastFrame for the given frame index.
  bool IsLastFrame(int32_t frame) const {
    std::lock_guard<std::mutex> lock(mutex_);
    return fbank_->IsLastFrame(frame);
  }

  // Copies frames [frame_index, frame_index + n) into one contiguous vector
  // of size n * fbank_->Dim(), frame after frame.
  //
  // Prints a message to stderr and terminates the process with exit(-1) if
  // the requested range is negative or extends past the frames that are
  // currently ready.
  std::vector<float> GetFrames(int32_t frame_index, int32_t n) const {
    // Take the lock once, before validating, so that the range check and the
    // copy below observe the same fbank_ state even if another thread calls
    // AcceptWaveform() or Reset() concurrently.
    std::lock_guard<std::mutex> lock(mutex_);

    if (frame_index < 0 || n < 0) {
      fprintf(stderr, "Invalid frame_index (%d) or n (%d)\n", frame_index, n);
      exit(-1);
    }

    const int32_t num_ready = fbank_->NumFramesReady();

    // Written as a subtraction so that frame_index + n cannot overflow.
    if (n > num_ready - frame_index) {
      fprintf(stderr, "%d + %d > %d\n", frame_index, n, num_ready);
      exit(-1);
    }

    const int32_t feature_dim = fbank_->Dim();
    std::vector<float> features(feature_dim * n);

    float *p = features.data();
    for (int32_t i = 0; i != n; ++i) {
      const float *f = fbank_->GetFrame(i + frame_index);
      std::copy(f, f + feature_dim, p);
      p += feature_dim;
    }

    return features;
  }

  // Discards the current fbank computer and replaces it with a fresh one
  // built from the same options.
  void Reset() {
    // fbank_ is read under mutex_ everywhere else, so replacing it must also
    // hold the lock; otherwise a concurrent reader could use a destroyed
    // object.
    std::lock_guard<std::mutex> lock(mutex_);
    fbank_ = std::make_unique<knf::OnlineFbank>(opts_);
  }

  // Returns the configured number of mel bins. opts_ is written only in the
  // constructor, so no locking is needed here.
  int32_t FeatureDim() const { return opts_.mel_opts.num_bins; }

 private:
  std::unique_ptr<knf::OnlineFbank> fbank_;
  knf::FbankOptions opts_;
  mutable std::mutex mutex_;  // guards fbank_
};
2023-02-19 10:39:07 +08:00
// Creates the private implementation from `config`. The remaining member
// functions of FeatureExtractor forward to that implementation.
FeatureExtractor::FeatureExtractor(
    const FeatureExtractorConfig &config /*={}*/)
    : impl_(std::make_unique<Impl>(config)) {}
2023-02-19 09:57:56 +08:00
// Defined in this translation unit, where Impl is a complete type.
// NOTE(review): presumably required because impl_ is a smart pointer to an
// Impl that is only forward-declared in the header -- confirm against
// features.h.
FeatureExtractor::~FeatureExtractor() = default;
2023-02-18 21:35:15 +08:00
void FeatureExtractor::AcceptWaveform(float sampling_rate,
const float *waveform, int32_t n) {
2023-02-19 09:57:56 +08:00
impl_->AcceptWaveform(sampling_rate, waveform, n);
2023-02-18 21:35:15 +08:00
}
2023-02-19 09:57:56 +08:00
// Forwards to Impl::InputFinished, which notifies the underlying fbank
// computer that no more samples will be supplied.
void FeatureExtractor::InputFinished() {
  impl_->InputFinished();
}
2023-02-18 21:35:15 +08:00
int32_t FeatureExtractor::NumFramesReady() const {
2023-02-19 09:57:56 +08:00
return impl_->NumFramesReady();
2023-02-18 21:35:15 +08:00
}
bool FeatureExtractor::IsLastFrame(int32_t frame) const {
2023-02-19 09:57:56 +08:00
return impl_->IsLastFrame(frame);
2023-02-18 21:35:15 +08:00
}
std::vector<float> FeatureExtractor::GetFrames(int32_t frame_index,
int32_t n) const {
2023-02-19 09:57:56 +08:00
return impl_->GetFrames(frame_index, n);
2023-02-18 21:35:15 +08:00
}
2023-02-19 09:57:56 +08:00
// Forwards to Impl::Reset, which replaces the underlying fbank computer with
// a newly constructed one that uses the same options.
void FeatureExtractor::Reset() {
  impl_->Reset();
}
// Returns the feature dimension, i.e. the number of mel bins the
// implementation was configured with.
int32_t FeatureExtractor::FeatureDim() const {
  const int32_t dim = impl_->FeatureDim();
  return dim;
}
2023-02-18 21:35:15 +08:00
} // namespace sherpa_onnx