* Add speaker embedding extractor API for HarmonyOS * Add ArkTS API for speaker identification
45 lines
1.3 KiB
C++
45 lines
1.3 KiB
C++
// sherpa-onnx/csrc/speaker-embedding-extractor-nemo-model.h
|
|
//
|
|
// Copyright (c) 2024 Xiaomi Corporation
|
|
#ifndef SHERPA_ONNX_CSRC_SPEAKER_EMBEDDING_EXTRACTOR_NEMO_MODEL_H_
|
|
#define SHERPA_ONNX_CSRC_SPEAKER_EMBEDDING_EXTRACTOR_NEMO_MODEL_H_
|
|
|
|
#include <memory>
|
|
|
|
#include "onnxruntime_cxx_api.h" // NOLINT
|
|
#include "sherpa-onnx/csrc/speaker-embedding-extractor-nemo-model-meta-data.h"
|
|
#include "sherpa-onnx/csrc/speaker-embedding-extractor.h"
|
|
|
|
namespace sherpa_onnx {
|
|
|
|
class SpeakerEmbeddingExtractorNeMoModel {
|
|
public:
|
|
explicit SpeakerEmbeddingExtractorNeMoModel(
|
|
const SpeakerEmbeddingExtractorConfig &config);
|
|
|
|
template <typename Manager>
|
|
SpeakerEmbeddingExtractorNeMoModel(
|
|
Manager *mgr, const SpeakerEmbeddingExtractorConfig &config);
|
|
|
|
~SpeakerEmbeddingExtractorNeMoModel();
|
|
|
|
const SpeakerEmbeddingExtractorNeMoModelMetaData &GetMetaData() const;
|
|
|
|
/**
|
|
* @param x A float32 tensor of shape (N, C, T)
|
|
* @param x_len A int64 tensor of shape (N,)
|
|
* @return A float32 tensor of shape (N, C)
|
|
*/
|
|
Ort::Value Compute(Ort::Value x, Ort::Value x_len) const;
|
|
|
|
OrtAllocator *Allocator() const;
|
|
|
|
private:
|
|
class Impl;
|
|
std::unique_ptr<Impl> impl_;
|
|
};
|
|
|
|
} // namespace sherpa_onnx
|
|
|
|
#endif // SHERPA_ONNX_CSRC_SPEAKER_EMBEDDING_EXTRACTOR_NEMO_MODEL_H_
|