139 lines
4.7 KiB
C++
139 lines
4.7 KiB
C++
// sherpa-onnx/jni/speaker-embedding-extractor.cc
|
|
//
|
|
// Copyright (c) 2024 Xiaomi Corporation
|
|
#include "sherpa-onnx/csrc/speaker-embedding-extractor.h"
|
|
|
|
#include "sherpa-onnx/jni/common.h"
|
|
|
|
namespace sherpa_onnx {
|
|
|
|
static SpeakerEmbeddingExtractorConfig GetSpeakerEmbeddingExtractorConfig(
|
|
JNIEnv *env, jobject config) {
|
|
SpeakerEmbeddingExtractorConfig ans;
|
|
|
|
jclass cls = env->GetObjectClass(config);
|
|
|
|
jfieldID fid = env->GetFieldID(cls, "model", "Ljava/lang/String;");
|
|
jstring s = (jstring)env->GetObjectField(config, fid);
|
|
const char *p = env->GetStringUTFChars(s, nullptr);
|
|
|
|
ans.model = p;
|
|
env->ReleaseStringUTFChars(s, p);
|
|
|
|
fid = env->GetFieldID(cls, "numThreads", "I");
|
|
ans.num_threads = env->GetIntField(config, fid);
|
|
|
|
fid = env->GetFieldID(cls, "debug", "Z");
|
|
ans.debug = env->GetBooleanField(config, fid);
|
|
|
|
fid = env->GetFieldID(cls, "provider", "Ljava/lang/String;");
|
|
s = (jstring)env->GetObjectField(config, fid);
|
|
p = env->GetStringUTFChars(s, nullptr);
|
|
ans.provider = p;
|
|
env->ReleaseStringUTFChars(s, p);
|
|
|
|
return ans;
|
|
}
|
|
|
|
} // namespace sherpa_onnx
|
|
|
|
SHERPA_ONNX_EXTERN_C
|
|
JNIEXPORT jlong JNICALL
|
|
Java_com_k2fsa_sherpa_onnx_SpeakerEmbeddingExtractor_newFromAsset(
|
|
JNIEnv *env, jobject /*obj*/, jobject asset_manager, jobject _config) {
|
|
#if __ANDROID_API__ >= 9
|
|
AAssetManager *mgr = AAssetManager_fromJava(env, asset_manager);
|
|
if (!mgr) {
|
|
SHERPA_ONNX_LOGE("Failed to get asset manager: %p", mgr);
|
|
return 0;
|
|
}
|
|
#endif
|
|
auto config = sherpa_onnx::GetSpeakerEmbeddingExtractorConfig(env, _config);
|
|
SHERPA_ONNX_LOGE("new config:\n%s", config.ToString().c_str());
|
|
|
|
auto extractor = new sherpa_onnx::SpeakerEmbeddingExtractor(
|
|
#if __ANDROID_API__ >= 9
|
|
mgr,
|
|
#endif
|
|
config);
|
|
|
|
return (jlong)extractor;
|
|
}
|
|
|
|
SHERPA_ONNX_EXTERN_C
|
|
JNIEXPORT jlong JNICALL
|
|
Java_com_k2fsa_sherpa_onnx_SpeakerEmbeddingExtractor_newFromFile(
|
|
JNIEnv *env, jobject /*obj*/, jobject _config) {
|
|
auto config = sherpa_onnx::GetSpeakerEmbeddingExtractorConfig(env, _config);
|
|
SHERPA_ONNX_LOGE("newFromFile config:\n%s", config.ToString().c_str());
|
|
|
|
if (!config.Validate()) {
|
|
SHERPA_ONNX_LOGE("Errors found in config!");
|
|
}
|
|
|
|
auto extractor = new sherpa_onnx::SpeakerEmbeddingExtractor(config);
|
|
|
|
return (jlong)extractor;
|
|
}
|
|
|
|
SHERPA_ONNX_EXTERN_C
|
|
JNIEXPORT void JNICALL
|
|
Java_com_k2fsa_sherpa_onnx_SpeakerEmbeddingExtractor_delete(JNIEnv * /*env*/,
|
|
jobject /*obj*/,
|
|
jlong ptr) {
|
|
delete reinterpret_cast<sherpa_onnx::SpeakerEmbeddingExtractor *>(ptr);
|
|
}
|
|
|
|
SHERPA_ONNX_EXTERN_C
|
|
JNIEXPORT jlong JNICALL
|
|
Java_com_k2fsa_sherpa_onnx_SpeakerEmbeddingExtractor_createStream(
|
|
JNIEnv * /*env*/, jobject /*obj*/, jlong ptr) {
|
|
std::unique_ptr<sherpa_onnx::OnlineStream> s =
|
|
reinterpret_cast<sherpa_onnx::SpeakerEmbeddingExtractor *>(ptr)
|
|
->CreateStream();
|
|
|
|
// The user is responsible to free the returned pointer.
|
|
//
|
|
// See Java_com_k2fsa_sherpa_onnx_OnlineStream_delete() from
|
|
// ./online-stream.cc
|
|
sherpa_onnx::OnlineStream *p = s.release();
|
|
return (jlong)p;
|
|
}
|
|
|
|
SHERPA_ONNX_EXTERN_C
|
|
JNIEXPORT jboolean JNICALL
|
|
Java_com_k2fsa_sherpa_onnx_SpeakerEmbeddingExtractor_isReady(JNIEnv * /*env*/,
|
|
jobject /*obj*/,
|
|
jlong ptr,
|
|
jlong stream_ptr) {
|
|
auto extractor =
|
|
reinterpret_cast<sherpa_onnx::SpeakerEmbeddingExtractor *>(ptr);
|
|
auto stream = reinterpret_cast<sherpa_onnx::OnlineStream *>(stream_ptr);
|
|
return extractor->IsReady(stream);
|
|
}
|
|
|
|
SHERPA_ONNX_EXTERN_C
|
|
JNIEXPORT jfloatArray JNICALL
|
|
Java_com_k2fsa_sherpa_onnx_SpeakerEmbeddingExtractor_compute(JNIEnv *env,
|
|
jobject /*obj*/,
|
|
jlong ptr,
|
|
jlong stream_ptr) {
|
|
auto extractor =
|
|
reinterpret_cast<sherpa_onnx::SpeakerEmbeddingExtractor *>(ptr);
|
|
auto stream = reinterpret_cast<sherpa_onnx::OnlineStream *>(stream_ptr);
|
|
|
|
std::vector<float> embedding = extractor->Compute(stream);
|
|
jfloatArray embedding_arr = env->NewFloatArray(embedding.size());
|
|
env->SetFloatArrayRegion(embedding_arr, 0, embedding.size(),
|
|
embedding.data());
|
|
return embedding_arr;
|
|
}
|
|
|
|
SHERPA_ONNX_EXTERN_C
|
|
JNIEXPORT jint JNICALL Java_com_k2fsa_sherpa_onnx_SpeakerEmbeddingExtractor_dim(
|
|
JNIEnv * /*env*/, jobject /*obj*/, jlong ptr) {
|
|
auto extractor =
|
|
reinterpret_cast<sherpa_onnx::SpeakerEmbeddingExtractor *>(ptr);
|
|
return extractor->Dim();
|
|
}
|