Support not using external buffers for node-addon (#925)
This commit is contained in:
2
.github/scripts/node-addon/run.sh
vendored
2
.github/scripts/node-addon/run.sh
vendored
@@ -18,7 +18,7 @@ fi
|
|||||||
SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" ./CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
|
SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" ./CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
|
||||||
echo "SHERPA_ONNX_VERSION $SHERPA_ONNX_VERSION"
|
echo "SHERPA_ONNX_VERSION $SHERPA_ONNX_VERSION"
|
||||||
|
|
||||||
# SHERPA_ONNX_VERSION=1.0.25
|
# SHERPA_ONNX_VERSION=1.0.27
|
||||||
|
|
||||||
if [ -z $owner ]; then
|
if [ -z $owner ]; then
|
||||||
owner=k2-fsa
|
owner=k2-fsa
|
||||||
|
|||||||
2
.github/workflows/npm-addon.yaml
vendored
2
.github/workflows/npm-addon.yaml
vendored
@@ -55,7 +55,7 @@ jobs:
|
|||||||
|
|
||||||
SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" ./CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
|
SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" ./CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
|
||||||
echo "SHERPA_ONNX_VERSION $SHERPA_ONNX_VERSION"
|
echo "SHERPA_ONNX_VERSION $SHERPA_ONNX_VERSION"
|
||||||
# SHERPA_ONNX_VERSION=1.0.25
|
# SHERPA_ONNX_VERSION=1.0.27
|
||||||
|
|
||||||
src_dir=.github/scripts/node-addon
|
src_dir=.github/scripts/node-addon
|
||||||
sed -i.bak s/SHERPA_ONNX_VERSION/$SHERPA_ONNX_VERSION/g $src_dir/package.json
|
sed -i.bak s/SHERPA_ONNX_VERSION/$SHERPA_ONNX_VERSION/g $src_dir/package.json
|
||||||
|
|||||||
@@ -1,5 +1,5 @@
|
|||||||
{
|
{
|
||||||
"dependencies": {
|
"dependencies": {
|
||||||
"sherpa-onnx-node": "^1.0.25"
|
"sherpa-onnx-node": "^1.0.27"
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -24,7 +24,12 @@ const tts = createOfflineTts();
|
|||||||
const text = 'Alles hat ein Ende, nur die Wurst hat zwei.'
|
const text = 'Alles hat ein Ende, nur die Wurst hat zwei.'
|
||||||
|
|
||||||
let start = Date.now();
|
let start = Date.now();
|
||||||
const audio = tts.generate({text: text, sid: 0, speed: 1.0});
|
const audio = tts.generate({
|
||||||
|
text: text,
|
||||||
|
sid: 0,
|
||||||
|
speed: 1.0,
|
||||||
|
enableExternalBuffer: true,
|
||||||
|
});
|
||||||
let stop = Date.now();
|
let stop = Date.now();
|
||||||
const elapsed_seconds = (stop - start) / 1000;
|
const elapsed_seconds = (stop - start) / 1000;
|
||||||
const duration = audio.samples.length / audio.sampleRate;
|
const duration = audio.samples.length / audio.sampleRate;
|
||||||
|
|||||||
@@ -99,7 +99,7 @@ function do_check() {
|
|||||||
;;
|
;;
|
||||||
2)
|
2)
|
||||||
echo "Check all files"
|
echo "Check all files"
|
||||||
files=$(find $sherpa_onnx_dir/sherpa-onnx -name "*.h" -o -name "*.cc")
|
files=$(find $sherpa_onnx_dir/sherpa-onnx/csrc $sherpa_onnx_dir/sherpa-onnx/python $sherpa_onnx_dir/scripts/node-addon-api/src $sherpa_onnx_dir/sherpa-onnx/jni $sherpa_onnx_dir/sherpa-onnx/c-api -name "*.h" -o -name "*.cc")
|
||||||
;;
|
;;
|
||||||
*)
|
*)
|
||||||
echo "Check last commit"
|
echo "Check last commit"
|
||||||
|
|||||||
@@ -18,9 +18,9 @@ class SpeakerEmbeddingExtractor {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// return a float32 array
|
// return a float32 array
|
||||||
compute(stream) {
|
compute(stream, enableExternalBuffer = true) {
|
||||||
return addon.speakerEmbeddingExtractorComputeEmbedding(
|
return addon.speakerEmbeddingExtractorComputeEmbedding(
|
||||||
this.handle, stream.handle);
|
this.handle, stream.handle, enableExternalBuffer);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
@@ -11,8 +11,9 @@ class CircularBuffer {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// return a float32 array
|
// return a float32 array
|
||||||
get(startIndex, n) {
|
get(startIndex, n, enableExternalBuffer = true) {
|
||||||
return addon.circularBufferGet(this.handle, startIndex, n);
|
return addon.circularBufferGet(
|
||||||
|
this.handle, startIndex, n, enableExternalBuffer);
|
||||||
}
|
}
|
||||||
|
|
||||||
pop(n) {
|
pop(n) {
|
||||||
@@ -48,23 +49,23 @@ config = {
|
|||||||
}
|
}
|
||||||
|
|
||||||
acceptWaveform(samples) {
|
acceptWaveform(samples) {
|
||||||
addon.voiceActivityDetectorAcceptWaveform(this.handle, samples)
|
addon.voiceActivityDetectorAcceptWaveform(this.handle, samples);
|
||||||
}
|
}
|
||||||
|
|
||||||
isEmpty() {
|
isEmpty() {
|
||||||
return addon.voiceActivityDetectorIsEmpty(this.handle)
|
return addon.voiceActivityDetectorIsEmpty(this.handle);
|
||||||
}
|
}
|
||||||
|
|
||||||
isDetected() {
|
isDetected() {
|
||||||
return addon.voiceActivityDetectorIsDetected(this.handle)
|
return addon.voiceActivityDetectorIsDetected(this.handle);
|
||||||
}
|
}
|
||||||
|
|
||||||
pop() {
|
pop() {
|
||||||
addon.voiceActivityDetectorPop(this.handle)
|
addon.voiceActivityDetectorPop(this.handle);
|
||||||
}
|
}
|
||||||
|
|
||||||
clear() {
|
clear() {
|
||||||
addon.VoiceActivityDetectorClearWrapper(this.handle)
|
addon.VoiceActivityDetectorClearWrapper(this.handle);
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
@@ -73,12 +74,12 @@ config = {
|
|||||||
start: a int32
|
start: a int32
|
||||||
}
|
}
|
||||||
*/
|
*/
|
||||||
front() {
|
front(enableExternalBuffer = true) {
|
||||||
return addon.voiceActivityDetectorFront(this.handle)
|
return addon.voiceActivityDetectorFront(this.handle, enableExternalBuffer);
|
||||||
}
|
}
|
||||||
|
|
||||||
reset() {
|
reset() {
|
||||||
return addon.VoiceActivityDetectorResetWrapper(this.handle)
|
return addon.VoiceActivityDetectorResetWrapper(this.handle);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
@@ -2,6 +2,7 @@
|
|||||||
//
|
//
|
||||||
// Copyright (c) 2024 Xiaomi Corporation
|
// Copyright (c) 2024 Xiaomi Corporation
|
||||||
|
|
||||||
|
#include <algorithm>
|
||||||
#include <sstream>
|
#include <sstream>
|
||||||
|
|
||||||
#include "macros.h" // NOLINT
|
#include "macros.h" // NOLINT
|
||||||
@@ -265,6 +266,13 @@ static Napi::Object OfflineTtsGenerateWrapper(const Napi::CallbackInfo &info) {
|
|||||||
return {};
|
return {};
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool enable_external_buffer = true;
|
||||||
|
if (obj.Has("enableExternalBuffer") &&
|
||||||
|
obj.Get("enableExternalBuffer").IsBoolean()) {
|
||||||
|
enable_external_buffer =
|
||||||
|
obj.Get("enableExternalBuffer").As<Napi::Boolean>().Value();
|
||||||
|
}
|
||||||
|
|
||||||
Napi::String _text = obj.Get("text").As<Napi::String>();
|
Napi::String _text = obj.Get("text").As<Napi::String>();
|
||||||
std::string text = _text.Utf8Value();
|
std::string text = _text.Utf8Value();
|
||||||
int32_t sid = obj.Get("sid").As<Napi::Number>().Int32Value();
|
int32_t sid = obj.Get("sid").As<Napi::Number>().Int32Value();
|
||||||
@@ -273,20 +281,37 @@ static Napi::Object OfflineTtsGenerateWrapper(const Napi::CallbackInfo &info) {
|
|||||||
const SherpaOnnxGeneratedAudio *audio =
|
const SherpaOnnxGeneratedAudio *audio =
|
||||||
SherpaOnnxOfflineTtsGenerate(tts, text.c_str(), sid, speed);
|
SherpaOnnxOfflineTtsGenerate(tts, text.c_str(), sid, speed);
|
||||||
|
|
||||||
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
if (enable_external_buffer) {
|
||||||
env, const_cast<float *>(audio->samples), sizeof(float) * audio->n,
|
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
||||||
[](Napi::Env /*env*/, void * /*data*/,
|
env, const_cast<float *>(audio->samples), sizeof(float) * audio->n,
|
||||||
const SherpaOnnxGeneratedAudio *hint) {
|
[](Napi::Env /*env*/, void * /*data*/,
|
||||||
SherpaOnnxDestroyOfflineTtsGeneratedAudio(hint);
|
const SherpaOnnxGeneratedAudio *hint) {
|
||||||
},
|
SherpaOnnxDestroyOfflineTtsGeneratedAudio(hint);
|
||||||
audio);
|
},
|
||||||
Napi::Float32Array float32Array =
|
audio);
|
||||||
Napi::Float32Array::New(env, audio->n, arrayBuffer, 0);
|
Napi::Float32Array float32Array =
|
||||||
|
Napi::Float32Array::New(env, audio->n, arrayBuffer, 0);
|
||||||
|
|
||||||
Napi::Object ans = Napi::Object::New(env);
|
Napi::Object ans = Napi::Object::New(env);
|
||||||
ans.Set(Napi::String::New(env, "samples"), float32Array);
|
ans.Set(Napi::String::New(env, "samples"), float32Array);
|
||||||
ans.Set(Napi::String::New(env, "sampleRate"), audio->sample_rate);
|
ans.Set(Napi::String::New(env, "sampleRate"), audio->sample_rate);
|
||||||
return ans;
|
return ans;
|
||||||
|
} else {
|
||||||
|
// don't use external buffer
|
||||||
|
Napi::ArrayBuffer arrayBuffer =
|
||||||
|
Napi::ArrayBuffer::New(env, sizeof(float) * audio->n);
|
||||||
|
|
||||||
|
Napi::Float32Array float32Array =
|
||||||
|
Napi::Float32Array::New(env, audio->n, arrayBuffer, 0);
|
||||||
|
|
||||||
|
std::copy(audio->samples, audio->samples + audio->n, float32Array.Data());
|
||||||
|
|
||||||
|
Napi::Object ans = Napi::Object::New(env);
|
||||||
|
ans.Set(Napi::String::New(env, "samples"), float32Array);
|
||||||
|
ans.Set(Napi::String::New(env, "sampleRate"), audio->sample_rate);
|
||||||
|
SherpaOnnxDestroyOfflineTtsGeneratedAudio(audio);
|
||||||
|
return ans;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void InitNonStreamingTts(Napi::Env env, Napi::Object exports) {
|
void InitNonStreamingTts(Napi::Env env, Napi::Object exports) {
|
||||||
|
|||||||
@@ -1,6 +1,7 @@
|
|||||||
// scripts/node-addon-api/src/speaker-identification.cc
|
// scripts/node-addon-api/src/speaker-identification.cc
|
||||||
//
|
//
|
||||||
// Copyright (c) 2024 Xiaomi Corporation
|
// Copyright (c) 2024 Xiaomi Corporation
|
||||||
|
#include <algorithm>
|
||||||
#include <sstream>
|
#include <sstream>
|
||||||
|
|
||||||
#include "macros.h" // NOLINT
|
#include "macros.h" // NOLINT
|
||||||
@@ -175,9 +176,9 @@ static Napi::Boolean SpeakerEmbeddingExtractorIsReadyWrapper(
|
|||||||
static Napi::Float32Array SpeakerEmbeddingExtractorComputeEmbeddingWrapper(
|
static Napi::Float32Array SpeakerEmbeddingExtractorComputeEmbeddingWrapper(
|
||||||
const Napi::CallbackInfo &info) {
|
const Napi::CallbackInfo &info) {
|
||||||
Napi::Env env = info.Env();
|
Napi::Env env = info.Env();
|
||||||
if (info.Length() != 2) {
|
if (info.Length() != 2 && info.Length() != 3) {
|
||||||
std::ostringstream os;
|
std::ostringstream os;
|
||||||
os << "Expect only 2 arguments. Given: " << info.Length();
|
os << "Expect only 2 or 3 arguments. Given: " << info.Length();
|
||||||
|
|
||||||
Napi::TypeError::New(env, os.str()).ThrowAsJavaScriptException();
|
Napi::TypeError::New(env, os.str()).ThrowAsJavaScriptException();
|
||||||
|
|
||||||
@@ -199,6 +200,16 @@ static Napi::Float32Array SpeakerEmbeddingExtractorComputeEmbeddingWrapper(
|
|||||||
return {};
|
return {};
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool enable_external_buffer = true;
|
||||||
|
if (info.Length() == 3) {
|
||||||
|
if (info[2].IsBoolean()) {
|
||||||
|
enable_external_buffer = info[2].As<Napi::Boolean>().Value();
|
||||||
|
} else {
|
||||||
|
Napi::TypeError::New(env, "Argument 2 should be a boolean.")
|
||||||
|
.ThrowAsJavaScriptException();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
SherpaOnnxSpeakerEmbeddingExtractor *extractor =
|
SherpaOnnxSpeakerEmbeddingExtractor *extractor =
|
||||||
info[0].As<Napi::External<SherpaOnnxSpeakerEmbeddingExtractor>>().Data();
|
info[0].As<Napi::External<SherpaOnnxSpeakerEmbeddingExtractor>>().Data();
|
||||||
|
|
||||||
@@ -210,14 +221,29 @@ static Napi::Float32Array SpeakerEmbeddingExtractorComputeEmbeddingWrapper(
|
|||||||
|
|
||||||
int32_t dim = SherpaOnnxSpeakerEmbeddingExtractorDim(extractor);
|
int32_t dim = SherpaOnnxSpeakerEmbeddingExtractorDim(extractor);
|
||||||
|
|
||||||
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
if (enable_external_buffer) {
|
||||||
env, const_cast<float *>(v), sizeof(float) * dim,
|
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
||||||
[](Napi::Env /*env*/, void *data) {
|
env, const_cast<float *>(v), sizeof(float) * dim,
|
||||||
SherpaOnnxSpeakerEmbeddingExtractorDestroyEmbedding(
|
[](Napi::Env /*env*/, void *data) {
|
||||||
reinterpret_cast<float *>(data));
|
SherpaOnnxSpeakerEmbeddingExtractorDestroyEmbedding(
|
||||||
});
|
reinterpret_cast<float *>(data));
|
||||||
|
});
|
||||||
|
|
||||||
return Napi::Float32Array::New(env, dim, arrayBuffer, 0);
|
return Napi::Float32Array::New(env, dim, arrayBuffer, 0);
|
||||||
|
} else {
|
||||||
|
// don't use external buffer
|
||||||
|
Napi::ArrayBuffer arrayBuffer =
|
||||||
|
Napi::ArrayBuffer::New(env, sizeof(float) * dim);
|
||||||
|
|
||||||
|
Napi::Float32Array float32Array =
|
||||||
|
Napi::Float32Array::New(env, dim, arrayBuffer, 0);
|
||||||
|
|
||||||
|
std::copy(v, v + dim, float32Array.Data());
|
||||||
|
|
||||||
|
SherpaOnnxSpeakerEmbeddingExtractorDestroyEmbedding(v);
|
||||||
|
|
||||||
|
return float32Array;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
static Napi::External<SherpaOnnxSpeakerEmbeddingManager>
|
static Napi::External<SherpaOnnxSpeakerEmbeddingManager>
|
||||||
|
|||||||
@@ -2,6 +2,7 @@
|
|||||||
//
|
//
|
||||||
// Copyright (c) 2024 Xiaomi Corporation
|
// Copyright (c) 2024 Xiaomi Corporation
|
||||||
|
|
||||||
|
#include <algorithm>
|
||||||
#include <sstream>
|
#include <sstream>
|
||||||
|
|
||||||
#include "macros.h" // NOLINT
|
#include "macros.h" // NOLINT
|
||||||
@@ -75,9 +76,9 @@ static Napi::Float32Array CircularBufferGetWrapper(
|
|||||||
const Napi::CallbackInfo &info) {
|
const Napi::CallbackInfo &info) {
|
||||||
Napi::Env env = info.Env();
|
Napi::Env env = info.Env();
|
||||||
|
|
||||||
if (info.Length() != 3) {
|
if (info.Length() != 3 && info.Length() != 4) {
|
||||||
std::ostringstream os;
|
std::ostringstream os;
|
||||||
os << "Expect only 3 arguments. Given: " << info.Length();
|
os << "Expect only 3 or 4 arguments. Given: " << info.Length();
|
||||||
|
|
||||||
Napi::TypeError::New(env, os.str()).ThrowAsJavaScriptException();
|
Napi::TypeError::New(env, os.str()).ThrowAsJavaScriptException();
|
||||||
|
|
||||||
@@ -108,21 +109,46 @@ static Napi::Float32Array CircularBufferGetWrapper(
|
|||||||
return {};
|
return {};
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool enable_external_buffer = true;
|
||||||
|
if (info.Length() == 4) {
|
||||||
|
if (info[3].IsBoolean()) {
|
||||||
|
enable_external_buffer = info[3].As<Napi::Boolean>().Value();
|
||||||
|
} else {
|
||||||
|
Napi::TypeError::New(env, "Argument 3 should be a boolean.")
|
||||||
|
.ThrowAsJavaScriptException();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
int32_t start_index = info[1].As<Napi::Number>().Int32Value();
|
int32_t start_index = info[1].As<Napi::Number>().Int32Value();
|
||||||
int32_t n = info[2].As<Napi::Number>().Int32Value();
|
int32_t n = info[2].As<Napi::Number>().Int32Value();
|
||||||
|
|
||||||
const float *data = SherpaOnnxCircularBufferGet(buf, start_index, n);
|
const float *data = SherpaOnnxCircularBufferGet(buf, start_index, n);
|
||||||
|
|
||||||
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
if (enable_external_buffer) {
|
||||||
env, const_cast<float *>(data), sizeof(float) * n,
|
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
||||||
[](Napi::Env /*env*/, void *p) {
|
env, const_cast<float *>(data), sizeof(float) * n,
|
||||||
SherpaOnnxCircularBufferFree(reinterpret_cast<const float *>(p));
|
[](Napi::Env /*env*/, void *p) {
|
||||||
});
|
SherpaOnnxCircularBufferFree(reinterpret_cast<const float *>(p));
|
||||||
|
});
|
||||||
|
|
||||||
Napi::Float32Array float32Array =
|
Napi::Float32Array float32Array =
|
||||||
Napi::Float32Array::New(env, n, arrayBuffer, 0);
|
Napi::Float32Array::New(env, n, arrayBuffer, 0);
|
||||||
|
|
||||||
return float32Array;
|
return float32Array;
|
||||||
|
} else {
|
||||||
|
// don't use external buffer
|
||||||
|
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
||||||
|
env, const_cast<float *>(data), sizeof(float) * n);
|
||||||
|
|
||||||
|
Napi::Float32Array float32Array =
|
||||||
|
Napi::Float32Array::New(env, n, arrayBuffer, 0);
|
||||||
|
|
||||||
|
std::copy(data, data + n, float32Array.Data());
|
||||||
|
|
||||||
|
SherpaOnnxCircularBufferFree(data);
|
||||||
|
|
||||||
|
return float32Array;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
static void CircularBufferPopWrapper(const Napi::CallbackInfo &info) {
|
static void CircularBufferPopWrapper(const Napi::CallbackInfo &info) {
|
||||||
@@ -470,9 +496,9 @@ static Napi::Object VoiceActivityDetectorFrontWrapper(
|
|||||||
const Napi::CallbackInfo &info) {
|
const Napi::CallbackInfo &info) {
|
||||||
Napi::Env env = info.Env();
|
Napi::Env env = info.Env();
|
||||||
|
|
||||||
if (info.Length() != 1) {
|
if (info.Length() != 1 && info.Length() != 2) {
|
||||||
std::ostringstream os;
|
std::ostringstream os;
|
||||||
os << "Expect only 1 argument. Given: " << info.Length();
|
os << "Expect only 1 or 2 arguments. Given: " << info.Length();
|
||||||
|
|
||||||
Napi::TypeError::New(env, os.str()).ThrowAsJavaScriptException();
|
Napi::TypeError::New(env, os.str()).ThrowAsJavaScriptException();
|
||||||
|
|
||||||
@@ -486,28 +512,57 @@ static Napi::Object VoiceActivityDetectorFrontWrapper(
|
|||||||
return {};
|
return {};
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool enable_external_buffer = true;
|
||||||
|
if (info.Length() == 2) {
|
||||||
|
if (info[1].IsBoolean()) {
|
||||||
|
enable_external_buffer = info[1].As<Napi::Boolean>().Value();
|
||||||
|
} else {
|
||||||
|
Napi::TypeError::New(env, "Argument 1 should be a boolean.")
|
||||||
|
.ThrowAsJavaScriptException();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
SherpaOnnxVoiceActivityDetector *vad =
|
SherpaOnnxVoiceActivityDetector *vad =
|
||||||
info[0].As<Napi::External<SherpaOnnxVoiceActivityDetector>>().Data();
|
info[0].As<Napi::External<SherpaOnnxVoiceActivityDetector>>().Data();
|
||||||
|
|
||||||
const SherpaOnnxSpeechSegment *segment =
|
const SherpaOnnxSpeechSegment *segment =
|
||||||
SherpaOnnxVoiceActivityDetectorFront(vad);
|
SherpaOnnxVoiceActivityDetectorFront(vad);
|
||||||
|
|
||||||
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
if (enable_external_buffer) {
|
||||||
env, const_cast<float *>(segment->samples), sizeof(float) * segment->n,
|
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
||||||
[](Napi::Env /*env*/, void * /*data*/,
|
env, const_cast<float *>(segment->samples), sizeof(float) * segment->n,
|
||||||
const SherpaOnnxSpeechSegment *hint) {
|
[](Napi::Env /*env*/, void * /*data*/,
|
||||||
SherpaOnnxDestroySpeechSegment(hint);
|
const SherpaOnnxSpeechSegment *hint) {
|
||||||
},
|
SherpaOnnxDestroySpeechSegment(hint);
|
||||||
segment);
|
},
|
||||||
|
segment);
|
||||||
|
|
||||||
Napi::Float32Array float32Array =
|
Napi::Float32Array float32Array =
|
||||||
Napi::Float32Array::New(env, segment->n, arrayBuffer, 0);
|
Napi::Float32Array::New(env, segment->n, arrayBuffer, 0);
|
||||||
|
|
||||||
Napi::Object obj = Napi::Object::New(env);
|
Napi::Object obj = Napi::Object::New(env);
|
||||||
obj.Set(Napi::String::New(env, "start"), segment->start);
|
obj.Set(Napi::String::New(env, "start"), segment->start);
|
||||||
obj.Set(Napi::String::New(env, "samples"), float32Array);
|
obj.Set(Napi::String::New(env, "samples"), float32Array);
|
||||||
|
|
||||||
return obj;
|
return obj;
|
||||||
|
} else {
|
||||||
|
Napi::ArrayBuffer arrayBuffer =
|
||||||
|
Napi::ArrayBuffer::New(env, sizeof(float) * segment->n);
|
||||||
|
|
||||||
|
Napi::Float32Array float32Array =
|
||||||
|
Napi::Float32Array::New(env, segment->n, arrayBuffer, 0);
|
||||||
|
|
||||||
|
std::copy(segment->samples, segment->samples + segment->n,
|
||||||
|
float32Array.Data());
|
||||||
|
|
||||||
|
Napi::Object obj = Napi::Object::New(env);
|
||||||
|
obj.Set(Napi::String::New(env, "start"), segment->start);
|
||||||
|
obj.Set(Napi::String::New(env, "samples"), float32Array);
|
||||||
|
|
||||||
|
SherpaOnnxDestroySpeechSegment(segment);
|
||||||
|
|
||||||
|
return obj;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
static void VoiceActivityDetectorResetWrapper(const Napi::CallbackInfo &info) {
|
static void VoiceActivityDetectorResetWrapper(const Napi::CallbackInfo &info) {
|
||||||
|
|||||||
@@ -2,6 +2,7 @@
|
|||||||
//
|
//
|
||||||
// Copyright (c) 2024 Xiaomi Corporation
|
// Copyright (c) 2024 Xiaomi Corporation
|
||||||
|
|
||||||
|
#include <algorithm>
|
||||||
#include <sstream>
|
#include <sstream>
|
||||||
|
|
||||||
#include "napi.h" // NOLINT
|
#include "napi.h" // NOLINT
|
||||||
@@ -9,16 +10,17 @@
|
|||||||
|
|
||||||
static Napi::Object ReadWaveWrapper(const Napi::CallbackInfo &info) {
|
static Napi::Object ReadWaveWrapper(const Napi::CallbackInfo &info) {
|
||||||
Napi::Env env = info.Env();
|
Napi::Env env = info.Env();
|
||||||
if (info.Length() != 1) {
|
if (info.Length() > 2) {
|
||||||
std::ostringstream os;
|
std::ostringstream os;
|
||||||
os << "Expect only 1 argument. Given: " << info.Length();
|
os << "Expect only 2 arguments. Given: " << info.Length();
|
||||||
|
|
||||||
Napi::TypeError::New(env, os.str()).ThrowAsJavaScriptException();
|
Napi::TypeError::New(env, os.str()).ThrowAsJavaScriptException();
|
||||||
|
|
||||||
return {};
|
return {};
|
||||||
}
|
}
|
||||||
|
|
||||||
if (!info[0].IsString()) {
|
if (!info[0].IsString()) {
|
||||||
Napi::TypeError::New(env, "Argument should be a string")
|
Napi::TypeError::New(env, "Argument 0 should be a string")
|
||||||
.ThrowAsJavaScriptException();
|
.ThrowAsJavaScriptException();
|
||||||
|
|
||||||
return {};
|
return {};
|
||||||
@@ -26,6 +28,18 @@ static Napi::Object ReadWaveWrapper(const Napi::CallbackInfo &info) {
|
|||||||
|
|
||||||
std::string filename = info[0].As<Napi::String>().Utf8Value();
|
std::string filename = info[0].As<Napi::String>().Utf8Value();
|
||||||
|
|
||||||
|
bool enable_external_buffer = true;
|
||||||
|
if (info.Length() == 2) {
|
||||||
|
if (info[1].IsBoolean()) {
|
||||||
|
enable_external_buffer = info[1].As<Napi::Boolean>().Value();
|
||||||
|
} else {
|
||||||
|
Napi::TypeError::New(env, "Argument 1 should be a boolean")
|
||||||
|
.ThrowAsJavaScriptException();
|
||||||
|
|
||||||
|
return {};
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
const SherpaOnnxWave *wave = SherpaOnnxReadWave(filename.c_str());
|
const SherpaOnnxWave *wave = SherpaOnnxReadWave(filename.c_str());
|
||||||
if (!wave) {
|
if (!wave) {
|
||||||
std::ostringstream os;
|
std::ostringstream os;
|
||||||
@@ -35,20 +49,40 @@ static Napi::Object ReadWaveWrapper(const Napi::CallbackInfo &info) {
|
|||||||
return {};
|
return {};
|
||||||
}
|
}
|
||||||
|
|
||||||
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
if (enable_external_buffer) {
|
||||||
env, const_cast<float *>(wave->samples),
|
Napi::ArrayBuffer arrayBuffer = Napi::ArrayBuffer::New(
|
||||||
sizeof(float) * wave->num_samples,
|
env, const_cast<float *>(wave->samples),
|
||||||
[](Napi::Env /*env*/, void * /*data*/, const SherpaOnnxWave *hint) {
|
sizeof(float) * wave->num_samples,
|
||||||
SherpaOnnxFreeWave(hint);
|
[](Napi::Env /*env*/, void * /*data*/, const SherpaOnnxWave *hint) {
|
||||||
},
|
SherpaOnnxFreeWave(hint);
|
||||||
wave);
|
},
|
||||||
Napi::Float32Array float32Array =
|
wave);
|
||||||
Napi::Float32Array::New(env, wave->num_samples, arrayBuffer, 0);
|
Napi::Float32Array float32Array =
|
||||||
|
Napi::Float32Array::New(env, wave->num_samples, arrayBuffer, 0);
|
||||||
|
|
||||||
Napi::Object obj = Napi::Object::New(env);
|
Napi::Object obj = Napi::Object::New(env);
|
||||||
obj.Set(Napi::String::New(env, "samples"), float32Array);
|
obj.Set(Napi::String::New(env, "samples"), float32Array);
|
||||||
obj.Set(Napi::String::New(env, "sampleRate"), wave->sample_rate);
|
obj.Set(Napi::String::New(env, "sampleRate"), wave->sample_rate);
|
||||||
return obj;
|
return obj;
|
||||||
|
} else {
|
||||||
|
// don't use external buffer
|
||||||
|
Napi::ArrayBuffer arrayBuffer =
|
||||||
|
Napi::ArrayBuffer::New(env, sizeof(float) * wave->num_samples);
|
||||||
|
|
||||||
|
Napi::Float32Array float32Array =
|
||||||
|
Napi::Float32Array::New(env, wave->num_samples, arrayBuffer, 0);
|
||||||
|
|
||||||
|
std::copy(wave->samples, wave->samples + wave->num_samples,
|
||||||
|
float32Array.Data());
|
||||||
|
|
||||||
|
Napi::Object obj = Napi::Object::New(env);
|
||||||
|
obj.Set(Napi::String::New(env, "samples"), float32Array);
|
||||||
|
obj.Set(Napi::String::New(env, "sampleRate"), wave->sample_rate);
|
||||||
|
|
||||||
|
SherpaOnnxFreeWave(wave);
|
||||||
|
|
||||||
|
return obj;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void InitWaveReader(Napi::Env env, Napi::Object exports) {
|
void InitWaveReader(Napi::Env env, Napi::Object exports) {
|
||||||
|
|||||||
Reference in New Issue
Block a user