Add Java API for spoken language identification with whisper multilingual models (#817)

This commit is contained in:
Fangjun Kuang
2024-04-26 19:05:39 +08:00
committed by GitHub
parent f2d074aea9
commit db25986240
12 changed files with 406 additions and 11 deletions

View File

@@ -0,0 +1,59 @@
// Copyright 2024 Xiaomi Corporation
package com.k2fsa.sherpa.onnx;
import java.util.HashMap;
import java.util.Locale;
import java.util.Map;
public class SpokenLanguageIdentification {
static {
System.loadLibrary("sherpa-onnx-jni");
}
private final Map<String, String> localeMap;
private long ptr = 0; // this is the asr engine ptrss
public SpokenLanguageIdentification(SpokenLanguageIdentificationConfig config) {
ptr = newFromFile(config);
String[] languages = Locale.getISOLanguages();
localeMap = new HashMap<String, String>(languages.length);
for (String language : languages) {
Locale locale = new Locale(language);
localeMap.put(language, locale.getDisplayName());
}
}
public String compute(OfflineStream stream) {
String lang = compute(ptr, stream.getPtr());
return localeMap.getOrDefault(lang, lang);
}
public OfflineStream createStream() {
long p = createStream(ptr);
return new OfflineStream(p);
}
@Override
protected void finalize() throws Throwable {
release();
}
// You'd better call it manually if it is not used anymore
public void release() {
if (this.ptr == 0) {
return;
}
delete(this.ptr);
this.ptr = 0;
}
private native void delete(long ptr);
private native long newFromFile(SpokenLanguageIdentificationConfig config);
private native long createStream(long ptr);
private native String compute(long ptr, long streamPtr);
}