Add Java API for spoken language identification with whisper multilingual models (#817)

This commit is contained in:
Fangjun Kuang
2024-04-26 19:05:39 +08:00
committed by GitHub
parent f2d074aea9
commit db25986240
12 changed files with 406 additions and 11 deletions

View File

@@ -0,0 +1,56 @@
// Copyright 2024 Xiaomi Corporation
package com.k2fsa.sherpa.onnx;
/**
 * Immutable holder for the Whisper model settings used by spoken language
 * identification.
 *
 * <p>Instances are created through {@link #builder()}; once built, the values
 * can only be read.
 *
 * <p>NOTE(review): the private field names below may be looked up by name from
 * native code -- confirm before renaming any of them.
 */
public class SpokenLanguageIdentificationWhisperConfig {
    // Encoder model identifier; presumably a file path -- verify against the consumer.
    private final String encoder;
    // Decoder model identifier; presumably a file path -- verify against the consumer.
    private final String decoder;
    // Number of frames to pad.
    private final int tailPaddings;

    /**
     * Creates a new builder pre-populated with the default values.
     *
     * @return a fresh {@link Builder}
     */
    public static Builder builder() {
        return new Builder();
    }

    /** Copies the current state of the given builder into a new config. */
    private SpokenLanguageIdentificationWhisperConfig(Builder source) {
        encoder = source.encoder;
        decoder = source.decoder;
        tailPaddings = source.tailPaddings;
    }

    /** @return the encoder value supplied to the builder (empty string by default) */
    public String getEncoder() {
        return this.encoder;
    }

    /** @return the decoder value supplied to the builder (empty string by default) */
    public String getDecoder() {
        return this.decoder;
    }

    /** @return the number of frames to pad (1000 by default) */
    public int getTailPaddings() {
        return this.tailPaddings;
    }

    /**
     * Fluent builder for {@link SpokenLanguageIdentificationWhisperConfig}.
     *
     * <p>Every setter returns this builder so calls can be chained.
     */
    public static class Builder {
        private String encoder = "";
        private String decoder = "";
        // Default number of frames to pad.
        private int tailPaddings = 1000;

        /**
         * Sets the encoder value.
         *
         * @param encoder value stored as-is; no validation is performed
         * @return this builder
         */
        public Builder setEncoder(String encoder) {
            this.encoder = encoder;
            return this;
        }

        /**
         * Sets the decoder value.
         *
         * @param decoder value stored as-is; no validation is performed
         * @return this builder
         */
        public Builder setDecoder(String decoder) {
            this.decoder = decoder;
            return this;
        }

        /**
         * Sets the number of frames to pad.
         *
         * @param tailPaddings value stored as-is; no range check is performed
         * @return this builder
         */
        public Builder setTailPaddings(int tailPaddings) {
            this.tailPaddings = tailPaddings;
            return this;
        }

        /**
         * Builds a config from the values currently held by this builder.
         *
         * @return a new {@link SpokenLanguageIdentificationWhisperConfig}
         */
        public SpokenLanguageIdentificationWhisperConfig build() {
            return new SpokenLanguageIdentificationWhisperConfig(this);
        }
    }
}