Add Java API for spoken language identification with whisper multilingual models (#817)

2024-04-26 19:05:39 +08:00
parent f2d074aea9
commit db25986240
12 changed files with 406 additions and 11 deletions
--- a/sherpa-onnx/java-api/src/com/k2fsa/sherpa/onnx/SpokenLanguageIdentificationWhisperConfig.java
+++ b/sherpa-onnx/java-api/src/com/k2fsa/sherpa/onnx/SpokenLanguageIdentificationWhisperConfig.java
@@ -0,0 +1,56 @@
+// Copyright 2024 Xiaomi Corporation
+
+package com.k2fsa.sherpa.onnx;
+
+public class SpokenLanguageIdentificationWhisperConfig { // Immutable holder of the whisper settings (encoder, decoder, tailPaddings); obtain instances through builder().
+    private final String encoder; // presumably the path of the whisper encoder model file -- TODO confirm against the consumer of this config
+    private final String decoder; // presumably the path of the whisper decoder model file -- TODO confirm against the consumer of this config
+    private final int tailPaddings; // number of frames to pad; copied unchanged from the Builder
+
+    private SpokenLanguageIdentificationWhisperConfig(Builder builder) { // private, so instances are created via Builder.build()
+        this.encoder = builder.encoder;
+        this.decoder = builder.decoder;
+        this.tailPaddings = builder.tailPaddings;
+    }
+
+    public static Builder builder() { // entry point: returns a fresh Builder preloaded with the defaults ("", "", 1000)
+        return new Builder();
+    }
+
+    public String getEncoder() { // returns the encoder value exactly as given to the Builder ("" if never set)
+        return encoder;
+    }
+
+    public String getDecoder() { // returns the decoder value exactly as given to the Builder ("" if never set)
+        return decoder;
+    }
+
+    public int getTailPaddings() { // returns the tail padding value given to the Builder (1000 if never set)
+        return tailPaddings;
+    }
+
+    public static class Builder { // Mutable, chainable builder; the setters store their argument as-is, without any validation.
+        private String encoder = ""; // default: empty string
+        private String decoder = ""; // default: empty string
+        private int tailPaddings = 1000; // default number of frames to pad; what is padded is not visible here (presumably the tail of the input features -- confirm)
+
+        public SpokenLanguageIdentificationWhisperConfig build() { // snapshots the builder's current values into a new immutable config
+            return new SpokenLanguageIdentificationWhisperConfig(this);
+        }
+
+        public Builder setEncoder(String encoder) { // stores the value (null is not rejected here) and returns this builder for chaining
+            this.encoder = encoder;
+            return this;
+        }
+
+        public Builder setDecoder(String decoder) { // stores the value (null is not rejected here) and returns this builder for chaining
+            this.decoder = decoder;
+            return this;
+        }
+
+        public Builder setTailPaddings(int tailPaddings) { // stores the value (no range check) and returns this builder for chaining
+            this.tailPaddings = tailPaddings;
+            return this;
+        }
+    }
+}