diff --git a/.github/workflows/apk-spoken-language-identification.yaml b/.github/workflows/apk-spoken-language-identification.yaml
new file mode 100644
index 00000000..39e1e1b7
--- /dev/null
+++ b/.github/workflows/apk-spoken-language-identification.yaml
@@ -0,0 +1,174 @@
+name: apk-slid
+
+on:
+ push:
+ tags:
+ - '*'
+
+ workflow_dispatch:
+
+concurrency:
+ group: apk-slid-${{ github.ref }}
+ cancel-in-progress: true
+
+permissions:
+ contents: write
+
+jobs:
+ apk_slid:
+ if: github.repository_owner == 'csukuangfj' || github.repository_owner == 'k2-fsa'
+ runs-on: ${{ matrix.os }}
+ name: apk for slid ${{ matrix.index }}/${{ matrix.total }}
+ strategy:
+ fail-fast: false
+ matrix:
+ os: [ubuntu-latest]
+ total: ["1"]
+ index: ["0"]
+
+ steps:
+ - uses: actions/checkout@v4
+ with:
+ fetch-depth: 0
+
+ # https://github.com/actions/setup-java
+ - uses: actions/setup-java@v4
+ with:
+ distribution: 'temurin' # See 'Supported distributions' for available options
+ java-version: '21'
+
+ - name: ccache
+ uses: hendrikmuhs/ccache-action@v1.2
+ with:
+ key: ${{ matrix.os }}-android
+
+ - name: Display NDK HOME
+ shell: bash
+ run: |
+ echo "ANDROID_NDK_LATEST_HOME: ${ANDROID_NDK_LATEST_HOME}"
+ ls -lh ${ANDROID_NDK_LATEST_HOME}
+
+ - name: Install Python dependencies
+ shell: bash
+ run: |
+ python3 -m pip install --upgrade pip jinja2
+
+ - name: Setup build tool version variable
+   shell: bash
+   run: |
+     # List the SDK layout so the selected version can be checked in the log.
+     echo "---"
+     ls -lh /usr/local/lib/android/
+     echo "---"
+
+     ls -lh /usr/local/lib/android/sdk
+     echo "---"
+
+     ls -lh /usr/local/lib/android/sdk/build-tools
+     echo "---"
+
+     # Select the highest installed build-tools version. Plain `ls` orders
+     # names lexically (e.g. 9.0.0 after 34.0.0), so sort by version first.
+     BUILD_TOOL_VERSION=$(ls /usr/local/lib/android/sdk/build-tools/ | sort -V | tail -n 1)
+     # Export it for later steps (the signing step reads env.BUILD_TOOL_VERSION).
+     echo "BUILD_TOOL_VERSION=$BUILD_TOOL_VERSION" >> "$GITHUB_ENV"
+     echo "Last build tool version is: $BUILD_TOOL_VERSION"
+
+ - name: Generate build script
+ shell: bash
+ run: |
+ cd scripts/apk
+
+ total=${{ matrix.total }}
+ index=${{ matrix.index }}
+
+ ./generate-slid-apk-script.py --total $total --index $index
+
+ chmod +x build-apk-slid.sh
+ mv -v ./build-apk-slid.sh ../..
+
+ - name: build APK
+ shell: bash
+ run: |
+ export CMAKE_CXX_COMPILER_LAUNCHER=ccache
+ export PATH="/usr/lib/ccache:/usr/local/opt/ccache/libexec:$PATH"
+ cmake --version
+
+ export ANDROID_NDK=$ANDROID_NDK_LATEST_HOME
+ ./build-apk-slid.sh
+
+ - name: Display APK
+ shell: bash
+ run: |
+ ls -lh ./apks/
+ du -h -d1 .
+
+ # https://github.com/marketplace/actions/sign-android-release
+ - uses: r0adkll/sign-android-release@v1
+ name: Sign app APK
+ with:
+ releaseDirectory: ./apks
+ signingKeyBase64: ${{ secrets.ANDROID_SIGNING_KEY }}
+ alias: ${{ secrets.ANDROID_SIGNING_KEY_ALIAS }}
+ keyStorePassword: ${{ secrets.ANDROID_SIGNING_KEY_STORE_PASSWORD }}
+ env:
+ BUILD_TOOLS_VERSION: ${{ env.BUILD_TOOL_VERSION }}
+
+ - name: Display APK for slid after signing
+ shell: bash
+ run: |
+ ls -lh ./apks/
+ du -h -d1 .
+
+ - name: Rename APK for slid after signing
+   shell: bash
+   run: |
+     cd apks
+     # Drop the by-products of the signing step; only *-signed.apk is kept.
+     rm -fv signingKey.jks
+     rm -fv *.apk.idsig
+     rm -fv *-aligned.apk
+
+     echo "----"
+     # Fails the step (as before) when no signed APK was produced.
+     ls -1 *-signed.apk
+     echo "----"
+     # Iterate over the glob itself instead of word-splitting `ls` output,
+     # and quote every expansion so unusual file names stay intact.
+     for apk in *-signed.apk; do
+       # Remove the first "-signed" from the name, e.g. foo-signed.apk -> foo.apk
+       n="${apk/-signed/}"
+       mv -v "$apk" "$n"
+     done
+
+     cd ..
+
+     ls -lh ./apks/
+     du -h -d1 .
+
+ - name: Display APK after rename
+ shell: bash
+ run: |
+ ls -lh ./apks/
+ du -h -d1 .
+
+ - name: Publish to huggingface
+   env:
+     HF_TOKEN: ${{ secrets.HF_TOKEN }}
+   uses: nick-fields/retry@v3
+   with:
+     max_attempts: 20
+     timeout_seconds: 200
+     shell: bash
+     command: |
+       # Stop at the first failing command so that a failed clone or cd can
+       # never let the git commands below run inside the outer checkout.
+       set -e
+
+       git config --global user.email "csukuangfj@gmail.com"
+       git config --global user.name "Fangjun Kuang"
+
+       # Start every attempt from a fresh clone; LFS payloads are not needed.
+       rm -rf huggingface
+       export GIT_LFS_SKIP_SMUDGE=1
+
+       git clone https://huggingface.co/csukuangfj/sherpa-onnx-apk huggingface
+       cd huggingface
+       git fetch
+       git pull
+       git merge -m "merge remote" --ff origin main
+
+       mkdir -p slid
+       cp -v ../apks/*.apk ./slid/
+       git status
+       git lfs track "*.apk"
+       git add .
+
+       # Nothing staged means these APKs are already published; treat that as
+       # success instead of letting `git commit` fail the attempt.
+       if git diff --cached --quiet; then
+         echo "No changes to publish"
+         exit 0
+       fi
+
+       git commit -m "add more apks"
+       git push https://csukuangfj:$HF_TOKEN@huggingface.co/csukuangfj/sherpa-onnx-apk main
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/.gitignore b/android/SherpaOnnxSpokenLanguageIdentification/.gitignore
new file mode 100644
index 00000000..aa724b77
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/.gitignore
@@ -0,0 +1,15 @@
+*.iml
+.gradle
+/local.properties
+/.idea/caches
+/.idea/libraries
+/.idea/modules.xml
+/.idea/workspace.xml
+/.idea/navEditor.xml
+/.idea/assetWizardSettings.xml
+.DS_Store
+/build
+/captures
+.externalNativeBuild
+.cxx
+local.properties
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/.gitignore b/android/SherpaOnnxSpokenLanguageIdentification/app/.gitignore
new file mode 100644
index 00000000..42afabfd
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/.gitignore
@@ -0,0 +1 @@
+/build
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/build.gradle.kts b/android/SherpaOnnxSpokenLanguageIdentification/app/build.gradle.kts
new file mode 100644
index 00000000..63858267
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/build.gradle.kts
@@ -0,0 +1,69 @@
+plugins {
+ id("com.android.application")
+ id("org.jetbrains.kotlin.android")
+}
+
+android {
+ namespace = "com.k2fsa.sherpa.onnx.slid"
+ compileSdk = 34
+
+ defaultConfig {
+ applicationId = "com.k2fsa.sherpa.onnx.slid"
+ minSdk = 21
+ targetSdk = 34
+ versionCode = 1
+ versionName = "1.0"
+
+ testInstrumentationRunner = "androidx.test.runner.AndroidJUnitRunner"
+ vectorDrawables {
+ useSupportLibrary = true
+ }
+ }
+
+ buildTypes {
+ release {
+ isMinifyEnabled = false
+ proguardFiles(
+ getDefaultProguardFile("proguard-android-optimize.txt"),
+ "proguard-rules.pro"
+ )
+ }
+ }
+ compileOptions {
+ sourceCompatibility = JavaVersion.VERSION_1_8
+ targetCompatibility = JavaVersion.VERSION_1_8
+ }
+ kotlinOptions {
+ jvmTarget = "1.8"
+ }
+ buildFeatures {
+ compose = true
+ }
+ composeOptions {
+ kotlinCompilerExtensionVersion = "1.5.1"
+ }
+ packaging {
+ resources {
+ excludes += "/META-INF/{AL2.0,LGPL2.1}"
+ }
+ }
+}
+
+dependencies {
+
+ implementation("androidx.core:core-ktx:1.12.0")
+ implementation("androidx.lifecycle:lifecycle-runtime-ktx:2.7.0")
+ implementation("androidx.activity:activity-compose:1.8.2")
+ implementation(platform("androidx.compose:compose-bom:2023.08.00"))
+ implementation("androidx.compose.ui:ui")
+ implementation("androidx.compose.ui:ui-graphics")
+ implementation("androidx.compose.ui:ui-tooling-preview")
+ implementation("androidx.compose.material3:material3")
+ testImplementation("junit:junit:4.13.2")
+ androidTestImplementation("androidx.test.ext:junit:1.1.5")
+ androidTestImplementation("androidx.test.espresso:espresso-core:3.5.1")
+ androidTestImplementation(platform("androidx.compose:compose-bom:2023.08.00"))
+ androidTestImplementation("androidx.compose.ui:ui-test-junit4")
+ debugImplementation("androidx.compose.ui:ui-tooling")
+ debugImplementation("androidx.compose.ui:ui-test-manifest")
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/proguard-rules.pro b/android/SherpaOnnxSpokenLanguageIdentification/app/proguard-rules.pro
new file mode 100644
index 00000000..481bb434
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/proguard-rules.pro
@@ -0,0 +1,21 @@
+# Add project specific ProGuard rules here.
+# You can control the set of applied configuration files using the
+# proguardFiles setting in build.gradle.
+#
+# For more details, see
+# http://developer.android.com/guide/developing/tools/proguard.html
+
+# If your project uses WebView with JS, uncomment the following
+# and specify the fully qualified class name to the JavaScript interface
+# class:
+#-keepclassmembers class fqcn.of.javascript.interface.for.webview {
+# public *;
+#}
+
+# Uncomment this to preserve the line number information for
+# debugging stack traces.
+#-keepattributes SourceFile,LineNumberTable
+
+# If you keep the line number information, uncomment this to
+# hide the original source file name.
+#-renamesourcefileattribute SourceFile
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/androidTest/java/com/k2fsa/sherpa/onnx/slid/ExampleInstrumentedTest.kt b/android/SherpaOnnxSpokenLanguageIdentification/app/src/androidTest/java/com/k2fsa/sherpa/onnx/slid/ExampleInstrumentedTest.kt
new file mode 100644
index 00000000..5cb3e238
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/androidTest/java/com/k2fsa/sherpa/onnx/slid/ExampleInstrumentedTest.kt
@@ -0,0 +1,24 @@
+package com.k2fsa.sherpa.onnx.slid
+
+import androidx.test.platform.app.InstrumentationRegistry
+import androidx.test.ext.junit.runners.AndroidJUnit4
+
+import org.junit.Test
+import org.junit.runner.RunWith
+
+import org.junit.Assert.*
+
+/**
+ * Instrumented test, which will execute on an Android device.
+ *
+ * See [testing documentation](http://d.android.com/tools/testing).
+ */
+@RunWith(AndroidJUnit4::class)
+class ExampleInstrumentedTest {
+ @Test
+ fun useAppContext() {
+ // Context of the app under test.
+ val appContext = InstrumentationRegistry.getInstrumentation().targetContext
+ assertEquals("com.k2fsa.sherpa.onnx.slid", appContext.packageName)
+ }
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/AndroidManifest.xml b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/AndroidManifest.xml
new file mode 100644
index 00000000..df44766e
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/AndroidManifest.xml
@@ -0,0 +1,30 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/assets/.gitignore b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/assets/.gitignore
new file mode 100644
index 00000000..e69de29b
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/Home.kt b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/Home.kt
new file mode 100644
index 00000000..018e3913
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/Home.kt
@@ -0,0 +1,171 @@
+@file:OptIn(ExperimentalMaterial3Api::class, ExperimentalFoundationApi::class)
+
+package com.k2fsa.sherpa.onnx.slid
+
+import android.Manifest
+import android.app.Activity
+import android.content.pm.PackageManager
+import android.media.AudioFormat
+import android.media.AudioRecord
+import android.media.MediaRecorder
+import android.util.Log
+import androidx.compose.foundation.ExperimentalFoundationApi
+import androidx.compose.foundation.layout.Box
+import androidx.compose.foundation.layout.Column
+import androidx.compose.foundation.layout.PaddingValues
+import androidx.compose.ui.Modifier
+import androidx.compose.foundation.layout.Spacer
+import androidx.compose.foundation.layout.fillMaxSize
+import androidx.compose.foundation.layout.height
+import androidx.compose.foundation.layout.padding
+import androidx.compose.material3.Button
+import androidx.compose.material3.CenterAlignedTopAppBar
+import androidx.compose.material3.ExperimentalMaterial3Api
+import androidx.compose.material3.MaterialTheme
+import androidx.compose.material3.Scaffold
+import androidx.compose.material3.Text
+import androidx.compose.material3.TopAppBarDefaults
+import androidx.compose.runtime.Composable
+import androidx.compose.runtime.getValue
+import androidx.compose.runtime.mutableStateOf
+import androidx.compose.runtime.remember
+import androidx.compose.runtime.setValue
+import androidx.compose.ui.Alignment
+import androidx.compose.ui.platform.LocalContext
+import androidx.compose.ui.text.font.FontWeight
+import androidx.compose.ui.unit.dp
+import androidx.compose.ui.unit.sp
+import androidx.core.app.ActivityCompat
+import kotlin.concurrent.thread
+
+/**
+ * Top-level screen: a scaffold with a centered title bar whose content
+ * area is filled by [MyApp].
+ */
+@Composable
+fun Home() {
+    Scaffold(
+        topBar = {
+            // Bar colors are taken from the current Material color scheme.
+            val barColors = TopAppBarDefaults.topAppBarColors(
+                containerColor = MaterialTheme.colorScheme.primaryContainer,
+                titleContentColor = MaterialTheme.colorScheme.primary,
+            )
+            CenterAlignedTopAppBar(
+                title = {
+                    Text(
+                        text = "Next-gen Kaldi: Spoken language identification",
+                        fontSize = 13.sp,
+                        fontWeight = FontWeight.Bold,
+                    )
+                },
+                colors = barColors,
+            )
+        },
+    ) { innerPadding ->
+        // Forward the scaffold's insets so the content is not drawn under the bar.
+        MyApp(innerPadding)
+    }
+}
+
+private var audioRecord: AudioRecord? = null
+private val sampleRateInHz = 16000
+
+/**
+ * Screen body: a Start/Stop button and, once available, the detected language.
+ *
+ * Pressing "Start" opens the microphone and buffers audio on a background
+ * thread. Pressing "Stop" ends the capture; the buffered samples are then
+ * passed to [Slid.slid] and the outcome is written to the displayed result.
+ *
+ * @param padding padding applied to the content column (the caller passes
+ *   the scaffold's content padding).
+ */
+@Composable
+fun MyApp(padding: PaddingValues) {
+    val activity = LocalContext.current as Activity
+    var isStarted by remember { mutableStateOf(false) }
+    var result by remember { mutableStateOf("") }
+
+    val onButtonClick: () -> Unit = {
+        isStarted = !isStarted
+        if (isStarted) {
+            result = ""
+            if (ActivityCompat.checkSelfPermission(
+                    activity,
+                    Manifest.permission.RECORD_AUDIO
+                ) != PackageManager.PERMISSION_GRANTED
+            ) {
+                Log.i(TAG, "Recording is not allowed")
+                // Nothing is being recorded, so do not leave the button on "Stop".
+                isStarted = false
+            } else {
+                val audioSource = MediaRecorder.AudioSource.MIC
+                val channelConfig = AudioFormat.CHANNEL_IN_MONO
+                val audioFormat = AudioFormat.ENCODING_PCM_16BIT
+                val numBytes =
+                    AudioRecord.getMinBufferSize(sampleRateInHz, channelConfig, audioFormat)
+
+                // Keep a local reference: the worker below must keep using this
+                // instance even if the file-level variable is reassigned later.
+                val recorder = AudioRecord(
+                    audioSource,
+                    sampleRateInHz,
+                    channelConfig,
+                    audioFormat,
+                    numBytes * 2 // a sample has two bytes as we are using 16-bit PCM
+                )
+                audioRecord = recorder
+
+                thread(true) {
+                    Log.i(TAG, "processing samples")
+                    val interval = 0.1 // i.e., 100 ms
+                    val bufferSize = (interval * sampleRateInHz).toInt() // in samples
+                    val buffer = ShortArray(bufferSize)
+                    val sampleList = ArrayList<FloatArray>()
+                    try {
+                        recorder.startRecording()
+                        while (isStarted) {
+                            val n = recorder.read(buffer, 0, buffer.size)
+                            if (n < 0) {
+                                // read() reports failures as negative codes; using
+                                // one as an array size would throw.
+                                Log.e(TAG, "AudioRecord.read failed: $n")
+                                isStarted = false
+                                break
+                            }
+                            if (n > 0) {
+                                // Scale 16-bit PCM to floats in [-1, 1).
+                                sampleList.add(FloatArray(n) { buffer[it] / 32768.0f })
+                            }
+                        }
+                    } finally {
+                        // Always give the microphone back, even on an exception.
+                        if (recorder.recordingState == AudioRecord.RECORDSTATE_RECORDING) {
+                            recorder.stop()
+                        }
+                        recorder.release()
+                        if (audioRecord === recorder) {
+                            audioRecord = null
+                        }
+                    }
+                    Log.i(TAG, "Stop recording")
+                    Log.i(TAG, "Start recognition")
+                    val samples = Flatten(sampleList)
+                    val stream = Slid.slid.createStream()
+                    stream.acceptWaveform(samples, sampleRateInHz)
+                    val lang = Slid.slid.compute(stream)
+
+                    // Show the display name when the code is known, else the raw code.
+                    result = Slid.localeMap[lang] ?: lang
+
+                    stream.release()
+                }
+            }
+        }
+    }
+
+    Box(
+        modifier = Modifier.fillMaxSize(),
+        contentAlignment = Alignment.TopCenter
+    ) {
+        Column(
+            Modifier.padding(padding),
+            horizontalAlignment = Alignment.CenterHorizontally,
+        ) {
+            Spacer(modifier = Modifier.height(16.dp))
+            Button(onClick = onButtonClick) {
+                if (isStarted) {
+                    Text("Stop")
+                } else {
+                    Text("Start")
+                }
+            }
+
+            Spacer(modifier = Modifier.height(16.dp))
+            // isNotBlank() already implies isNotEmpty().
+            if (result.isNotBlank()) {
+                Text("Detected language: $result")
+            }
+        }
+    }
+}
+
+/**
+ * Concatenates a list of sample chunks into one contiguous array.
+ *
+ * @param sampleList chunks to join, in the order they should appear
+ * @return a new array containing every element of every chunk, in order;
+ *   empty when [sampleList] is empty
+ */
+fun Flatten(sampleList: ArrayList<FloatArray>): FloatArray {
+    val totalSamples = sampleList.sumOf { it.size }
+    val samples = FloatArray(totalSamples)
+    var i = 0
+    for (a in sampleList) {
+        // Bulk-copy the chunk to its offset instead of element by element.
+        a.copyInto(samples, destinationOffset = i)
+        i += a.size
+    }
+    Log.i(TAG, "$i, $totalSamples")
+
+    return samples
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/MainActivity.kt b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/MainActivity.kt
new file mode 100644
index 00000000..dfbcba16
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/MainActivity.kt
@@ -0,0 +1,74 @@
+package com.k2fsa.sherpa.onnx.slid
+
+import android.Manifest
+import android.content.pm.PackageManager
+import android.os.Bundle
+import android.util.Log
+import android.widget.Toast
+import androidx.activity.ComponentActivity
+import androidx.activity.compose.setContent
+import androidx.compose.foundation.layout.fillMaxSize
+import androidx.compose.material3.MaterialTheme
+import androidx.compose.material3.Surface
+import androidx.compose.material3.Text
+import androidx.compose.runtime.Composable
+import androidx.compose.ui.Modifier
+import androidx.compose.ui.tooling.preview.Preview
+import androidx.core.app.ActivityCompat
+import com.k2fsa.sherpa.onnx.SpokenLanguageIdentification
+import com.k2fsa.sherpa.onnx.slid.ui.theme.SherpaOnnxSpokenLanguageIdentificationTheme
+
+const val TAG = "sherpa-onnx"
+private const val REQUEST_RECORD_AUDIO_PERMISSION = 200
+
+/**
+ * The app's activity: sets the Compose content, asks for the microphone
+ * permission and initializes the shared [Slid] instance from the app assets.
+ */
+class MainActivity : ComponentActivity() {
+    private val permissions: Array<String> = arrayOf(Manifest.permission.RECORD_AUDIO)
+
+    override fun onCreate(savedInstanceState: Bundle?) {
+        super.onCreate(savedInstanceState)
+        setContent {
+            SpokenLanguageIdentificationApp()
+        }
+        ActivityCompat.requestPermissions(this, permissions, REQUEST_RECORD_AUDIO_PERMISSION)
+        Slid.initSlid(this.assets)
+    }
+
+    /**
+     * Closes the activity unless the RECORD_AUDIO request was granted.
+     */
+    @Suppress("DEPRECATION")
+    @Deprecated("Deprecated in Java")
+    override fun onRequestPermissionsResult(
+        requestCode: Int,
+        permissions: Array<String>,
+        grantResults: IntArray
+    ) {
+        super.onRequestPermissionsResult(requestCode, permissions, grantResults)
+        // grantResults can be empty when the request is interrupted; treat
+        // that as a denial instead of indexing into an empty array.
+        val permissionToRecordAccepted =
+            requestCode == REQUEST_RECORD_AUDIO_PERMISSION &&
+                grantResults.firstOrNull() == PackageManager.PERMISSION_GRANTED
+
+        if (!permissionToRecordAccepted) {
+            Log.e(TAG, "Audio record is disallowed")
+            Toast.makeText(
+                this,
+                "This App needs access to the microphone",
+                Toast.LENGTH_SHORT
+            )
+                .show()
+            finish()
+            // Do not fall through to the "permitted" log line below.
+            return
+        }
+        Log.i(TAG, "Audio record is permitted")
+    }
+}
+
+/**
+ * Root composable: shows [Home] on a full-size surface painted with the
+ * theme's background color, inside the app theme.
+ */
+@Composable
+fun SpokenLanguageIdentificationApp() {
+    SherpaOnnxSpokenLanguageIdentificationTheme {
+        // Resolved inside the theme so the themed color scheme is the one read.
+        val backgroundColor = MaterialTheme.colorScheme.background
+        Surface(modifier = Modifier.fillMaxSize(), color = backgroundColor) {
+            Home()
+        }
+    }
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/OfflineStream.kt b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/OfflineStream.kt
new file mode 120000
index 00000000..1a5dfc31
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/OfflineStream.kt
@@ -0,0 +1 @@
+../../../../../../../../../../SherpaOnnxAudioTagging/app/src/main/java/com/k2fsa/sherpa/onnx/audio/tagging/OfflineStream.kt
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/SpokenLanguageIdentification.kt b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/SpokenLanguageIdentification.kt
new file mode 100644
index 00000000..fedf9d65
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/SpokenLanguageIdentification.kt
@@ -0,0 +1,102 @@
+package com.k2fsa.sherpa.onnx
+
+import android.content.res.AssetManager
+import android.util.Log
+
+private val TAG = "sherpa-onnx"
+
+/**
+ * Whisper model settings used for spoken language identification.
+ *
+ * @property encoder path of the encoder model file
+ * @property decoder path of the decoder model file
+ * @property tailPaddings defaults to -1.
+ *   NOTE(review): presumably -1 lets the native side pick its own value - confirm.
+ */
+data class SpokenLanguageIdentificationWhisperConfig (
+ var encoder: String,
+ var decoder: String,
+ var tailPaddings: Int = -1,
+)
+
+/**
+ * Configuration passed to [SpokenLanguageIdentification] on construction.
+ *
+ * @property whisper the Whisper model files to use
+ * @property numThreads defaults to 1.
+ *   NOTE(review): presumably the inference thread count - confirm.
+ * @property debug defaults to false.
+ *   NOTE(review): presumably enables extra native logging - confirm.
+ * @property provider defaults to "cpu".
+ *   NOTE(review): presumably the execution provider name - confirm.
+ */
+data class SpokenLanguageIdentificationConfig (
+ var whisper: SpokenLanguageIdentificationWhisperConfig,
+ var numThreads: Int = 1,
+ var debug: Boolean = false,
+ var provider: String = "cpu",
+)
+
+/**
+ * Kotlin wrapper around the spoken language identification functions of the
+ * "sherpa-onnx-jni" native library.
+ *
+ * @param assetManager when non-null the instance is created with
+ *   [newFromAsset], otherwise with [newFromFile]
+ * @param config configuration forwarded to the native constructor
+ */
+class SpokenLanguageIdentification (
+ assetManager: AssetManager? = null,
+ config: SpokenLanguageIdentificationConfig,
+) {
+ // Value returned by the native constructor; reset to 0 once deleted.
+ private var ptr: Long
+
+ init {
+ ptr = if (assetManager != null) {
+ newFromAsset(assetManager, config)
+ } else {
+ newFromFile(config)
+ }
+ }
+
+ // Deletes the native object once; the zero check makes repeated calls harmless.
+ protected fun finalize() {
+ if (ptr != 0L) {
+ delete(ptr)
+ ptr = 0
+ }
+ }
+
+ /** Deletes the native object now; same effect as [finalize]. */
+ fun release() = finalize()
+
+ /** Asks the native side for a new stream and wraps the returned value. */
+ fun createStream(): OfflineStream {
+ val p = createStream(ptr)
+ return OfflineStream(p)
+ }
+
+ /**
+ * Runs the native computation on [stream] and returns its string result.
+ * NOTE(review): presumably a language code - callers look it up in a map
+ * keyed by ISO language codes; confirm.
+ */
+ fun compute(stream: OfflineStream) = compute(ptr, stream.ptr)
+
+ // Native entry points implemented by the JNI library loaded below.
+ private external fun newFromAsset(
+ assetManager: AssetManager,
+ config: SpokenLanguageIdentificationConfig,
+ ): Long
+
+ private external fun newFromFile(
+ config: SpokenLanguageIdentificationConfig,
+ ): Long
+
+ private external fun delete(ptr: Long)
+
+ private external fun createStream(ptr: Long): Long
+
+ private external fun compute(ptr: Long, streamPtr: Long): String
+
+ companion object {
+ // Load the native library the first time this class is used.
+ init {
+ System.loadLibrary("sherpa-onnx-jni")
+ }
+ }
+}
+// please refer to
+// https://k2-fsa.github.io/sherpa/onnx/spoken-language-identification/pretrained_models.html#whisper
+// to download more models
+/**
+ * Builds the configuration for one of the known Whisper models.
+ *
+ * @param type 0 selects "sherpa-onnx-whisper-tiny", 1 selects
+ *   "sherpa-onnx-whisper-base"
+ * @param numThreads value stored in the returned config's `numThreads`
+ * @return the configuration (with `debug` enabled), or null when [type]
+ *   is not one of the values above
+ */
+fun getSpokenLanguageIdentificationConfig(type: Int, numThreads: Int = 1): SpokenLanguageIdentificationConfig? {
+    // Model directory and the file-name prefix used inside that directory.
+    val (modelDir, prefix) = when (type) {
+        0 -> "sherpa-onnx-whisper-tiny" to "tiny"
+        1 -> "sherpa-onnx-whisper-base" to "base"
+        else -> return null
+    }
+
+    return SpokenLanguageIdentificationConfig(
+        whisper = SpokenLanguageIdentificationWhisperConfig(
+            encoder = "$modelDir/$prefix-encoder.int8.onnx",
+            decoder = "$modelDir/$prefix-decoder.int8.onnx",
+        ),
+        // Honor the caller's thread count for every model type.
+        numThreads = numThreads,
+        debug = true,
+    )
+}
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/slid.kt b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/slid.kt
new file mode 100644
index 00000000..60c51170
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/slid.kt
@@ -0,0 +1,42 @@
+package com.k2fsa.sherpa.onnx.slid
+
+import android.content.res.AssetManager
+import android.util.Log
+import com.k2fsa.sherpa.onnx.SpokenLanguageIdentification
+import com.k2fsa.sherpa.onnx.getSpokenLanguageIdentificationConfig
+import java.util.Locale
+
+
+/**
+ * Process-wide holder of the [SpokenLanguageIdentification] instance and of
+ * a map from ISO language code to display name. Call [initSlid] before
+ * reading [slid].
+ */
+object Slid {
+ private var _slid: SpokenLanguageIdentification? = null
+
+ // NOTE(review): type arguments look stripped here and on localeMap below;
+ // presumably <String, String> (code -> display name) - confirm.
+ private var _localeMap = mutableMapOf()
+ // Throws NullPointerException when read before initSlid() has run.
+ val slid: SpokenLanguageIdentification
+ get() {
+ return _slid!!
+ }
+ // Read-only view of the language-code -> display-name map.
+ val localeMap : Map
+ get() {
+ return _localeMap
+ }
+
+ /**
+ * Creates the identifier (model type 0) and fills the locale map; each part
+ * is skipped when already done, so repeated calls are cheap. The whole body
+ * runs under a lock on this object.
+ *
+ * @param assetManager forwarded to the [SpokenLanguageIdentification] constructor
+ * @param numThreads forwarded to getSpokenLanguageIdentificationConfig
+ */
+ fun initSlid(assetManager: AssetManager? = null, numThreads: Int = 1) {
+ synchronized(this) {
+ if (_slid == null) {
+
+ Log.i(TAG, "Initializing slid")
+ val config =
+ getSpokenLanguageIdentificationConfig(type = 0, numThreads = numThreads)!!
+ _slid = SpokenLanguageIdentification(assetManager, config)
+ }
+
+ if (_localeMap.isEmpty()) {
+ // One entry per ISO language code known to java.util.Locale.
+ val allLang = Locale.getISOLanguages();
+ for (lang in allLang) {
+ val locale = Locale(lang)
+ _localeMap[lang] = locale.displayName
+ }
+ }
+ }
+ }
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/ui/theme/Color.kt b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/ui/theme/Color.kt
new file mode 100644
index 00000000..cbfdfd17
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/ui/theme/Color.kt
@@ -0,0 +1,11 @@
+package com.k2fsa.sherpa.onnx.slid.ui.theme
+
+import androidx.compose.ui.graphics.Color
+
+val Purple80 = Color(0xFFD0BCFF)
+val PurpleGrey80 = Color(0xFFCCC2DC)
+val Pink80 = Color(0xFFEFB8C8)
+
+val Purple40 = Color(0xFF6650a4)
+val PurpleGrey40 = Color(0xFF625b71)
+val Pink40 = Color(0xFF7D5260)
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/ui/theme/Theme.kt b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/ui/theme/Theme.kt
new file mode 100644
index 00000000..02f83371
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/ui/theme/Theme.kt
@@ -0,0 +1,70 @@
+package com.k2fsa.sherpa.onnx.slid.ui.theme
+
+import android.app.Activity
+import android.os.Build
+import androidx.compose.foundation.isSystemInDarkTheme
+import androidx.compose.material3.MaterialTheme
+import androidx.compose.material3.darkColorScheme
+import androidx.compose.material3.dynamicDarkColorScheme
+import androidx.compose.material3.dynamicLightColorScheme
+import androidx.compose.material3.lightColorScheme
+import androidx.compose.runtime.Composable
+import androidx.compose.runtime.SideEffect
+import androidx.compose.ui.graphics.toArgb
+import androidx.compose.ui.platform.LocalContext
+import androidx.compose.ui.platform.LocalView
+import androidx.core.view.WindowCompat
+
+private val DarkColorScheme = darkColorScheme(
+ primary = Purple80,
+ secondary = PurpleGrey80,
+ tertiary = Pink80
+)
+
+private val LightColorScheme = lightColorScheme(
+ primary = Purple40,
+ secondary = PurpleGrey40,
+ tertiary = Pink40
+
+ /* Other default colors to override
+ background = Color(0xFFFFFBFE),
+ surface = Color(0xFFFFFBFE),
+ onPrimary = Color.White,
+ onSecondary = Color.White,
+ onTertiary = Color.White,
+ onBackground = Color(0xFF1C1B1F),
+ onSurface = Color(0xFF1C1B1F),
+ */
+)
+
+/**
+ * App theme: chooses a color scheme and applies it, together with the app
+ * typography, to [content] through MaterialTheme.
+ *
+ * @param darkTheme whether to use the dark variant; defaults to the system setting
+ * @param dynamicColor whether to use the dynamic color schemes when the
+ *   device API level is at least Build.VERSION_CODES.S
+ * @param content the composable content to theme
+ */
+@Composable
+fun SherpaOnnxSpokenLanguageIdentificationTheme(
+ darkTheme: Boolean = isSystemInDarkTheme(),
+ // Dynamic color is available on Android 12+
+ dynamicColor: Boolean = true,
+ content: @Composable () -> Unit
+) {
+ // Dynamic scheme when requested and supported, otherwise the static ones.
+ val colorScheme = when {
+ dynamicColor && Build.VERSION.SDK_INT >= Build.VERSION_CODES.S -> {
+ val context = LocalContext.current
+ if (darkTheme) dynamicDarkColorScheme(context) else dynamicLightColorScheme(context)
+ }
+
+ darkTheme -> DarkColorScheme
+ else -> LightColorScheme
+ }
+ val view = LocalView.current
+ // Skip the window changes when the view reports edit mode.
+ if (!view.isInEditMode) {
+ SideEffect {
+ // Tint the status bar with the primary color and set its icon appearance.
+ val window = (view.context as Activity).window
+ window.statusBarColor = colorScheme.primary.toArgb()
+ WindowCompat.getInsetsController(window, view).isAppearanceLightStatusBars = darkTheme
+ }
+ }
+
+ MaterialTheme(
+ colorScheme = colorScheme,
+ typography = Typography,
+ content = content
+ )
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/ui/theme/Type.kt b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/ui/theme/Type.kt
new file mode 100644
index 00000000..48bb5ae9
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/ui/theme/Type.kt
@@ -0,0 +1,34 @@
+package com.k2fsa.sherpa.onnx.slid.ui.theme
+
+import androidx.compose.material3.Typography
+import androidx.compose.ui.text.TextStyle
+import androidx.compose.ui.text.font.FontFamily
+import androidx.compose.ui.text.font.FontWeight
+import androidx.compose.ui.unit.sp
+
+// Set of Material typography styles to start with
+val Typography = Typography(
+ bodyLarge = TextStyle(
+ fontFamily = FontFamily.Default,
+ fontWeight = FontWeight.Normal,
+ fontSize = 16.sp,
+ lineHeight = 24.sp,
+ letterSpacing = 0.5.sp
+ )
+ /* Other default text styles to override
+ titleLarge = TextStyle(
+ fontFamily = FontFamily.Default,
+ fontWeight = FontWeight.Normal,
+ fontSize = 22.sp,
+ lineHeight = 28.sp,
+ letterSpacing = 0.sp
+ ),
+ labelSmall = TextStyle(
+ fontFamily = FontFamily.Default,
+ fontWeight = FontWeight.Medium,
+ fontSize = 11.sp,
+ lineHeight = 16.sp,
+ letterSpacing = 0.5.sp
+ )
+ */
+)
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/jniLibs/arm64-v8a/.gitignore b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/jniLibs/arm64-v8a/.gitignore
new file mode 100644
index 00000000..e69de29b
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/jniLibs/armeabi-v7a/.gitignore b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/jniLibs/armeabi-v7a/.gitignore
new file mode 100644
index 00000000..e69de29b
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/jniLibs/x86/.gitignore b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/jniLibs/x86/.gitignore
new file mode 100644
index 00000000..e69de29b
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/jniLibs/x86_64/.gitignore b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/jniLibs/x86_64/.gitignore
new file mode 100644
index 00000000..e69de29b
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/drawable-v24/ic_launcher_foreground.xml b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/drawable-v24/ic_launcher_foreground.xml
new file mode 100644
index 00000000..2b068d11
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/drawable-v24/ic_launcher_foreground.xml
@@ -0,0 +1,30 @@
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/drawable/ic_launcher_background.xml b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/drawable/ic_launcher_background.xml
new file mode 100644
index 00000000..07d5da9c
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/drawable/ic_launcher_background.xml
@@ -0,0 +1,170 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-anydpi-v26/ic_launcher.xml b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-anydpi-v26/ic_launcher.xml
new file mode 100644
index 00000000..6f3b755b
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-anydpi-v26/ic_launcher.xml
@@ -0,0 +1,6 @@
+
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml
new file mode 100644
index 00000000..6f3b755b
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml
@@ -0,0 +1,6 @@
+
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-hdpi/ic_launcher.webp b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-hdpi/ic_launcher.webp
new file mode 100644
index 00000000..c209e78e
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-hdpi/ic_launcher.webp differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-hdpi/ic_launcher_round.webp b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-hdpi/ic_launcher_round.webp
new file mode 100644
index 00000000..b2dfe3d1
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-hdpi/ic_launcher_round.webp differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-mdpi/ic_launcher.webp b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-mdpi/ic_launcher.webp
new file mode 100644
index 00000000..4f0f1d64
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-mdpi/ic_launcher.webp differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-mdpi/ic_launcher_round.webp b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-mdpi/ic_launcher_round.webp
new file mode 100644
index 00000000..62b611da
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-mdpi/ic_launcher_round.webp differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xhdpi/ic_launcher.webp b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xhdpi/ic_launcher.webp
new file mode 100644
index 00000000..948a3070
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xhdpi/ic_launcher.webp differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xhdpi/ic_launcher_round.webp b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xhdpi/ic_launcher_round.webp
new file mode 100644
index 00000000..1b9a6956
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xhdpi/ic_launcher_round.webp differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxhdpi/ic_launcher.webp b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxhdpi/ic_launcher.webp
new file mode 100644
index 00000000..28d4b77f
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxhdpi/ic_launcher.webp differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.webp b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.webp
new file mode 100644
index 00000000..9287f508
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.webp differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxxhdpi/ic_launcher.webp b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxxhdpi/ic_launcher.webp
new file mode 100644
index 00000000..aa7d6427
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxxhdpi/ic_launcher.webp differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.webp b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.webp
new file mode 100644
index 00000000..9126ae37
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.webp differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/values/colors.xml b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/values/colors.xml
new file mode 100644
index 00000000..f8c6127d
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/values/colors.xml
@@ -0,0 +1,10 @@
+
+
+ #FFBB86FC
+ #FF6200EE
+ #FF3700B3
+ #FF03DAC5
+ #FF018786
+ #FF000000
+ #FFFFFFFF
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/values/strings.xml b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/values/strings.xml
new file mode 100644
index 00000000..f0a3e3a4
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/values/strings.xml
@@ -0,0 +1,3 @@
+
+ SherpaOnnxSpokenLanguageIdentification
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/values/themes.xml b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/values/themes.xml
new file mode 100644
index 00000000..07b6588b
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/values/themes.xml
@@ -0,0 +1,5 @@
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/xml/backup_rules.xml b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/xml/backup_rules.xml
new file mode 100644
index 00000000..fa0f996d
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/xml/backup_rules.xml
@@ -0,0 +1,13 @@
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/xml/data_extraction_rules.xml b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/xml/data_extraction_rules.xml
new file mode 100644
index 00000000..9ee9997b
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/main/res/xml/data_extraction_rules.xml
@@ -0,0 +1,19 @@
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/app/src/test/java/com/k2fsa/sherpa/onnx/slid/ExampleUnitTest.kt b/android/SherpaOnnxSpokenLanguageIdentification/app/src/test/java/com/k2fsa/sherpa/onnx/slid/ExampleUnitTest.kt
new file mode 100644
index 00000000..e6d048a8
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/app/src/test/java/com/k2fsa/sherpa/onnx/slid/ExampleUnitTest.kt
@@ -0,0 +1,17 @@
+package com.k2fsa.sherpa.onnx.slid
+
+import org.junit.Test
+
+import org.junit.Assert.*
+
+/**
+ * Example local unit test, which will execute on the development machine (host).
+ *
+ * See [testing documentation](http://d.android.com/tools/testing).
+ */
+class ExampleUnitTest {
+ /** Placeholder check: asserts that 2 + 2 equals 4. */
+ @Test
+ fun addition_isCorrect() {
+ assertEquals(4, 2 + 2)
+ }
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/build.gradle.kts b/android/SherpaOnnxSpokenLanguageIdentification/build.gradle.kts
new file mode 100644
index 00000000..8e8f4ab9
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/build.gradle.kts
@@ -0,0 +1,5 @@
+// Top-level build file where you can add configuration options common to all sub-projects/modules.
+plugins {
+ id("com.android.application") version "8.2.0" apply false
+ id("org.jetbrains.kotlin.android") version "1.9.0" apply false
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/gradle.properties b/android/SherpaOnnxSpokenLanguageIdentification/gradle.properties
new file mode 100644
index 00000000..3c5031eb
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/gradle.properties
@@ -0,0 +1,23 @@
+# Project-wide Gradle settings.
+# IDE (e.g. Android Studio) users:
+# Gradle settings configured through the IDE *will override*
+# any settings specified in this file.
+# For more details on how to configure your build environment visit
+# http://www.gradle.org/docs/current/userguide/build_environment.html
+# Specifies the JVM arguments used for the daemon process.
+# The setting is particularly useful for tweaking memory settings.
+org.gradle.jvmargs=-Xmx2048m -Dfile.encoding=UTF-8
+# When configured, Gradle will run in incubating parallel mode.
+# This option should only be used with decoupled projects. More details, visit
+# http://www.gradle.org/docs/current/userguide/multi_project_builds.html#sec:decoupled_projects
+# org.gradle.parallel=true
+# AndroidX package structure to make it clearer which packages are bundled with the
+# Android operating system, and which are packaged with your app's APK
+# https://developer.android.com/topic/libraries/support-library/androidx-rn
+android.useAndroidX=true
+# Kotlin code style for this project: "official" or "obsolete":
+kotlin.code.style=official
+# Enables namespacing of each library's R class so that its R class includes only the
+# resources declared in the library itself and none from the library's dependencies,
+# thereby reducing the size of the R class for that library
+android.nonTransitiveRClass=true
\ No newline at end of file
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/gradle/wrapper/gradle-wrapper.jar b/android/SherpaOnnxSpokenLanguageIdentification/gradle/wrapper/gradle-wrapper.jar
new file mode 100644
index 00000000..e708b1c0
Binary files /dev/null and b/android/SherpaOnnxSpokenLanguageIdentification/gradle/wrapper/gradle-wrapper.jar differ
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/gradle/wrapper/gradle-wrapper.properties b/android/SherpaOnnxSpokenLanguageIdentification/gradle/wrapper/gradle-wrapper.properties
new file mode 100644
index 00000000..731fe5a7
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/gradle/wrapper/gradle-wrapper.properties
@@ -0,0 +1,6 @@
+#Wed Apr 17 19:48:00 CST 2024
+distributionBase=GRADLE_USER_HOME
+distributionPath=wrapper/dists
+distributionUrl=https\://services.gradle.org/distributions/gradle-8.2-bin.zip
+zipStoreBase=GRADLE_USER_HOME
+zipStorePath=wrapper/dists
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/gradlew b/android/SherpaOnnxSpokenLanguageIdentification/gradlew
new file mode 100755
index 00000000..4f906e0c
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/gradlew
@@ -0,0 +1,185 @@
+#!/usr/bin/env sh
+
+#
+# Copyright 2015 the original author or authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+##############################################################################
+##
+## Gradle start up script for UN*X
+##
+##############################################################################
+
+# Attempt to set APP_HOME
+# Resolve links: $0 may be a link
+PRG="$0"
+# Need this for relative symlinks.
+while [ -h "$PRG" ] ; do
+ ls=`ls -ld "$PRG"`
+ link=`expr "$ls" : '.*-> \(.*\)$'`
+ if expr "$link" : '/.*' > /dev/null; then
+ PRG="$link"
+ else
+ PRG=`dirname "$PRG"`"/$link"
+ fi
+done
+SAVED="`pwd`"
+cd "`dirname \"$PRG\"`/" >/dev/null
+APP_HOME="`pwd -P`"
+cd "$SAVED" >/dev/null
+
+APP_NAME="Gradle"
+APP_BASE_NAME=`basename "$0"`
+
+# Add default JVM options here. You can also use JAVA_OPTS and GRADLE_OPTS to pass JVM options to this script.
+DEFAULT_JVM_OPTS='"-Xmx64m" "-Xms64m"'
+
+# Use the maximum available, or set MAX_FD != -1 to use that value.
+MAX_FD="maximum"
+
+# Print all arguments, joined into one message, on standard output.
+warn () {
+ echo "$*"
+}
+
+# Print all arguments as one message framed by blank lines, then terminate
+# the script with exit status 1.
+die () {
+ echo
+ echo "$*"
+ echo
+ exit 1
+}
+
+# OS specific support (must be 'true' or 'false').
+cygwin=false
+msys=false
+darwin=false
+nonstop=false
+case "`uname`" in
+ CYGWIN* )
+ cygwin=true
+ ;;
+ Darwin* )
+ darwin=true
+ ;;
+ MINGW* )
+ msys=true
+ ;;
+ NONSTOP* )
+ nonstop=true
+ ;;
+esac
+
+CLASSPATH=$APP_HOME/gradle/wrapper/gradle-wrapper.jar
+
+
+# Determine the Java command to use to start the JVM.
+if [ -n "$JAVA_HOME" ] ; then
+ if [ -x "$JAVA_HOME/jre/sh/java" ] ; then
+ # IBM's JDK on AIX uses strange locations for the executables
+ JAVACMD="$JAVA_HOME/jre/sh/java"
+ else
+ JAVACMD="$JAVA_HOME/bin/java"
+ fi
+ if [ ! -x "$JAVACMD" ] ; then
+ die "ERROR: JAVA_HOME is set to an invalid directory: $JAVA_HOME
+
+Please set the JAVA_HOME variable in your environment to match the
+location of your Java installation."
+ fi
+else
+ JAVACMD="java"
+ which java >/dev/null 2>&1 || die "ERROR: JAVA_HOME is not set and no 'java' command could be found in your PATH.
+
+Please set the JAVA_HOME variable in your environment to match the
+location of your Java installation."
+fi
+
+# Increase the maximum file descriptors if we can.
+if [ "$cygwin" = "false" -a "$darwin" = "false" -a "$nonstop" = "false" ] ; then
+ MAX_FD_LIMIT=`ulimit -H -n`
+ if [ $? -eq 0 ] ; then
+ if [ "$MAX_FD" = "maximum" -o "$MAX_FD" = "max" ] ; then
+ MAX_FD="$MAX_FD_LIMIT"
+ fi
+ ulimit -n $MAX_FD
+ if [ $? -ne 0 ] ; then
+ warn "Could not set maximum file descriptor limit: $MAX_FD"
+ fi
+ else
+ warn "Could not query maximum file descriptor limit: $MAX_FD_LIMIT"
+ fi
+fi
+
+# For Darwin, add options to specify how the application appears in the dock
+if $darwin; then
+ GRADLE_OPTS="$GRADLE_OPTS \"-Xdock:name=$APP_NAME\" \"-Xdock:icon=$APP_HOME/media/gradle.icns\""
+fi
+
+# For Cygwin or MSYS, switch paths to Windows format before running java
+if [ "$cygwin" = "true" -o "$msys" = "true" ] ; then
+ APP_HOME=`cygpath --path --mixed "$APP_HOME"`
+ CLASSPATH=`cygpath --path --mixed "$CLASSPATH"`
+
+ JAVACMD=`cygpath --unix "$JAVACMD"`
+
+ # We build the pattern for arguments to be converted via cygpath
+ ROOTDIRSRAW=`find -L / -maxdepth 1 -mindepth 1 -type d 2>/dev/null`
+ SEP=""
+ for dir in $ROOTDIRSRAW ; do
+ ROOTDIRS="$ROOTDIRS$SEP$dir"
+ SEP="|"
+ done
+ OURCYGPATTERN="(^($ROOTDIRS))"
+ # Add a user-defined pattern to the cygpath arguments
+ if [ "$GRADLE_CYGPATTERN" != "" ] ; then
+ OURCYGPATTERN="$OURCYGPATTERN|($GRADLE_CYGPATTERN)"
+ fi
+ # Now convert the arguments - kludge to limit ourselves to /bin/sh
+ i=0
+ for arg in "$@" ; do
+ CHECK=`echo "$arg"|egrep -c "$OURCYGPATTERN" -`
+ CHECK2=`echo "$arg"|egrep -c "^-"` ### Determine if an option
+
+ if [ $CHECK -ne 0 ] && [ $CHECK2 -eq 0 ] ; then ### Added a condition
+ eval `echo args$i`=`cygpath --path --ignore --mixed "$arg"`
+ else
+ eval `echo args$i`="\"$arg\""
+ fi
+ i=`expr $i + 1`
+ done
+ case $i in
+ 0) set -- ;;
+ 1) set -- "$args0" ;;
+ 2) set -- "$args0" "$args1" ;;
+ 3) set -- "$args0" "$args1" "$args2" ;;
+ 4) set -- "$args0" "$args1" "$args2" "$args3" ;;
+ 5) set -- "$args0" "$args1" "$args2" "$args3" "$args4" ;;
+ 6) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" ;;
+ 7) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" ;;
+ 8) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" "$args7" ;;
+ 9) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" "$args7" "$args8" ;;
+ esac
+fi
+
+# Escape application args.
+# For each argument, print it wrapped in single quotes (an embedded single
+# quote becomes '\'') and followed by " \", then print a final " ".
+# The output is stored in APP_ARGS and re-parsed by the `eval set --` line
+# further down.
+save () {
+ for i do printf %s\\n "$i" | sed "s/'/'\\\\''/g;1s/^/'/;\$s/\$/' \\\\/" ; done
+ echo " "
+}
+APP_ARGS=`save "$@"`
+
+# Collect all arguments for the java command, following the shell quoting and substitution rules
+eval set -- $DEFAULT_JVM_OPTS $JAVA_OPTS $GRADLE_OPTS "\"-Dorg.gradle.appname=$APP_BASE_NAME\"" -classpath "\"$CLASSPATH\"" org.gradle.wrapper.GradleWrapperMain "$APP_ARGS"
+
+exec "$JAVACMD" "$@"
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/gradlew.bat b/android/SherpaOnnxSpokenLanguageIdentification/gradlew.bat
new file mode 100644
index 00000000..ac1b06f9
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/gradlew.bat
@@ -0,0 +1,89 @@
+@rem
+@rem Copyright 2015 the original author or authors.
+@rem
+@rem Licensed under the Apache License, Version 2.0 (the "License");
+@rem you may not use this file except in compliance with the License.
+@rem You may obtain a copy of the License at
+@rem
+@rem https://www.apache.org/licenses/LICENSE-2.0
+@rem
+@rem Unless required by applicable law or agreed to in writing, software
+@rem distributed under the License is distributed on an "AS IS" BASIS,
+@rem WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+@rem See the License for the specific language governing permissions and
+@rem limitations under the License.
+@rem
+
+@if "%DEBUG%" == "" @echo off
+@rem ##########################################################################
+@rem
+@rem Gradle startup script for Windows
+@rem
+@rem ##########################################################################
+
+@rem Set local scope for the variables with windows NT shell
+if "%OS%"=="Windows_NT" setlocal
+
+set DIRNAME=%~dp0
+if "%DIRNAME%" == "" set DIRNAME=.
+set APP_BASE_NAME=%~n0
+set APP_HOME=%DIRNAME%
+
+@rem Resolve any "." and ".." in APP_HOME to make it shorter.
+for %%i in ("%APP_HOME%") do set APP_HOME=%%~fi
+
+@rem Add default JVM options here. You can also use JAVA_OPTS and GRADLE_OPTS to pass JVM options to this script.
+set DEFAULT_JVM_OPTS="-Xmx64m" "-Xms64m"
+
+@rem Find java.exe
+if defined JAVA_HOME goto findJavaFromJavaHome
+
+set JAVA_EXE=java.exe
+%JAVA_EXE% -version >NUL 2>&1
+if "%ERRORLEVEL%" == "0" goto execute
+
+echo.
+echo ERROR: JAVA_HOME is not set and no 'java' command could be found in your PATH.
+echo.
+echo Please set the JAVA_HOME variable in your environment to match the
+echo location of your Java installation.
+
+goto fail
+
+:findJavaFromJavaHome
+set JAVA_HOME=%JAVA_HOME:"=%
+set JAVA_EXE=%JAVA_HOME%/bin/java.exe
+
+if exist "%JAVA_EXE%" goto execute
+
+echo.
+echo ERROR: JAVA_HOME is set to an invalid directory: %JAVA_HOME%
+echo.
+echo Please set the JAVA_HOME variable in your environment to match the
+echo location of your Java installation.
+
+goto fail
+
+:execute
+@rem Setup the command line
+
+set CLASSPATH=%APP_HOME%\gradle\wrapper\gradle-wrapper.jar
+
+
+@rem Execute Gradle
+"%JAVA_EXE%" %DEFAULT_JVM_OPTS% %JAVA_OPTS% %GRADLE_OPTS% "-Dorg.gradle.appname=%APP_BASE_NAME%" -classpath "%CLASSPATH%" org.gradle.wrapper.GradleWrapperMain %*
+
+:end
+@rem End local scope for the variables with windows NT shell
+if "%ERRORLEVEL%"=="0" goto mainEnd
+
+:fail
+rem Set variable GRADLE_EXIT_CONSOLE if you need the _script_ return code instead of
+rem the _cmd.exe /c_ return code!
+if not "" == "%GRADLE_EXIT_CONSOLE%" exit 1
+exit /b 1
+
+:mainEnd
+if "%OS%"=="Windows_NT" endlocal
+
+:omega
diff --git a/android/SherpaOnnxSpokenLanguageIdentification/settings.gradle.kts b/android/SherpaOnnxSpokenLanguageIdentification/settings.gradle.kts
new file mode 100644
index 00000000..3b2d9721
--- /dev/null
+++ b/android/SherpaOnnxSpokenLanguageIdentification/settings.gradle.kts
@@ -0,0 +1,17 @@
+pluginManagement {
+ repositories {
+ google()
+ mavenCentral()
+ gradlePluginPortal()
+ }
+}
+dependencyResolutionManagement {
+ repositoriesMode.set(RepositoriesMode.FAIL_ON_PROJECT_REPOS)
+ repositories {
+ google()
+ mavenCentral()
+ }
+}
+
+rootProject.name = "SherpaOnnxSpokenLanguageIdentification"
+include(":app")
diff --git a/kotlin-api-examples/SpokenLanguageIdentification.kt b/kotlin-api-examples/SpokenLanguageIdentification.kt
deleted file mode 100644
index ef117c8b..00000000
--- a/kotlin-api-examples/SpokenLanguageIdentification.kt
+++ /dev/null
@@ -1,71 +0,0 @@
-package com.k2fsa.sherpa.onnx
-
-import android.content.res.AssetManager
-import android.util.Log
-
-private val TAG = "sherpa-onnx"
-
-data class SpokenLanguageIdentificationWhisperConfig (
- var encoder: String,
- var decoder: String,
- var tailPaddings: Int = -1,
-)
-
-data class SpokenLanguageIdentificationConfig (
- var whisper: SpokenLanguageIdentificationWhisperConfig,
- var numThreads: Int = 1,
- var debug: Boolean = false,
- var provider: String = "cpu",
-)
-
-class SpokenLanguageIdentification (
- assetManager: AssetManager? = null,
- config: SpokenLanguageIdentificationConfig,
-) {
- private var ptr: Long
-
- init {
- ptr = if (assetManager != null) {
- newFromAsset(assetManager, config)
- } else {
- newFromFile(config)
- }
- }
-
- protected fun finalize() {
- if (ptr != 0L) {
- delete(ptr)
- ptr = 0
- }
- }
-
- fun release() = finalize()
-
- fun createStream(): OfflineStream {
- val p = createStream(ptr)
- return OfflineStream(p)
- }
-
- fun compute(stream: OfflineStream) = compute(ptr, stream.ptr)
-
- private external fun newFromAsset(
- assetManager: AssetManager,
- config: SpokenLanguageIdentificationConfig,
- ): Long
-
- private external fun newFromFile(
- config: SpokenLanguageIdentificationConfig,
- ): Long
-
- private external fun delete(ptr: Long)
-
- private external fun createStream(ptr: Long): Long
-
- private external fun compute(ptr: Long, streamPtr: Long): String
-
- companion object {
- init {
- System.loadLibrary("sherpa-onnx-jni")
- }
- }
-}
diff --git a/kotlin-api-examples/SpokenLanguageIdentification.kt b/kotlin-api-examples/SpokenLanguageIdentification.kt
new file mode 120000
index 00000000..702a54c9
--- /dev/null
+++ b/kotlin-api-examples/SpokenLanguageIdentification.kt
@@ -0,0 +1 @@
+../android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/SpokenLanguageIdentification.kt
\ No newline at end of file
diff --git a/scripts/apk/build-apk-slid.sh.in b/scripts/apk/build-apk-slid.sh.in
new file mode 100644
index 00000000..6d6e33f8
--- /dev/null
+++ b/scripts/apk/build-apk-slid.sh.in
@@ -0,0 +1,91 @@
+#!/usr/bin/env bash
+#
+# Auto generated! Please DO NOT EDIT!
+
+# Please set the environment variable ANDROID_NDK
+# before running this script
+
+# Inside the $ANDROID_NDK directory, you can find a binary ndk-build
+# and some other files like the file "build/cmake/android.toolchain.cmake"
+
+set -ex
+
+# Print a timestamped message prefixed with the caller's file name, the line
+# number of the call and the calling function's name.
+# Arguments: the message words; they are joined with "$*".
+log() {
+ # This function is from espnet
+ # Strip the directory part from the caller's source path.
+ local fname=${BASH_SOURCE[1]##*/}
+ echo -e "$(date '+%Y-%m-%d %H:%M:%S') (${fname}:${BASH_LINENO[0]}:${FUNCNAME[1]}) $*"
+}
+
+SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" ./CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
+
+log "Building spoken language identification APK for sherpa-onnx v${SHERPA_ONNX_VERSION}"
+
+log "====================arm64-v8a================="
+./build-android-arm64-v8a.sh
+log "====================armv7-eabi================"
+./build-android-armv7-eabi.sh
+log "====================x86-64===================="
+./build-android-x86-64.sh
+log "====================x86===================="
+./build-android-x86.sh
+
+mkdir -p apks
+
+{% for model in model_list %}
+# Download the model into the app's assets directory and trim it down
+# before packaging.
+pushd ./android/SherpaOnnxSpokenLanguageIdentification/app/src/main/assets/
+model_name={{ model.model_name }}
+short_name={{ model.short_name }}
+type={{ model.idx }}
+
+curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/asr-models/${model_name}.tar.bz2
+tar xvf ${model_name}.tar.bz2
+# Remove files whose names end in -encoder.onnx / -decoder.onnx, plus
+# scripts, text files, docs and test waves.
+# NOTE(review): presumably this leaves only the quantized model files in the
+# assets directory -- confirm against the archive contents.
+rm -rfv $model_name/*-encoder.onnx
+rm -rfv $model_name/*-decoder.onnx
+rm -rfv $model_name/*.py
+rm -rfv $model_name/*.txt
+rm -rfv $model_name/*.md
+rm -rfv $model_name/test_wavs
+rm -rf *.tar.bz2
+ls -lh $model_name
+
+popd
+# Now we are at the project root directory
+
+# Restore tracked files so the sed below always starts from "type = 0".
+git checkout .
+pushd android/SherpaOnnxSpokenLanguageIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/slid/
+sed -i.bak s/"type = 0/type = $type/" ./slid.kt
+git diff
+popd
+
+for arch in arm64-v8a armeabi-v7a x86_64 x86; do
+ log "------------------------------------------------------------"
+ log "build spoken language identification apk for $arch"
+ log "------------------------------------------------------------"
+ # Map the Android ABI name to the suffix used by the build-android-* dirs.
+ src_arch=$arch
+ if [ $arch == "armeabi-v7a" ]; then
+ src_arch=armv7-eabi
+ elif [ $arch == "x86_64" ]; then
+ src_arch=x86-64
+ fi
+
+ ls -lh ./build-android-$src_arch/install/lib/*.so
+
+ cp -v ./build-android-$src_arch/install/lib/*.so ./android/SherpaOnnxSpokenLanguageIdentification/app/src/main/jniLibs/$arch/
+
+ pushd ./android/SherpaOnnxSpokenLanguageIdentification
+ # Raise the Gradle JVM heap limit (-Xmx2048m in gradle.properties).
+ sed -i.bak s/2048/9012/g ./gradle.properties
+ git diff ./gradle.properties
+ ./gradlew assembleRelease
+ popd
+
+ # Name the artifact after this app ("slid"); the previous name said
+ # "audio-tagging", a leftover from the audio-tagging build script.
+ mv android/SherpaOnnxSpokenLanguageIdentification/app/build/outputs/apk/release/app-release-unsigned.apk ./apks/sherpa-onnx-${SHERPA_ONNX_VERSION}-$arch-slid-$short_name.apk
+ ls -lh apks
+ # Remove this ABI's libraries so the next APK contains only its own ABI.
+ rm -v ./android/SherpaOnnxSpokenLanguageIdentification/app/src/main/jniLibs/$arch/*.so
+done
+
+rm -rf ./android/SherpaOnnxSpokenLanguageIdentification/app/src/main/assets/$model_name
+{% endfor %}
+
+git checkout .
+
+ls -lh apks/
diff --git a/scripts/apk/generate-slid-apk-script.py b/scripts/apk/generate-slid-apk-script.py
new file mode 100755
index 00000000..a1f9ffae
--- /dev/null
+++ b/scripts/apk/generate-slid-apk-script.py
@@ -0,0 +1,90 @@
+#!/usr/bin/env python3
+
+import argparse
+from dataclasses import dataclass
+from typing import List, Optional
+
+import jinja2
+
+
+def get_args():
+    """Parse the command-line options that select this runner's share of work.
+
+    Returns:
+      An ``argparse.Namespace`` with two integer attributes: ``total`` (number
+      of runners, default 1) and ``index`` (index of the current runner,
+      default 0).
+    """
+    # (flag, default, help text); every option is parsed as an int.
+    option_specs = (
+        ("--total", 1, "Number of runners"),
+        ("--index", 0, "Index of the current runner"),
+    )
+
+    cli = argparse.ArgumentParser()
+    for flag, default_value, help_text in option_specs:
+        cli.add_argument(flag, type=int, default=default_value, help=help_text)
+    return cli.parse_args()
+
+
+# Describes one model for which build-apk-slid.sh.in builds APKs.
+@dataclass
+class SlidModel:
+ # Substituted as `model_name` in the template, where it names the
+ # downloaded .tar.bz2 archive and the extracted directory.
+ model_name: str
+ # Substituted as `type` in the template and written into slid.kt by sed.
+ idx: int
+ # Substituted as `short_name` in the template; part of the APK file name.
+ short_name: str = ""
+
+
+def get_models():
+    """Return the list of models for which APKs are built.
+
+    Returns:
+      A new list of ``SlidModel`` entries (currently only whisper tiny).
+    """
+    # see https://k2-fsa.github.io/sherpa/onnx/spolken-language-identification/pretrained_models.html#pre-trained-models
+    return [
+        SlidModel(
+            model_name="sherpa-onnx-whisper-tiny",
+            idx=0,
+            short_name="whisper_tiny",
+        ),
+    ]
+
+
+def main():
+    """Render ``./build-apk-slid.sh`` from ``./build-apk-slid.sh.in``.
+
+    The models from ``get_models()`` are split across ``--total`` runners;
+    only the models assigned to runner ``--index`` are passed to the template
+    as ``model_list``.
+
+    Raises:
+      AssertionError: if ``index`` is not in ``[0, total)``.
+      ValueError: if there are fewer models than runners.
+    """
+    args = get_args()
+    total, index = args.total, args.index
+    assert 0 <= index < total, (index, total)
+
+    all_model_list = get_models()
+    num_models = len(all_model_list)
+
+    # Each runner gets `num_per_runner` models; `remaining` is what is left
+    # over after that even split.
+    num_per_runner, remaining = divmod(num_models, total)
+    if num_per_runner <= 0:
+        raise ValueError(f"num_models: {num_models}, num_runners: {total}")
+
+    start = index * num_per_runner
+    end = start + num_per_runner
+    print(f"{index}/{total}: {start}-{end}/{num_models}")
+
+    selected = all_model_list[start:end]
+    if index < remaining:
+        # Leftover models are handed out one each to the lowest-indexed runners.
+        extra = total * num_per_runner + index
+        selected.append(all_model_list[extra])
+        print(f"{extra}/{num_models}")
+
+    context = {"model_list": selected}
+
+    environment = jinja2.Environment()
+    for filename in ("./build-apk-slid.sh",):
+        with open(f"{filename}.in") as f:
+            template = environment.from_string(f.read())
+
+        rendered = template.render(**context)
+        with open(filename, "w") as f:
+            print(rendered, file=f)
+
+
+if __name__ == "__main__":
+ main()
diff --git a/sherpa-onnx/csrc/audio-tagging-impl.cc b/sherpa-onnx/csrc/audio-tagging-impl.cc
index 37cd6faa..3aa44d71 100644
--- a/sherpa-onnx/csrc/audio-tagging-impl.cc
+++ b/sherpa-onnx/csrc/audio-tagging-impl.cc
@@ -4,6 +4,8 @@
#include "sherpa-onnx/csrc/audio-tagging-impl.h"
+#include
+
#if __ANDROID_API__ >= 9
#include "android/asset_manager.h"
#include "android/asset_manager_jni.h"
diff --git a/sherpa-onnx/csrc/audio-tagging.cc b/sherpa-onnx/csrc/audio-tagging.cc
index 8fcb6ef4..c6d1e24f 100644
--- a/sherpa-onnx/csrc/audio-tagging.cc
+++ b/sherpa-onnx/csrc/audio-tagging.cc
@@ -4,6 +4,8 @@
#include "sherpa-onnx/csrc/audio-tagging.h"
+#include
+
#if __ANDROID_API__ >= 9
#include "android/asset_manager.h"
#include "android/asset_manager_jni.h"
diff --git a/sherpa-onnx/csrc/offline-whisper-model.cc b/sherpa-onnx/csrc/offline-whisper-model.cc
index 2dcfac90..183574f9 100644
--- a/sherpa-onnx/csrc/offline-whisper-model.cc
+++ b/sherpa-onnx/csrc/offline-whisper-model.cc
@@ -70,6 +70,23 @@ class OfflineWhisperModel::Impl {
InitDecoder(buf.data(), buf.size());
}
}
+
+ // Constructor for spoken language identification on Android: loads the
+ // whisper encoder and decoder through the asset manager.
+ //
+ // @param mgr Asset manager passed to ReadFile() to read the model files.
+ // @param config Supplies whisper.encoder, whisper.decoder and debug.
+ Impl(AAssetManager *mgr, const SpokenLanguageIdentificationConfig &config)
+ : lid_config_(config),
+ env_(ORT_LOGGING_LEVEL_ERROR),
+ sess_opts_(GetSessionOptions(config)),
+ allocator_{} {
+ // Read the flag from the parameter: config_ is not initialized by this
+ // constructor, so config_.debug would ignore the caller's setting.
+ debug_ = config.debug;
+ {
+ auto buf = ReadFile(mgr, config.whisper.encoder);
+ InitEncoder(buf.data(), buf.size());
+ }
+
+ {
+ auto buf = ReadFile(mgr, config.whisper.decoder);
+ InitDecoder(buf.data(), buf.size());
+ }
+ }
#endif
std::pair ForwardEncoder(Ort::Value features) {
@@ -326,6 +343,11 @@ OfflineWhisperModel::OfflineWhisperModel(
OfflineWhisperModel::OfflineWhisperModel(AAssetManager *mgr,
const OfflineModelConfig &config)
: impl_(std::make_unique(mgr, config)) {}
+
+// Constructor used by spoken language identification on Android; forwards
+// `mgr` and `config` to the matching Impl constructor.
+OfflineWhisperModel::OfflineWhisperModel(
+ AAssetManager *mgr, const SpokenLanguageIdentificationConfig &config)
+ : impl_(std::make_unique<Impl>(mgr, config)) {}
+
#endif
OfflineWhisperModel::~OfflineWhisperModel() = default;
diff --git a/sherpa-onnx/csrc/offline-whisper-model.h b/sherpa-onnx/csrc/offline-whisper-model.h
index 386a4d87..892af24a 100644
--- a/sherpa-onnx/csrc/offline-whisper-model.h
+++ b/sherpa-onnx/csrc/offline-whisper-model.h
@@ -31,6 +31,8 @@ class OfflineWhisperModel {
#if __ANDROID_API__ >= 9
OfflineWhisperModel(AAssetManager *mgr, const OfflineModelConfig &config);
+ OfflineWhisperModel(AAssetManager *mgr,
+ const SpokenLanguageIdentificationConfig &config);
#endif
~OfflineWhisperModel();
diff --git a/sherpa-onnx/csrc/spoken-language-identification-impl.cc b/sherpa-onnx/csrc/spoken-language-identification-impl.cc
index 599a72a7..016ac7e0 100644
--- a/sherpa-onnx/csrc/spoken-language-identification-impl.cc
+++ b/sherpa-onnx/csrc/spoken-language-identification-impl.cc
@@ -5,6 +5,11 @@
#include
+#if __ANDROID_API__ >= 9
+#include "android/asset_manager.h"
+#include "android/asset_manager_jni.h"
+#endif
+
#include "sherpa-onnx/csrc/macros.h"
#include "sherpa-onnx/csrc/onnx-utils.h"
#include "sherpa-onnx/csrc/spoken-language-identification-whisper-impl.h"
@@ -85,4 +90,34 @@ SpokenLanguageIdentificationImpl::Create(
return nullptr;
}
+#if __ANDROID_API__ >= 9
+// Factory for Android: reads the whisper encoder through the asset manager
+// `mgr`, detects the model type from it and builds the matching
+// implementation.
+//
+// Exits the process if config.whisper.encoder is empty. Returns nullptr if
+// the model type is not recognized.
+std::unique_ptr<SpokenLanguageIdentificationImpl>
+SpokenLanguageIdentificationImpl::Create(
+ AAssetManager *mgr, const SpokenLanguageIdentificationConfig &config) {
+ ModelType model_type = ModelType::kUnknown;
+ {
+ if (config.whisper.encoder.empty()) {
+ SHERPA_ONNX_LOGE("Only whisper models are supported at present");
+ exit(-1);
+ }
+ // The buffer is scoped so the encoder bytes are released once the model
+ // type has been determined.
+ auto buffer = ReadFile(mgr, config.whisper.encoder);
+
+ model_type = GetModelType(buffer.data(), buffer.size(), config.debug);
+ }
+
+ switch (model_type) {
+ case ModelType::kWhisper:
+ return std::make_unique<SpokenLanguageIdentificationWhisperImpl>(mgr,
+ config);
+ case ModelType::kUnknown:
+ SHERPA_ONNX_LOGE(
+ "Unknown model type for spoken language identification!");
+ return nullptr;
+ }
+
+ // unreachable code
+ return nullptr;
+}
+#endif
+
} // namespace sherpa_onnx
diff --git a/sherpa-onnx/csrc/spoken-language-identification-impl.h b/sherpa-onnx/csrc/spoken-language-identification-impl.h
index b9112fa4..bbbfedef 100644
--- a/sherpa-onnx/csrc/spoken-language-identification-impl.h
+++ b/sherpa-onnx/csrc/spoken-language-identification-impl.h
@@ -7,6 +7,11 @@
#include
#include
+#if __ANDROID_API__ >= 9
+#include "android/asset_manager.h"
+#include "android/asset_manager_jni.h"
+#endif
+
#include "sherpa-onnx/csrc/spoken-language-identification.h"
namespace sherpa_onnx {
@@ -18,6 +23,11 @@ class SpokenLanguageIdentificationImpl {
static std::unique_ptr Create(
const SpokenLanguageIdentificationConfig &config);
+#if __ANDROID_API__ >= 9
+ // Overload of Create() for Android that takes the asset manager `mgr`
+ // used to read the model files.
+ static std::unique_ptr<SpokenLanguageIdentificationImpl> Create(
+ AAssetManager *mgr, const SpokenLanguageIdentificationConfig &config);
+#endif
+
virtual std::unique_ptr CreateStream() const = 0;
virtual std::string Compute(OfflineStream *s) const = 0;
diff --git a/sherpa-onnx/csrc/spoken-language-identification-whisper-impl.h b/sherpa-onnx/csrc/spoken-language-identification-whisper-impl.h
index a44001d5..d82883b5 100644
--- a/sherpa-onnx/csrc/spoken-language-identification-whisper-impl.h
+++ b/sherpa-onnx/csrc/spoken-language-identification-whisper-impl.h
@@ -11,6 +11,11 @@
#include
#include
+#if __ANDROID_API__ >= 9
+#include "android/asset_manager.h"
+#include "android/asset_manager_jni.h"
+#endif
+
#include "sherpa-onnx/csrc/offline-whisper-model.h"
#include "sherpa-onnx/csrc/spoken-language-identification-impl.h"
#include "sherpa-onnx/csrc/transpose.h"
@@ -26,6 +31,15 @@ class SpokenLanguageIdentificationWhisperImpl
Check();
}
+#if __ANDROID_API__ >= 9
+ // Constructor for Android: creates the whisper model from files read
+ // through the asset manager `mgr`, then runs Check().
+ SpokenLanguageIdentificationWhisperImpl(
+ AAssetManager *mgr, const SpokenLanguageIdentificationConfig &config)
+ : config_(config),
+ model_(std::make_unique<OfflineWhisperModel>(mgr, config)) {
+ Check();
+ }
+#endif
+
std::unique_ptr CreateStream() const override {
return std::make_unique(WhisperTag{});
}
diff --git a/sherpa-onnx/csrc/spoken-language-identification.cc b/sherpa-onnx/csrc/spoken-language-identification.cc
index 2cb2d99a..eff49662 100644
--- a/sherpa-onnx/csrc/spoken-language-identification.cc
+++ b/sherpa-onnx/csrc/spoken-language-identification.cc
@@ -6,6 +6,11 @@
#include
+#if __ANDROID_API__ >= 9
+#include "android/asset_manager.h"
+#include "android/asset_manager_jni.h"
+#endif
+
#include "sherpa-onnx/csrc/file-utils.h"
#include "sherpa-onnx/csrc/macros.h"
#include "sherpa-onnx/csrc/spoken-language-identification-impl.h"
@@ -103,6 +108,12 @@ SpokenLanguageIdentification::SpokenLanguageIdentification(
const SpokenLanguageIdentificationConfig &config)
: impl_(SpokenLanguageIdentificationImpl::Create(config)) {}
+#if __ANDROID_API__ >= 9
+// Constructor for Android: delegates to
+// SpokenLanguageIdentificationImpl::Create(mgr, config).
+// NOTE(review): that factory returns nullptr for an unrecognized model type,
+// which leaves impl_ null -- confirm callers handle this.
+SpokenLanguageIdentification::SpokenLanguageIdentification(
+ AAssetManager *mgr, const SpokenLanguageIdentificationConfig &config)
+ : impl_(SpokenLanguageIdentificationImpl::Create(mgr, config)) {}
+#endif
+
SpokenLanguageIdentification::~SpokenLanguageIdentification() = default;
std::unique_ptr SpokenLanguageIdentification::CreateStream()
diff --git a/sherpa-onnx/csrc/spoken-language-identification.h b/sherpa-onnx/csrc/spoken-language-identification.h
index 83e60da5..6adb25d2 100644
--- a/sherpa-onnx/csrc/spoken-language-identification.h
+++ b/sherpa-onnx/csrc/spoken-language-identification.h
@@ -7,6 +7,11 @@
#include
#include
+#if __ANDROID_API__ >= 9
+#include "android/asset_manager.h"
+#include "android/asset_manager_jni.h"
+#endif
+
#include "sherpa-onnx/csrc/offline-stream.h"
#include "sherpa-onnx/csrc/parse-options.h"
@@ -70,6 +75,11 @@ class SpokenLanguageIdentification {
explicit SpokenLanguageIdentification(
const SpokenLanguageIdentificationConfig &config);
+#if __ANDROID_API__ >= 9
+ SpokenLanguageIdentification(
+ AAssetManager *mgr, const SpokenLanguageIdentificationConfig &config);
+#endif
+
~SpokenLanguageIdentification();
// Create a stream to accept audio samples and compute features
diff --git a/sherpa-onnx/jni/spoken-language-identification.cc b/sherpa-onnx/jni/spoken-language-identification.cc
index 0bff585d..0a4d88ea 100644
--- a/sherpa-onnx/jni/spoken-language-identification.cc
+++ b/sherpa-onnx/jni/spoken-language-identification.cc
@@ -54,6 +54,32 @@ static SpokenLanguageIdentificationConfig GetSpokenLanguageIdentificationConfig(
} // namespace sherpa_onnx
+// JNI entry point for SpokenLanguageIdentification.newFromAsset().
+//
+// Converts the Java config object to the native config and creates a native
+// SpokenLanguageIdentification that reads its models via the asset manager.
+//
+// Returns the address of the new native object as a jlong, or 0 if the
+// native asset manager cannot be obtained.
+SHERPA_ONNX_EXTERN_C
+JNIEXPORT jlong JNICALL
+Java_com_k2fsa_sherpa_onnx_SpokenLanguageIdentification_newFromAsset(
+ JNIEnv *env, jobject /*obj*/, jobject asset_manager, jobject _config) {
+#if __ANDROID_API__ >= 9
+ AAssetManager *mgr = AAssetManager_fromJava(env, asset_manager);
+ if (!mgr) {
+ SHERPA_ONNX_LOGE("Failed to get asset manager: %p", mgr);
+ // Do not go on to read model files through a null asset manager.
+ return 0;
+ }
+#endif
+
+ auto config =
+ sherpa_onnx::GetSpokenLanguageIdentificationConfig(env, _config);
+ SHERPA_ONNX_LOGE("spoken language identification newFromAsset config:\n%s",
+ config.ToString().c_str());
+
+ auto slid = new sherpa_onnx::SpokenLanguageIdentification(
+#if __ANDROID_API__ >= 9
+ mgr,
+#endif
+ config);
+ SHERPA_ONNX_LOGE("slid %p", slid);
+
+ return (jlong)slid;
+}
+
SHERPA_ONNX_EXTERN_C
JNIEXPORT jlong JNICALL
Java_com_k2fsa_sherpa_onnx_SpokenLanguageIdentification_newFromFile(
@@ -73,6 +99,14 @@ Java_com_k2fsa_sherpa_onnx_SpokenLanguageIdentification_newFromFile(
return (jlong)tagger;
}
+// JNI entry point for SpokenLanguageIdentification.delete().
+// `ptr` is the jlong handle returned by newFromAsset() (and presumably by
+// newFromFile()); the native object it points to is destroyed.
+SHERPA_ONNX_EXTERN_C
+JNIEXPORT void JNICALL
+Java_com_k2fsa_sherpa_onnx_SpokenLanguageIdentification_delete(JNIEnv *env,
+ jobject /*obj*/,
+ jlong ptr) {
+ delete reinterpret_cast<sherpa_onnx::SpokenLanguageIdentification *>(ptr);
+}
+
SHERPA_ONNX_EXTERN_C
JNIEXPORT jlong JNICALL
Java_com_k2fsa_sherpa_onnx_SpokenLanguageIdentification_createStream(