diff --git a/.github/workflows/apk-speaker-diarization.yaml b/.github/workflows/apk-speaker-diarization.yaml
new file mode 100644
index 00000000..19f0b99b
--- /dev/null
+++ b/.github/workflows/apk-speaker-diarization.yaml
@@ -0,0 +1,175 @@
+name: apk-speaker-diarization
+
+on:
+ push:
+ branches:
+ - apk
+ - android-demo-speaker-diarization-2
+
+ workflow_dispatch:
+
+concurrency:
+ group: apk-speaker-diarization-${{ github.ref }}
+ cancel-in-progress: true
+
+permissions:
+ contents: write
+
+jobs:
+ apk_speaker_identification:
+ if: github.repository_owner == 'csukuangfj' || github.repository_owner == 'k2-fsa'
+ runs-on: ${{ matrix.os }}
+ name: apk for speaker diarization ${{ matrix.index }}/${{ matrix.total }}
+ strategy:
+ fail-fast: false
+ matrix:
+ os: [ubuntu-latest]
+ total: ["1"]
+ index: ["0"]
+
+ steps:
+ - uses: actions/checkout@v4
+ with:
+ fetch-depth: 0
+
+ # https://github.com/actions/setup-java
+ - uses: actions/setup-java@v4
+ with:
+ distribution: 'temurin' # See 'Supported distributions' for available options
+ java-version: '21'
+
+ - name: ccache
+ uses: hendrikmuhs/ccache-action@v1.2
+ with:
+ key: ${{ matrix.os }}-android
+
+ - name: Display NDK HOME
+ shell: bash
+ run: |
+ echo "ANDROID_NDK_LATEST_HOME: ${ANDROID_NDK_LATEST_HOME}"
+ ls -lh ${ANDROID_NDK_LATEST_HOME}
+
+ - name: Install Python dependencies
+ shell: bash
+ run: |
+ python3 -m pip install --upgrade pip jinja2
+
+ - name: Setup build tool version variable
+ shell: bash
+ run: |
+ echo "---"
+ ls -lh /usr/local/lib/android/
+ echo "---"
+
+ ls -lh /usr/local/lib/android/sdk
+ echo "---"
+
+ ls -lh /usr/local/lib/android/sdk/build-tools
+ echo "---"
+
+ BUILD_TOOL_VERSION=$(ls /usr/local/lib/android/sdk/build-tools/ | tail -n 1)
+ echo "BUILD_TOOL_VERSION=$BUILD_TOOL_VERSION" >> $GITHUB_ENV
+ echo "Last build tool version is: $BUILD_TOOL_VERSION"
+
+ - name: Generate build script
+ shell: bash
+ run: |
+ cd scripts/apk
+
+ chmod +x build-apk-speaker-diarization.sh
+ mv -v ./build-apk-speaker-diarization.sh ../..
+
+ - name: build APK
+ shell: bash
+ run: |
+ export CMAKE_CXX_COMPILER_LAUNCHER=ccache
+ export PATH="/usr/lib/ccache:/usr/local/opt/ccache/libexec:$PATH"
+ cmake --version
+
+ export ANDROID_NDK=$ANDROID_NDK_LATEST_HOME
+ ./build-apk-speaker-diarization.sh
+
+ - name: Display APK
+ shell: bash
+ run: |
+ ls -lh ./apks/
+ du -h -d1 .
+
+ # https://github.com/marketplace/actions/sign-android-release
+ - uses: r0adkll/sign-android-release@v1
+ name: Sign app APK
+ with:
+ releaseDirectory: ./apks
+ signingKeyBase64: ${{ secrets.ANDROID_SIGNING_KEY }}
+ alias: ${{ secrets.ANDROID_SIGNING_KEY_ALIAS }}
+ keyStorePassword: ${{ secrets.ANDROID_SIGNING_KEY_STORE_PASSWORD }}
+ env:
+ BUILD_TOOLS_VERSION: ${{ env.BUILD_TOOL_VERSION }}
+
+ - name: Display APK after signing
+ shell: bash
+ run: |
+ ls -lh ./apks/
+ du -h -d1 .
+
+ - name: Rename APK after signing
+ shell: bash
+ run: |
+ cd apks
+ rm -fv signingKey.jks
+ rm -fv *.apk.idsig
+ rm -fv *-aligned.apk
+
+ all_apks=$(ls -1 *-signed.apk)
+ echo "----"
+ echo $all_apks
+ echo "----"
+ for apk in ${all_apks[@]}; do
+ n=$(echo $apk | sed -e s/-signed//)
+ mv -v $apk $n
+ done
+
+ cd ..
+
+ ls -lh ./apks/
+ du -h -d1 .
+
+ - name: Display APK after rename
+ shell: bash
+ run: |
+ ls -lh ./apks/
+ du -h -d1 .
+
+ - name: Publish to huggingface
+ env:
+ HF_TOKEN: ${{ secrets.HF_TOKEN }}
+ uses: nick-fields/retry@v3
+ with:
+ max_attempts: 20
+ timeout_seconds: 200
+ shell: bash
+ command: |
+ git config --global user.email "csukuangfj@gmail.com"
+ git config --global user.name "Fangjun Kuang"
+
+ rm -rf huggingface
+ export GIT_LFS_SKIP_SMUDGE=1
+ export GIT_CLONE_PROTECTION_ACTIVE=false
+
+ SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" ./CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
+ echo "SHERPA_ONNX_VERSION $SHERPA_ONNX_VERSION"
+
+ git clone https://huggingface.co/csukuangfj/sherpa-onnx-apk huggingface
+ cd huggingface
+ git fetch
+ git pull
+ git merge -m "merge remote" --ff origin main
+
+ d=speaker-diarization/$SHERPA_ONNX_VERSION
+ mkdir -p $d/
+ cp -v ../apks/*.apk $d/
+ git status
+ git lfs track "*.apk"
+ git add .
+ git commit -m "add more apks"
+ git push https://csukuangfj:$HF_TOKEN@huggingface.co/csukuangfj/sherpa-onnx-apk main
diff --git a/.github/workflows/apk-speaker-identification.yaml b/.github/workflows/apk-speaker-identification.yaml
index ca89ec49..e32ad3bc 100644
--- a/.github/workflows/apk-speaker-identification.yaml
+++ b/.github/workflows/apk-speaker-identification.yaml
@@ -53,6 +53,23 @@ jobs:
run: |
python3 -m pip install --upgrade pip jinja2
+ - name: Setup build tool version variable
+ shell: bash
+ run: |
+ echo "---"
+ ls -lh /usr/local/lib/android/
+ echo "---"
+
+ ls -lh /usr/local/lib/android/sdk
+ echo "---"
+
+ ls -lh /usr/local/lib/android/sdk/build-tools
+ echo "---"
+
+ BUILD_TOOL_VERSION=$(ls /usr/local/lib/android/sdk/build-tools/ | tail -n 1)
+ echo "BUILD_TOOL_VERSION=$BUILD_TOOL_VERSION" >> $GITHUB_ENV
+ echo "Last build tool version is: $BUILD_TOOL_VERSION"
+
- name: Generate build script
shell: bash
run: |
@@ -82,6 +99,51 @@ jobs:
ls -lh ./apks/
du -h -d1 .
+ # https://github.com/marketplace/actions/sign-android-release
+ - uses: r0adkll/sign-android-release@v1
+ name: Sign app APK
+ with:
+ releaseDirectory: ./apks
+ signingKeyBase64: ${{ secrets.ANDROID_SIGNING_KEY }}
+ alias: ${{ secrets.ANDROID_SIGNING_KEY_ALIAS }}
+ keyStorePassword: ${{ secrets.ANDROID_SIGNING_KEY_STORE_PASSWORD }}
+ env:
+ BUILD_TOOLS_VERSION: ${{ env.BUILD_TOOL_VERSION }}
+
+ - name: Display APK after signing
+ shell: bash
+ run: |
+ ls -lh ./apks/
+ du -h -d1 .
+
+ - name: Rename APK after signing
+ shell: bash
+ run: |
+ cd apks
+ rm -fv signingKey.jks
+ rm -fv *.apk.idsig
+ rm -fv *-aligned.apk
+
+ all_apks=$(ls -1 *-signed.apk)
+ echo "----"
+ echo $all_apks
+ echo "----"
+ for apk in ${all_apks[@]}; do
+ n=$(echo $apk | sed -e s/-signed//)
+ mv -v $apk $n
+ done
+
+ cd ..
+
+ ls -lh ./apks/
+ du -h -d1 .
+
+ - name: Display APK after rename
+ shell: bash
+ run: |
+ ls -lh ./apks/
+ du -h -d1 .
+
- name: Publish to huggingface
env:
HF_TOKEN: ${{ secrets.HF_TOKEN }}
diff --git a/.github/workflows/apk-vad.yaml b/.github/workflows/apk-vad.yaml
index 8253145b..d9af7547 100644
--- a/.github/workflows/apk-vad.yaml
+++ b/.github/workflows/apk-vad.yaml
@@ -166,7 +166,7 @@ jobs:
git pull
git merge -m "merge remote" --ff origin main
- d=vad/SHERPA_ONNX_VERSION
+ d=vad/$SHERPA_ONNX_VERSION
mkdir -p $d
cp -v ../apks/*.apk $d/
git status
diff --git a/README.md b/README.md
index 1828847e..32d141f9 100644
--- a/README.md
+++ b/README.md
@@ -84,8 +84,9 @@ with the following APIs
### Links for Huggingface Spaces
-You can visit the following Huggingface spaces to try `sherpa-onnx` without
-installing anything. All you need is a browser.
+
+You can visit the following Huggingface spaces to try sherpa-onnx without
+installing anything. All you need is a browser.
| Description | URL |
|-------------------------------------------------------|------------------------------------|
@@ -118,23 +119,34 @@ We also have spaces built using WebAssembly. They are listed below:
|Speech synthesis (German) |[Click me][wasm-hf-tts-piper-de]| [地址][wasm-ms-tts-piper-de]|
|Speaker diarization |[Click me][wasm-hf-speaker-diarization]|[地址][wasm-ms-speaker-diarization]|
+
+
### Links for pre-built Android APKs
-| Description | URL | 中国用户 |
-|----------------------------------------|------------------------------|-----------------------------|
-| Streaming speech recognition | [Address][apk-streaming-asr] | [点此][apk-streaming-asr-cn]|
-| Text-to-speech | [Address][apk-tts] | [点此][apk-tts-cn] |
-| Voice activity detection (VAD) | [Address][apk-vad] | [点此][apk-vad-cn] |
-| VAD + non-streaming speech recognition | [Address][apk-vad-asr] | [点此][apk-vad-asr-cn] |
-| Two-pass speech recognition | [Address][apk-2pass] | [点此][apk-2pass-cn] |
-| Audio tagging | [Address][apk-at] | [点此][apk-at-cn] |
-| Audio tagging (WearOS) | [Address][apk-at-wearos] | [点此][apk-at-wearos-cn] |
-| Speaker identification | [Address][apk-sid] | [点此][apk-sid-cn] |
-| Spoken language identification | [Address][apk-slid] | [点此][apk-slid-cn] |
-| Keyword spotting | [Address][apk-kws] | [点此][apk-kws-cn] |
+
+
+You can find pre-built Android APKs for this repository in the following table
+
+| Description | URL | 中国用户 |
+|----------------------------------------|------------------------------------|-----------------------------------|
+| Speaker diarization | [Address][apk-speaker-diarization] | [点此][apk-speaker-diarization-cn]|
+| Streaming speech recognition | [Address][apk-streaming-asr] | [点此][apk-streaming-asr-cn] |
+| Text-to-speech | [Address][apk-tts] | [点此][apk-tts-cn] |
+| Voice activity detection (VAD) | [Address][apk-vad] | [点此][apk-vad-cn] |
+| VAD + non-streaming speech recognition | [Address][apk-vad-asr] | [点此][apk-vad-asr-cn] |
+| Two-pass speech recognition | [Address][apk-2pass] | [点此][apk-2pass-cn] |
+| Audio tagging | [Address][apk-at] | [点此][apk-at-cn] |
+| Audio tagging (WearOS) | [Address][apk-at-wearos] | [点此][apk-at-wearos-cn] |
+| Speaker identification | [Address][apk-sid] | [点此][apk-sid-cn] |
+| Spoken language identification | [Address][apk-slid] | [点此][apk-slid-cn] |
+| Keyword spotting | [Address][apk-kws] | [点此][apk-kws-cn] |
+
+
### Links for pre-built Flutter APPs
+
+
#### Real-time speech recognition
| Description | URL | 中国用户 |
@@ -153,17 +165,24 @@ We also have spaces built using WebAssembly. They are listed below:
> Note: You need to build from source for iOS.
+
+
### Links for pre-built Lazarus APPs
+
+
#### Generating subtitles
| Description | URL | 中国用户 |
|--------------------------------|----------------------------|----------------------------|
| Generate subtitles (生成字幕) | [Address][lazarus-subtitle]| [点此][lazarus-subtitle-cn]|
+
### Links for pre-trained models
+
+
| Description | URL |
|---------------------------------------------|---------------------------------------------------------------------------------------|
| Speech recognition (speech to text, ASR) | [Address][asr-models] |
@@ -176,6 +195,8 @@ We also have spaces built using WebAssembly. They are listed below:
| Punctuation | [Address][punct-models] |
| Speaker segmentation | [Address][speaker-segmentation-models] |
+
+
### Useful links
- Documentation: https://k2-fsa.github.io/sherpa/onnx/
@@ -265,6 +286,8 @@ Video demo in Chinese: [爆了!炫神教你开打字挂!真正影响胜率
[wasm-ms-tts-piper-de]: https://modelscope.cn/studios/k2-fsa/web-assembly-tts-sherpa-onnx-de
[wasm-hf-speaker-diarization]: https://huggingface.co/spaces/k2-fsa/web-assembly-speaker-diarization-sherpa-onnx
[wasm-ms-speaker-diarization]: https://www.modelscope.cn/studios/csukuangfj/web-assembly-speaker-diarization-sherpa-onnx
+[apk-speaker-diarization]: https://k2-fsa.github.io/sherpa/onnx/speaker-diarization/apk.html
+[apk-speaker-diarization-cn]: https://k2-fsa.github.io/sherpa/onnx/speaker-diarization/apk-cn.html
[apk-streaming-asr]: https://k2-fsa.github.io/sherpa/onnx/android/apk.html
[apk-streaming-asr-cn]: https://k2-fsa.github.io/sherpa/onnx/android/apk-cn.html
[apk-tts]: https://k2-fsa.github.io/sherpa/onnx/tts/apk-engine.html
diff --git a/android/README.md b/android/README.md
index 42b29e08..bae33559 100644
--- a/android/README.md
+++ b/android/README.md
@@ -4,6 +4,8 @@ Please refer to
https://k2-fsa.github.io/sherpa/onnx/android/index.html
for usage.
+- [SherpaOnnxSpeakerDiarization](./SherpaOnnxSpeakerDiarization) It is for speaker diarization.
+
- [SherpaOnnx](./SherpaOnnx) It uses a streaming ASR model.
- [SherpaOnnx2Pass](./SherpaOnnx2Pass) It uses a streaming ASR model
diff --git a/android/SherpaOnnxSpeakerDiarization/.gitignore b/android/SherpaOnnxSpeakerDiarization/.gitignore
new file mode 100644
index 00000000..aa724b77
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/.gitignore
@@ -0,0 +1,15 @@
+*.iml
+.gradle
+/local.properties
+/.idea/caches
+/.idea/libraries
+/.idea/modules.xml
+/.idea/workspace.xml
+/.idea/navEditor.xml
+/.idea/assetWizardSettings.xml
+.DS_Store
+/build
+/captures
+.externalNativeBuild
+.cxx
+local.properties
diff --git a/android/SherpaOnnxSpeakerDiarization/app/.gitignore b/android/SherpaOnnxSpeakerDiarization/app/.gitignore
new file mode 100644
index 00000000..42afabfd
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/.gitignore
@@ -0,0 +1 @@
+/build
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/build.gradle.kts b/android/SherpaOnnxSpeakerDiarization/app/build.gradle.kts
new file mode 100644
index 00000000..7a390ba4
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/build.gradle.kts
@@ -0,0 +1,71 @@
+plugins {
+ alias(libs.plugins.android.application)
+ alias(libs.plugins.jetbrains.kotlin.android)
+}
+
+android {
+ namespace = "com.k2fsa.sherpa.onnx.speaker.diarization"
+ compileSdk = 34
+
+ defaultConfig {
+ applicationId = "com.k2fsa.sherpa.onnx.speaker.diarization"
+ minSdk = 21
+ targetSdk = 34
+ versionCode = 1
+ versionName = "1.0"
+
+ testInstrumentationRunner = "androidx.test.runner.AndroidJUnitRunner"
+ vectorDrawables {
+ useSupportLibrary = true
+ }
+ }
+
+ buildTypes {
+ release {
+ isMinifyEnabled = false
+ proguardFiles(
+ getDefaultProguardFile("proguard-android-optimize.txt"),
+ "proguard-rules.pro"
+ )
+ }
+ }
+ compileOptions {
+ sourceCompatibility = JavaVersion.VERSION_1_8
+ targetCompatibility = JavaVersion.VERSION_1_8
+ }
+ kotlinOptions {
+ jvmTarget = "1.8"
+ }
+ buildFeatures {
+ compose = true
+ }
+ composeOptions {
+ kotlinCompilerExtensionVersion = "1.5.1"
+ }
+ packaging {
+ resources {
+ excludes += "/META-INF/{AL2.0,LGPL2.1}"
+ }
+ }
+}
+
+dependencies {
+
+ implementation(libs.androidx.core.ktx)
+ implementation(libs.androidx.lifecycle.runtime.ktx)
+ implementation(libs.androidx.activity.compose)
+ implementation(platform(libs.androidx.compose.bom))
+ implementation(libs.androidx.ui)
+ implementation(libs.androidx.ui.graphics)
+ implementation(libs.androidx.ui.tooling.preview)
+ implementation(libs.androidx.material3)
+ implementation(libs.androidx.navigation.compose)
+ implementation(libs.androidx.documentfile)
+ testImplementation(libs.junit)
+ androidTestImplementation(libs.androidx.junit)
+ androidTestImplementation(libs.androidx.espresso.core)
+ androidTestImplementation(platform(libs.androidx.compose.bom))
+ androidTestImplementation(libs.androidx.ui.test.junit4)
+ debugImplementation(libs.androidx.ui.tooling)
+ debugImplementation(libs.androidx.ui.test.manifest)
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/proguard-rules.pro b/android/SherpaOnnxSpeakerDiarization/app/proguard-rules.pro
new file mode 100644
index 00000000..481bb434
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/proguard-rules.pro
@@ -0,0 +1,21 @@
+# Add project specific ProGuard rules here.
+# You can control the set of applied configuration files using the
+# proguardFiles setting in build.gradle.
+#
+# For more details, see
+# http://developer.android.com/guide/developing/tools/proguard.html
+
+# If your project uses WebView with JS, uncomment the following
+# and specify the fully qualified class name to the JavaScript interface
+# class:
+#-keepclassmembers class fqcn.of.javascript.interface.for.webview {
+# public *;
+#}
+
+# Uncomment this to preserve the line number information for
+# debugging stack traces.
+#-keepattributes SourceFile,LineNumberTable
+
+# If you keep the line number information, uncomment this to
+# hide the original source file name.
+#-renamesourcefileattribute SourceFile
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/androidTest/java/com/k2fsa/sherpa/onnx/speaker/diarization/ExampleInstrumentedTest.kt b/android/SherpaOnnxSpeakerDiarization/app/src/androidTest/java/com/k2fsa/sherpa/onnx/speaker/diarization/ExampleInstrumentedTest.kt
new file mode 100644
index 00000000..53d7af15
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/androidTest/java/com/k2fsa/sherpa/onnx/speaker/diarization/ExampleInstrumentedTest.kt
@@ -0,0 +1,24 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization
+
+import androidx.test.platform.app.InstrumentationRegistry
+import androidx.test.ext.junit.runners.AndroidJUnit4
+
+import org.junit.Test
+import org.junit.runner.RunWith
+
+import org.junit.Assert.*
+
+/**
+ * Instrumented test, which will execute on an Android device.
+ *
+ * See [testing documentation](http://d.android.com/tools/testing).
+ */
+@RunWith(AndroidJUnit4::class)
+class ExampleInstrumentedTest {
+ @Test
+ fun useAppContext() {
+ // Context of the app under test.
+ val appContext = InstrumentationRegistry.getInstrumentation().targetContext
+ assertEquals("com.k2fsa.sherpa.onnx.speaker.diarization", appContext.packageName)
+ }
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/AndroidManifest.xml b/android/SherpaOnnxSpeakerDiarization/app/src/main/AndroidManifest.xml
new file mode 100644
index 00000000..d58f7e8d
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/AndroidManifest.xml
@@ -0,0 +1,32 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/assets/.gitkeep b/android/SherpaOnnxSpeakerDiarization/app/src/main/assets/.gitkeep
new file mode 100644
index 00000000..e69de29b
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/BarItem.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/BarItem.kt
new file mode 100644
index 00000000..0895cf52
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/BarItem.kt
@@ -0,0 +1,13 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization
+
+import androidx.compose.ui.graphics.vector.ImageVector
+
+data class BarItem(
+ val title: String,
+
+ // see https://www.composables.com/icons
+ // and
+ // https://developer.android.com/reference/kotlin/androidx/compose/material/icons/filled/package-summary
+ val image: ImageVector,
+ val route: String,
+)
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/MainActivity.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/MainActivity.kt
new file mode 100644
index 00000000..7a25d49b
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/MainActivity.kt
@@ -0,0 +1,132 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization
+
+import android.os.Bundle
+import androidx.activity.ComponentActivity
+import androidx.activity.compose.setContent
+import androidx.activity.enableEdgeToEdge
+import androidx.compose.foundation.layout.Column
+import androidx.compose.foundation.layout.fillMaxSize
+import androidx.compose.foundation.layout.padding
+import androidx.compose.material3.CenterAlignedTopAppBar
+import androidx.compose.material3.ExperimentalMaterial3Api
+import androidx.compose.material3.Icon
+import androidx.compose.material3.MaterialTheme
+import androidx.compose.material3.NavigationBar
+import androidx.compose.material3.NavigationBarItem
+import androidx.compose.material3.Scaffold
+import androidx.compose.material3.Surface
+import androidx.compose.material3.Text
+import androidx.compose.material3.TopAppBarDefaults
+import androidx.compose.runtime.Composable
+import androidx.compose.runtime.getValue
+import androidx.compose.ui.Modifier
+import androidx.compose.ui.text.font.FontWeight
+import androidx.compose.ui.tooling.preview.Preview
+import androidx.navigation.NavGraph.Companion.findStartDestination
+import androidx.navigation.NavHostController
+import androidx.navigation.compose.NavHost
+import androidx.navigation.compose.composable
+import androidx.navigation.compose.currentBackStackEntryAsState
+import androidx.navigation.compose.rememberNavController
+import com.k2fsa.sherpa.onnx.speaker.diarization.screens.HelpScreen
+import com.k2fsa.sherpa.onnx.speaker.diarization.screens.HomeScreen
+import com.k2fsa.sherpa.onnx.speaker.diarization.ui.theme.SherpaOnnxSpeakerDiarizationTheme
+
+const val TAG = "sherpa-onnx-sd"
+
+class MainActivity : ComponentActivity() {
+ override fun onCreate(savedInstanceState: Bundle?) {
+ super.onCreate(savedInstanceState)
+ enableEdgeToEdge()
+ setContent {
+ SherpaOnnxSpeakerDiarizationTheme {
+ // A surface container using the 'background' color from the theme
+ Surface(
+ modifier = Modifier.fillMaxSize(),
+ color = MaterialTheme.colorScheme.background
+ ) {
+ MainScreen()
+ }
+ }
+ }
+ SpeakerDiarizationObject.initSpeakerDiarization(this.assets)
+ }
+}
+
+@OptIn(ExperimentalMaterial3Api::class)
+@Composable
+fun MainScreen(modifier: Modifier = Modifier) {
+ val navController = rememberNavController()
+ Scaffold(
+ topBar = {
+ CenterAlignedTopAppBar(
+ colors = TopAppBarDefaults.topAppBarColors(
+ containerColor = MaterialTheme.colorScheme.primaryContainer,
+ titleContentColor = MaterialTheme.colorScheme.primary,
+ ),
+ title = {
+ Text(
+ "Next-gen Kaldi: Speaker Diarization",
+ fontWeight = FontWeight.Bold,
+ )
+ },
+ )
+ },
+ content = { padding ->
+ Column(Modifier.padding(padding)) {
+ NavigationHost(navController = navController)
+
+ }
+ },
+ bottomBar = {
+ BottomNavigationBar(navController = navController)
+ }
+ )
+}
+
+@Composable
+fun NavigationHost(navController: NavHostController) {
+ NavHost(navController = navController, startDestination = NavRoutes.Home.route) {
+ composable(NavRoutes.Home.route) {
+ HomeScreen()
+ }
+
+ composable(NavRoutes.Help.route) {
+ HelpScreen()
+ }
+ }
+}
+
+@Composable
+fun BottomNavigationBar(navController: NavHostController) {
+ NavigationBar {
+ val backStackEntry by navController.currentBackStackEntryAsState()
+ val currentRoute = backStackEntry?.destination?.route
+
+ NavBarItems.BarItems.forEach { navItem ->
+ NavigationBarItem(selected = currentRoute == navItem.route,
+ onClick = {
+ navController.navigate(navItem.route) {
+ popUpTo(navController.graph.findStartDestination().id) {
+ saveState = true
+ }
+ launchSingleTop = true
+ restoreState = true
+ }
+ },
+ icon = {
+ Icon(imageVector = navItem.image, contentDescription = navItem.title)
+ }, label = {
+ Text(text = navItem.title)
+ })
+ }
+ }
+}
+
+@Preview(showBackground = true)
+@Composable
+fun MainScreenPreview() {
+ SherpaOnnxSpeakerDiarizationTheme {
+ MainScreen()
+ }
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/NavBarItems.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/NavBarItems.kt
new file mode 100644
index 00000000..65c737f9
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/NavBarItems.kt
@@ -0,0 +1,20 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization
+
+import androidx.compose.material.icons.Icons
+import androidx.compose.material.icons.filled.Home
+import androidx.compose.material.icons.filled.Info
+
+object NavBarItems {
+ val BarItems = listOf(
+ BarItem(
+ title = "Home",
+ image = Icons.Filled.Home,
+ route = "home",
+ ),
+ BarItem(
+ title = "Help",
+ image = Icons.Filled.Info,
+ route = "help",
+ ),
+ )
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/NavRoutes.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/NavRoutes.kt
new file mode 100644
index 00000000..2e1ae90b
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/NavRoutes.kt
@@ -0,0 +1,6 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization
+
+sealed class NavRoutes(val route: String) {
+ object Home : NavRoutes("home")
+ object Help : NavRoutes("help")
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/OfflineSpeakerDiarization.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/OfflineSpeakerDiarization.kt
new file mode 120000
index 00000000..459cc22c
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/OfflineSpeakerDiarization.kt
@@ -0,0 +1 @@
+../../../../../../../../../../../../sherpa-onnx/kotlin-api/OfflineSpeakerDiarization.kt
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ReadWaveFile.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ReadWaveFile.kt
new file mode 100644
index 00000000..940a2b64
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ReadWaveFile.kt
@@ -0,0 +1,137 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization.screens
+
+import android.content.Context
+import android.media.AudioFormat
+import android.media.MediaCodec
+import android.media.MediaExtractor
+import android.media.MediaFormat
+import android.net.Uri
+
+data class WaveData(
+ val sampleRate: Int? = null,
+ val samples: FloatArray? = null,
+ val msg: String? = null
+)
+
+// It supports only 16-bit encoded wave files
+//
+// References
+// - https://gist.github.com/a-m-s/1991ab18fbcb0fcc2cf9
+// - https://github.com/taehwandev/MediaCodecExample/blob/master/app/src/main/java/tech/thdev/mediacodecexample/audio/AACAudioDecoderThread.kt
+fun readUri(context: Context, uri: Uri): WaveData {
+ val extractor = MediaExtractor()
+ extractor.setDataSource(context, uri, null)
+
+ val samplesList: MutableList = ArrayList()
+
+ for (i in 0 until extractor.trackCount) {
+ val format = extractor.getTrackFormat(i)
+ val mime = format.getString(MediaFormat.KEY_MIME)
+ if (mime?.startsWith("audio/") == true) {
+ extractor.selectTrack(i)
+
+ var encoding: Int = -1
+ try {
+ encoding = format.getInteger(MediaFormat.KEY_PCM_ENCODING)
+ } catch (_: Exception) {
+ }
+
+ if (encoding != AudioFormat.ENCODING_PCM_16BIT) {
+ return WaveData(msg = "We support only 16-bit encoded wave files")
+ }
+
+ val sampleRate = format.getInteger(MediaFormat.KEY_SAMPLE_RATE)
+ val decoder = MediaCodec.createDecoderByType(mime)
+ decoder.configure(format, null, null, 0)
+ decoder.start()
+
+ val inputBuffers = decoder.inputBuffers
+ var outputBuffers = decoder.outputBuffers
+
+ val info = MediaCodec.BufferInfo()
+ var eof = false
+
+ var outputBufferIndex = -1
+
+ while (true) {
+ if (!eof) {
+ val inputBufferIndex = decoder.dequeueInputBuffer(10000)
+ if (inputBufferIndex > 0) {
+ val size = extractor.readSampleData(inputBuffers[inputBufferIndex], 0)
+ if (size < 0) {
+ decoder.queueInputBuffer(
+ inputBufferIndex,
+ 0,
+ 0,
+ 0,
+ MediaCodec.BUFFER_FLAG_END_OF_STREAM
+ )
+ eof = true
+ } else {
+ decoder.queueInputBuffer(
+ inputBufferIndex,
+ 0,
+ size,
+ extractor.sampleTime,
+ 0
+ )
+ extractor.advance()
+ }
+ }
+ } // if (!eof)
+
+ if (outputBufferIndex >= 0) {
+ outputBuffers[outputBufferIndex].position(0)
+ }
+
+ outputBufferIndex = decoder.dequeueOutputBuffer(info, 10000)
+ if (outputBufferIndex >= 0) {
+ if (info.flags != 0) {
+ decoder.stop()
+ decoder.release()
+
+ var k = 0
+ for (s in samplesList) {
+ k += s.size
+ }
+ if (k == 0) {
+ return WaveData(msg = "Failed to read selected file")
+ }
+
+ val ans = FloatArray(k)
+ k = 0
+ for (s in samplesList) {
+ s.copyInto(ans, k)
+ k += s.size
+ }
+
+ return WaveData(sampleRate = sampleRate, samples = ans)
+ }
+
+ val buffer = outputBuffers[outputBufferIndex]
+ val chunk = ByteArray(info.size)
+ buffer[chunk]
+ buffer.clear()
+
+ val numSamples = info.size / 2
+
+ val samples = FloatArray(numSamples)
+ for (k in 0 until numSamples) {
+ // assume little endian
+ val s = chunk[2 * k] + (chunk[2 * k + 1] * 256.0f)
+
+ samples[k] = s / 32768.0f
+ }
+ samplesList.add(samples)
+
+ decoder.releaseOutputBuffer(outputBufferIndex, false)
+ } else if (outputBufferIndex == MediaCodec.INFO_OUTPUT_BUFFERS_CHANGED) {
+ outputBuffers = decoder.outputBuffers
+ }
+ }
+ }
+ }
+
+ extractor.release()
+ return WaveData(msg = "not an audio file")
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/SpeakerDiarizationObject.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/SpeakerDiarizationObject.kt
new file mode 100644
index 00000000..f4bc2455
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/SpeakerDiarizationObject.kt
@@ -0,0 +1,66 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization
+
+import android.content.res.AssetManager
+import android.util.Log
+import com.k2fsa.sherpa.onnx.FastClusteringConfig
+import com.k2fsa.sherpa.onnx.OfflineSpeakerDiarization
+import com.k2fsa.sherpa.onnx.OfflineSpeakerDiarizationConfig
+import com.k2fsa.sherpa.onnx.OfflineSpeakerSegmentationModelConfig
+import com.k2fsa.sherpa.onnx.OfflineSpeakerSegmentationPyannoteModelConfig
+import com.k2fsa.sherpa.onnx.SpeakerEmbeddingExtractorConfig
+
+// Please download
+// https://github.com/k2-fsa/sherpa-onnx/releases/download/speaker-segmentation-models/sherpa-onnx-pyannote-segmentation-3-0.tar.bz2
+// then unzip it, rename model.onnx to segmentation.onnx, and mv
+// segmentation.onnx to the assets folder
+val segmentationModel = "segmentation.onnx"
+
+// please download it from
+// https://github.com/k2-fsa/sherpa-onnx/releases/download/speaker-recongition-models/3dspeaker_speech_eres2net_base_sv_zh-cn_3dspeaker_16k.onnx
+// and move it to the assets folder
+val embeddingModel = "3dspeaker_speech_eres2net_base_sv_zh-cn_3dspeaker_16k.onnx"
+
+// in the end, your assets folder should look like below
+/*
+(py38) fangjuns-MacBook-Pro:assets fangjun$ pwd
+/Users/fangjun/open-source/sherpa-onnx/android/SherpaOnnxSpeakerDiarization/app/src/main/assets
+(py38) fangjuns-MacBook-Pro:assets fangjun$ ls -lh
+total 89048
+-rw-r--r-- 1 fangjun staff 38M Oct 12 20:28 3dspeaker_speech_eres2net_base_sv_zh-cn_3dspeaker_16k.onnx
+-rw-r--r-- 1 fangjun staff 5.7M Oct 12 20:28 segmentation.onnx
+ */
+
+object SpeakerDiarizationObject {
+ var _sd: OfflineSpeakerDiarization? = null
+ val sd: OfflineSpeakerDiarization
+ get() {
+ return _sd!!
+ }
+
+ fun initSpeakerDiarization(assetManager: AssetManager? = null) {
+ synchronized(this) {
+ if (_sd != null) {
+ return
+ }
+ Log.i(TAG, "Initializing sherpa-onnx speaker diarization")
+
+ val config = OfflineSpeakerDiarizationConfig(
+ segmentation = OfflineSpeakerSegmentationModelConfig(
+ pyannote = OfflineSpeakerSegmentationPyannoteModelConfig(
+ segmentationModel
+ ),
+ debug = true,
+ ),
+ embedding = SpeakerEmbeddingExtractorConfig(
+ model = embeddingModel,
+ debug = true,
+ numThreads = 2,
+ ),
+ clustering = FastClusteringConfig(numClusters = -1, threshold = 0.5f),
+ minDurationOn = 0.2f,
+ minDurationOff = 0.5f,
+ )
+ _sd = OfflineSpeakerDiarization(assetManager = assetManager, config = config)
+ }
+ }
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/SpeakerEmbeddingExtractorConfig.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/SpeakerEmbeddingExtractorConfig.kt
new file mode 120000
index 00000000..9bab8fe8
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/SpeakerEmbeddingExtractorConfig.kt
@@ -0,0 +1 @@
+../../../../../../../../../../../../sherpa-onnx/kotlin-api/SpeakerEmbeddingExtractorConfig.kt
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/screens/Help.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/screens/Help.kt
new file mode 100644
index 00000000..b3640b9e
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/screens/Help.kt
@@ -0,0 +1,38 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization.screens
+
+import androidx.compose.foundation.layout.Box
+import androidx.compose.foundation.layout.Column
+import androidx.compose.foundation.layout.Spacer
+import androidx.compose.foundation.layout.fillMaxSize
+import androidx.compose.foundation.layout.height
+import androidx.compose.foundation.layout.padding
+import androidx.compose.material3.Text
+import androidx.compose.runtime.Composable
+import androidx.compose.ui.Modifier
+import androidx.compose.ui.unit.dp
+import androidx.compose.ui.unit.sp
+
+@Composable
+fun HelpScreen() {
+ Box(modifier = Modifier.fillMaxSize()) {
+ Column(
+ modifier = Modifier.padding(8.dp)
+ ) {
+ Text(
+ "This app accepts only 16kHz 16-bit 1-channel *.wav files. " +
+ "It has two arguments: Number of speakers and clustering threshold. " +
+ "If you know the actual number of speakers in the file, please set it. " +
+ "Otherwise, please set it to 0. In that case, you have to set the threshold. " +
+ "A larger threshold leads to fewer segmented speakers."
+ )
+ Spacer(modifier = Modifier.height(5.dp))
+ Text("The speaker segmentation model is from " +
+ "pyannote-audio (https://huggingface.co/pyannote/segmentation-3.0), "+
+ "whereas the embedding extractor model is from 3D-Speaker (https://github.com/modelscope/3D-Speaker)")
+ Spacer(modifier = Modifier.height(5.dp))
+ Text("Please see http://github.com/k2-fsa/sherpa-onnx ")
+ Spacer(modifier = Modifier.height(5.dp))
+ Text("Everything is open-sourced!", fontSize = 20.sp)
+ }
+ }
+}
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/screens/Home.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/screens/Home.kt
new file mode 100644
index 00000000..a5a9cd31
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/screens/Home.kt
@@ -0,0 +1,210 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization.screens
+
+import android.util.Log
+import androidx.activity.compose.rememberLauncherForActivityResult
+import androidx.activity.result.contract.ActivityResultContracts
+import androidx.compose.foundation.layout.Arrangement
+import androidx.compose.foundation.layout.Column
+import androidx.compose.foundation.layout.Row
+import androidx.compose.foundation.layout.Spacer
+import androidx.compose.foundation.layout.fillMaxWidth
+import androidx.compose.foundation.layout.padding
+import androidx.compose.foundation.layout.size
+import androidx.compose.foundation.rememberScrollState
+import androidx.compose.foundation.verticalScroll
+import androidx.compose.material3.Button
+import androidx.compose.material3.OutlinedTextField
+import androidx.compose.material3.Text
+import androidx.compose.runtime.Composable
+import androidx.compose.runtime.getValue
+import androidx.compose.runtime.mutableStateOf
+import androidx.compose.runtime.remember
+import androidx.compose.runtime.setValue
+import androidx.compose.ui.Alignment
+import androidx.compose.ui.Modifier
+import androidx.compose.ui.platform.LocalClipboardManager
+import androidx.compose.ui.platform.LocalContext
+import androidx.compose.ui.text.AnnotatedString
+import androidx.compose.ui.unit.dp
+import androidx.compose.ui.unit.sp
+import androidx.documentfile.provider.DocumentFile
+import com.k2fsa.sherpa.onnx.speaker.diarization.SpeakerDiarizationObject
+import com.k2fsa.sherpa.onnx.speaker.diarization.TAG
+import kotlin.concurrent.thread
+
+
+private var samples: FloatArray? = null
+
+@Composable
+fun HomeScreen() {
+ val context = LocalContext.current
+
+ var sampleRate: Int
+ var filename by remember { mutableStateOf("") }
+ var status by remember { mutableStateOf("") }
+ var progress by remember { mutableStateOf("") }
+ val clipboardManager = LocalClipboardManager.current
+ var done by remember { mutableStateOf(false) }
+ var fileIsOk by remember { mutableStateOf(false) }
+ var started by remember { mutableStateOf(false) }
+ var numSpeakers by remember { mutableStateOf(0) }
+ var threshold by remember { mutableStateOf(0.5f) }
+
+
+ val callback = here@{ numProcessedChunks: Int, numTotalChunks: Int, arg: Long ->
+ Int
+ val percent = 100.0 * numProcessedChunks / numTotalChunks
+ progress = "%.2f%%".format(percent)
+ Log.i(TAG, progress)
+ return@here 0
+ }
+
+ val launcher = rememberLauncherForActivityResult(ActivityResultContracts.OpenDocument()) {
+ it?.let {
+ val documentFile = DocumentFile.fromSingleUri(context, it)
+ filename = documentFile?.name ?: ""
+
+ progress = ""
+ done = false
+ fileIsOk = false
+
+ if (filename.isNotEmpty()) {
+ val data = readUri(context, it)
+ Log.i(TAG, "sample rate: ${data.sampleRate}")
+ Log.i(TAG, "numSamples: ${data.samples?.size ?: 0}")
+ if (data.msg != null) {
+ Log.i(TAG, "failed to read $filename")
+ status = data.msg
+ } else if (data.sampleRate != SpeakerDiarizationObject.sd.sampleRate()) {
+ status =
+ "Expected sample rate: ${SpeakerDiarizationObject.sd.sampleRate()}. Given wave file with sample rate: ${data.sampleRate}"
+ } else {
+ samples = data.samples!!
+ fileIsOk = true
+ }
+ }
+ }
+ }
+
+ Column(
+ modifier = Modifier.padding(10.dp),
+ verticalArrangement = Arrangement.Top,
+ ) {
+ Row(
+ modifier = Modifier.fillMaxWidth(),
+ horizontalArrangement = Arrangement.SpaceEvenly,
+ verticalAlignment = Alignment.CenterVertically
+ ) {
+
+ Button(onClick = {
+ launcher.launch(arrayOf("audio/*"))
+ }) {
+ Text("Select a .wav file")
+ }
+
+ Button(enabled = fileIsOk && !started,
+ onClick = {
+ Log.i(TAG, "started")
+ Log.i(TAG, "num samples: ${samples?.size}")
+ started = true
+ progress = ""
+
+ val config = SpeakerDiarizationObject.sd.config
+ config.clustering.numClusters = numSpeakers
+ config.clustering.threshold = threshold
+
+ SpeakerDiarizationObject.sd.setConfig(config)
+
+ thread(true) {
+ done = false
+ status = "Started! Please wait"
+ val segments = SpeakerDiarizationObject.sd.processWithCallback(
+ samples!!,
+ callback = callback,
+ )
+ done = true
+ started = false
+ status = ""
+ for (s in segments) {
+ val start = "%.2f".format(s.start)
+ val end = "%.2f".format(s.end)
+ val speaker = "speaker_%02d".format(s.speaker)
+ status += "$start -- $end $speaker\n"
+ Log.i(TAG, "$start -- $end $speaker")
+ }
+
+ Log.i(TAG, status)
+ }
+ }) {
+ Text("Start")
+ }
+ if (progress.isNotEmpty()) {
+ Text(progress, fontSize = 25.sp)
+ }
+ }
+
+ Row(
+ modifier = Modifier.fillMaxWidth(),
+ horizontalArrangement = Arrangement.SpaceEvenly,
+ verticalAlignment = Alignment.CenterVertically
+ ) {
+ OutlinedTextField(
+ value = numSpeakers.toString(),
+ onValueChange = {
+ if (it.isEmpty() || it.isBlank()) {
+ numSpeakers = 0
+ } else {
+ numSpeakers = it.toIntOrNull() ?: 0
+ }
+ },
+ label = {
+ Text("Number of Speakers")
+ },
+ )
+ }
+
+ Row(
+ modifier = Modifier.fillMaxWidth(),
+ horizontalArrangement = Arrangement.SpaceEvenly,
+ verticalAlignment = Alignment.CenterVertically
+ ) {
+ OutlinedTextField(
+ value = threshold.toString(),
+ onValueChange = {
+ if (it.isEmpty() || it.isBlank()) {
+ threshold = 0.5f
+ } else {
+ threshold = it.toFloatOrNull() ?: 0.5f
+ }
+ },
+ label = {
+ Text("Clustering threshold")
+ },
+ )
+ }
+
+ if (filename.isNotEmpty()) {
+ Text(text = "Selected $filename")
+ Spacer(Modifier.size(20.dp))
+ }
+
+ if (done) {
+ Button(onClick = {
+ clipboardManager.setText(AnnotatedString(status))
+ progress = "Copied!"
+ }) {
+ Text("Copy result")
+ }
+ Spacer(Modifier.size(20.dp))
+ }
+
+ if (status.isNotEmpty()) {
+ Text(
+ status,
+ modifier = Modifier.verticalScroll(rememberScrollState()),
+ )
+ }
+
+
+ }
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ui/theme/Color.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ui/theme/Color.kt
new file mode 100644
index 00000000..a96515d3
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ui/theme/Color.kt
@@ -0,0 +1,11 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization.ui.theme
+
+import androidx.compose.ui.graphics.Color
+
+val Purple80 = Color(0xFFD0BCFF)
+val PurpleGrey80 = Color(0xFFCCC2DC)
+val Pink80 = Color(0xFFEFB8C8)
+
+val Purple40 = Color(0xFF6650a4)
+val PurpleGrey40 = Color(0xFF625b71)
+val Pink40 = Color(0xFF7D5260)
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ui/theme/Theme.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ui/theme/Theme.kt
new file mode 100644
index 00000000..5dbbe7e5
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ui/theme/Theme.kt
@@ -0,0 +1,58 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization.ui.theme
+
+import android.app.Activity
+import android.os.Build
+import androidx.compose.foundation.isSystemInDarkTheme
+import androidx.compose.material3.MaterialTheme
+import androidx.compose.material3.darkColorScheme
+import androidx.compose.material3.dynamicDarkColorScheme
+import androidx.compose.material3.dynamicLightColorScheme
+import androidx.compose.material3.lightColorScheme
+import androidx.compose.runtime.Composable
+import androidx.compose.ui.platform.LocalContext
+
+private val DarkColorScheme = darkColorScheme(
+ primary = Purple80,
+ secondary = PurpleGrey80,
+ tertiary = Pink80
+)
+
+private val LightColorScheme = lightColorScheme(
+ primary = Purple40,
+ secondary = PurpleGrey40,
+ tertiary = Pink40
+
+ /* Other default colors to override
+ background = Color(0xFFFFFBFE),
+ surface = Color(0xFFFFFBFE),
+ onPrimary = Color.White,
+ onSecondary = Color.White,
+ onTertiary = Color.White,
+ onBackground = Color(0xFF1C1B1F),
+ onSurface = Color(0xFF1C1B1F),
+ */
+)
+
+@Composable
+fun SherpaOnnxSpeakerDiarizationTheme(
+ darkTheme: Boolean = isSystemInDarkTheme(),
+ // Dynamic color is available on Android 12+
+ dynamicColor: Boolean = true,
+ content: @Composable () -> Unit
+) {
+ val colorScheme = when {
+ dynamicColor && Build.VERSION.SDK_INT >= Build.VERSION_CODES.S -> {
+ val context = LocalContext.current
+ if (darkTheme) dynamicDarkColorScheme(context) else dynamicLightColorScheme(context)
+ }
+
+ darkTheme -> DarkColorScheme
+ else -> LightColorScheme
+ }
+
+ MaterialTheme(
+ colorScheme = colorScheme,
+ typography = Typography,
+ content = content
+ )
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ui/theme/Type.kt b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ui/theme/Type.kt
new file mode 100644
index 00000000..39a81b94
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/diarization/ui/theme/Type.kt
@@ -0,0 +1,34 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization.ui.theme
+
+import androidx.compose.material3.Typography
+import androidx.compose.ui.text.TextStyle
+import androidx.compose.ui.text.font.FontFamily
+import androidx.compose.ui.text.font.FontWeight
+import androidx.compose.ui.unit.sp
+
+// Set of Material typography styles to start with
+val Typography = Typography(
+ bodyLarge = TextStyle(
+ fontFamily = FontFamily.Default,
+ fontWeight = FontWeight.Normal,
+ fontSize = 16.sp,
+ lineHeight = 24.sp,
+ letterSpacing = 0.5.sp
+ )
+ /* Other default text styles to override
+ titleLarge = TextStyle(
+ fontFamily = FontFamily.Default,
+ fontWeight = FontWeight.Normal,
+ fontSize = 22.sp,
+ lineHeight = 28.sp,
+ letterSpacing = 0.sp
+ ),
+ labelSmall = TextStyle(
+ fontFamily = FontFamily.Default,
+ fontWeight = FontWeight.Medium,
+ fontSize = 11.sp,
+ lineHeight = 16.sp,
+ letterSpacing = 0.5.sp
+ )
+ */
+)
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/arm64-v8a/.gitkeep b/android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/arm64-v8a/.gitkeep
new file mode 100644
index 00000000..e69de29b
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/armeabi-v7a/.gitkeep b/android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/armeabi-v7a/.gitkeep
new file mode 100644
index 00000000..e69de29b
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/x86/.gitkeep b/android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/x86/.gitkeep
new file mode 100644
index 00000000..e69de29b
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/x86_64/.gitkeep b/android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/x86_64/.gitkeep
new file mode 100644
index 00000000..e69de29b
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/drawable-v24/ic_launcher_foreground.xml b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/drawable-v24/ic_launcher_foreground.xml
new file mode 100644
index 00000000..2b068d11
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/drawable-v24/ic_launcher_foreground.xml
@@ -0,0 +1,30 @@
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/drawable/ic_launcher_background.xml b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/drawable/ic_launcher_background.xml
new file mode 100644
index 00000000..07d5da9c
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/drawable/ic_launcher_background.xml
@@ -0,0 +1,170 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-anydpi-v26/ic_launcher.xml b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-anydpi-v26/ic_launcher.xml
new file mode 100644
index 00000000..6f3b755b
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-anydpi-v26/ic_launcher.xml
@@ -0,0 +1,6 @@
+
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml
new file mode 100644
index 00000000..6f3b755b
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml
@@ -0,0 +1,6 @@
+
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-hdpi/ic_launcher.webp b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-hdpi/ic_launcher.webp
new file mode 100644
index 00000000..c209e78e
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-hdpi/ic_launcher.webp differ
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-hdpi/ic_launcher_round.webp b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-hdpi/ic_launcher_round.webp
new file mode 100644
index 00000000..b2dfe3d1
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-hdpi/ic_launcher_round.webp differ
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-mdpi/ic_launcher.webp b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-mdpi/ic_launcher.webp
new file mode 100644
index 00000000..4f0f1d64
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-mdpi/ic_launcher.webp differ
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-mdpi/ic_launcher_round.webp b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-mdpi/ic_launcher_round.webp
new file mode 100644
index 00000000..62b611da
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-mdpi/ic_launcher_round.webp differ
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xhdpi/ic_launcher.webp b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xhdpi/ic_launcher.webp
new file mode 100644
index 00000000..948a3070
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xhdpi/ic_launcher.webp differ
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xhdpi/ic_launcher_round.webp b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xhdpi/ic_launcher_round.webp
new file mode 100644
index 00000000..1b9a6956
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xhdpi/ic_launcher_round.webp differ
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxhdpi/ic_launcher.webp b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxhdpi/ic_launcher.webp
new file mode 100644
index 00000000..28d4b77f
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxhdpi/ic_launcher.webp differ
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.webp b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.webp
new file mode 100644
index 00000000..9287f508
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.webp differ
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxxhdpi/ic_launcher.webp b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxxhdpi/ic_launcher.webp
new file mode 100644
index 00000000..aa7d6427
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxxhdpi/ic_launcher.webp differ
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.webp b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.webp
new file mode 100644
index 00000000..9126ae37
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.webp differ
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/values/colors.xml b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/values/colors.xml
new file mode 100644
index 00000000..f8c6127d
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/values/colors.xml
@@ -0,0 +1,10 @@
+
+
+ #FFBB86FC
+ #FF6200EE
+ #FF3700B3
+ #FF03DAC5
+ #FF018786
+ #FF000000
+ #FFFFFFFF
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/values/strings.xml b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/values/strings.xml
new file mode 100644
index 00000000..05f2df09
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/values/strings.xml
@@ -0,0 +1,3 @@
+
+ SherpaOnnxSpeakerDiarization
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/values/themes.xml b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/values/themes.xml
new file mode 100644
index 00000000..34d1d96e
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/values/themes.xml
@@ -0,0 +1,5 @@
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/xml/backup_rules.xml b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/xml/backup_rules.xml
new file mode 100644
index 00000000..fa0f996d
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/xml/backup_rules.xml
@@ -0,0 +1,13 @@
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/main/res/xml/data_extraction_rules.xml b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/xml/data_extraction_rules.xml
new file mode 100644
index 00000000..9ee9997b
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/main/res/xml/data_extraction_rules.xml
@@ -0,0 +1,19 @@
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/app/src/test/java/com/k2fsa/sherpa/onnx/speaker/diarization/ExampleUnitTest.kt b/android/SherpaOnnxSpeakerDiarization/app/src/test/java/com/k2fsa/sherpa/onnx/speaker/diarization/ExampleUnitTest.kt
new file mode 100644
index 00000000..5571dbb5
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/app/src/test/java/com/k2fsa/sherpa/onnx/speaker/diarization/ExampleUnitTest.kt
@@ -0,0 +1,17 @@
+package com.k2fsa.sherpa.onnx.speaker.diarization
+
+import org.junit.Test
+
+import org.junit.Assert.*
+
+/**
+ * Example local unit test, which will execute on the development machine (host).
+ *
+ * See [testing documentation](http://d.android.com/tools/testing).
+ */
+class ExampleUnitTest {
+ @Test
+ fun addition_isCorrect() {
+ assertEquals(4, 2 + 2)
+ }
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/build.gradle.kts b/android/SherpaOnnxSpeakerDiarization/build.gradle.kts
new file mode 100644
index 00000000..f74b04bf
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/build.gradle.kts
@@ -0,0 +1,5 @@
+// Top-level build file where you can add configuration options common to all sub-projects/modules.
+plugins {
+ alias(libs.plugins.android.application) apply false
+ alias(libs.plugins.jetbrains.kotlin.android) apply false
+}
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/gradle.properties b/android/SherpaOnnxSpeakerDiarization/gradle.properties
new file mode 100644
index 00000000..20e2a015
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/gradle.properties
@@ -0,0 +1,23 @@
+# Project-wide Gradle settings.
+# IDE (e.g. Android Studio) users:
+# Gradle settings configured through the IDE *will override*
+# any settings specified in this file.
+# For more details on how to configure your build environment visit
+# http://www.gradle.org/docs/current/userguide/build_environment.html
+# Specifies the JVM arguments used for the daemon process.
+# The setting is particularly useful for tweaking memory settings.
+org.gradle.jvmargs=-Xmx2048m -Dfile.encoding=UTF-8
+# When configured, Gradle will run in incubating parallel mode.
+# This option should only be used with decoupled projects. For more details, visit
+# https://developer.android.com/r/tools/gradle-multi-project-decoupled-projects
+# org.gradle.parallel=true
+# AndroidX package structure to make it clearer which packages are bundled with the
+# Android operating system, and which are packaged with your app's APK
+# https://developer.android.com/topic/libraries/support-library/androidx-rn
+android.useAndroidX=true
+# Kotlin code style for this project: "official" or "obsolete":
+kotlin.code.style=official
+# Enables namespacing of each library's R class so that its R class includes only the
+# resources declared in the library itself and none from the library's dependencies,
+# thereby reducing the size of the R class for that library
+android.nonTransitiveRClass=true
\ No newline at end of file
diff --git a/android/SherpaOnnxSpeakerDiarization/gradle/libs.versions.toml b/android/SherpaOnnxSpeakerDiarization/gradle/libs.versions.toml
new file mode 100644
index 00000000..fe93be92
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/gradle/libs.versions.toml
@@ -0,0 +1,35 @@
+[versions]
+agp = "8.4.0"
+kotlin = "1.9.0"
+coreKtx = "1.10.1"
+junit = "4.13.2"
+junitVersion = "1.1.5"
+espressoCore = "3.5.1"
+lifecycleRuntimeKtx = "2.6.1"
+activityCompose = "1.8.0"
+composeBom = "2023.08.00"
+navigationCompose = "2.8.2"
+documentfile = "1.0.1"
+
+[libraries]
+androidx-core-ktx = { group = "androidx.core", name = "core-ktx", version.ref = "coreKtx" }
+junit = { group = "junit", name = "junit", version.ref = "junit" }
+androidx-junit = { group = "androidx.test.ext", name = "junit", version.ref = "junitVersion" }
+androidx-espresso-core = { group = "androidx.test.espresso", name = "espresso-core", version.ref = "espressoCore" }
+androidx-lifecycle-runtime-ktx = { group = "androidx.lifecycle", name = "lifecycle-runtime-ktx", version.ref = "lifecycleRuntimeKtx" }
+androidx-activity-compose = { group = "androidx.activity", name = "activity-compose", version.ref = "activityCompose" }
+androidx-compose-bom = { group = "androidx.compose", name = "compose-bom", version.ref = "composeBom" }
+androidx-ui = { group = "androidx.compose.ui", name = "ui" }
+androidx-ui-graphics = { group = "androidx.compose.ui", name = "ui-graphics" }
+androidx-ui-tooling = { group = "androidx.compose.ui", name = "ui-tooling" }
+androidx-ui-tooling-preview = { group = "androidx.compose.ui", name = "ui-tooling-preview" }
+androidx-ui-test-manifest = { group = "androidx.compose.ui", name = "ui-test-manifest" }
+androidx-ui-test-junit4 = { group = "androidx.compose.ui", name = "ui-test-junit4" }
+androidx-material3 = { group = "androidx.compose.material3", name = "material3" }
+androidx-navigation-compose = { group = "androidx.navigation", name = "navigation-compose", version.ref = "navigationCompose" }
+androidx-documentfile = { group = "androidx.documentfile", name = "documentfile", version.ref = "documentfile" }
+
+[plugins]
+android-application = { id = "com.android.application", version.ref = "agp" }
+jetbrains-kotlin-android = { id = "org.jetbrains.kotlin.android", version.ref = "kotlin" }
+
diff --git a/android/SherpaOnnxSpeakerDiarization/gradle/wrapper/gradle-wrapper.jar b/android/SherpaOnnxSpeakerDiarization/gradle/wrapper/gradle-wrapper.jar
new file mode 100644
index 00000000..e708b1c0
Binary files /dev/null and b/android/SherpaOnnxSpeakerDiarization/gradle/wrapper/gradle-wrapper.jar differ
diff --git a/android/SherpaOnnxSpeakerDiarization/gradle/wrapper/gradle-wrapper.properties b/android/SherpaOnnxSpeakerDiarization/gradle/wrapper/gradle-wrapper.properties
new file mode 100644
index 00000000..a4669300
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/gradle/wrapper/gradle-wrapper.properties
@@ -0,0 +1,6 @@
+#Sat Oct 12 14:27:04 CST 2024
+distributionBase=GRADLE_USER_HOME
+distributionPath=wrapper/dists
+distributionUrl=https\://services.gradle.org/distributions/gradle-8.6-bin.zip
+zipStoreBase=GRADLE_USER_HOME
+zipStorePath=wrapper/dists
diff --git a/android/SherpaOnnxSpeakerDiarization/gradlew b/android/SherpaOnnxSpeakerDiarization/gradlew
new file mode 100755
index 00000000..4f906e0c
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/gradlew
@@ -0,0 +1,185 @@
+#!/usr/bin/env sh
+
+#
+# Copyright 2015 the original author or authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+##############################################################################
+##
+## Gradle start up script for UN*X
+##
+##############################################################################
+
+# Attempt to set APP_HOME
+# Resolve links: $0 may be a link
+PRG="$0"
+# Need this for relative symlinks.
+while [ -h "$PRG" ] ; do
+ ls=`ls -ld "$PRG"`
+ link=`expr "$ls" : '.*-> \(.*\)$'`
+ if expr "$link" : '/.*' > /dev/null; then
+ PRG="$link"
+ else
+ PRG=`dirname "$PRG"`"/$link"
+ fi
+done
+SAVED="`pwd`"
+cd "`dirname \"$PRG\"`/" >/dev/null
+APP_HOME="`pwd -P`"
+cd "$SAVED" >/dev/null
+
+APP_NAME="Gradle"
+APP_BASE_NAME=`basename "$0"`
+
+# Add default JVM options here. You can also use JAVA_OPTS and GRADLE_OPTS to pass JVM options to this script.
+DEFAULT_JVM_OPTS='"-Xmx64m" "-Xms64m"'
+
+# Use the maximum available, or set MAX_FD != -1 to use that value.
+MAX_FD="maximum"
+
+warn () {
+ echo "$*"
+}
+
+die () {
+ echo
+ echo "$*"
+ echo
+ exit 1
+}
+
+# OS specific support (must be 'true' or 'false').
+cygwin=false
+msys=false
+darwin=false
+nonstop=false
+case "`uname`" in
+ CYGWIN* )
+ cygwin=true
+ ;;
+ Darwin* )
+ darwin=true
+ ;;
+ MINGW* )
+ msys=true
+ ;;
+ NONSTOP* )
+ nonstop=true
+ ;;
+esac
+
+CLASSPATH=$APP_HOME/gradle/wrapper/gradle-wrapper.jar
+
+
+# Determine the Java command to use to start the JVM.
+if [ -n "$JAVA_HOME" ] ; then
+ if [ -x "$JAVA_HOME/jre/sh/java" ] ; then
+ # IBM's JDK on AIX uses strange locations for the executables
+ JAVACMD="$JAVA_HOME/jre/sh/java"
+ else
+ JAVACMD="$JAVA_HOME/bin/java"
+ fi
+ if [ ! -x "$JAVACMD" ] ; then
+ die "ERROR: JAVA_HOME is set to an invalid directory: $JAVA_HOME
+
+Please set the JAVA_HOME variable in your environment to match the
+location of your Java installation."
+ fi
+else
+ JAVACMD="java"
+ which java >/dev/null 2>&1 || die "ERROR: JAVA_HOME is not set and no 'java' command could be found in your PATH.
+
+Please set the JAVA_HOME variable in your environment to match the
+location of your Java installation."
+fi
+
+# Increase the maximum file descriptors if we can.
+if [ "$cygwin" = "false" -a "$darwin" = "false" -a "$nonstop" = "false" ] ; then
+ MAX_FD_LIMIT=`ulimit -H -n`
+ if [ $? -eq 0 ] ; then
+ if [ "$MAX_FD" = "maximum" -o "$MAX_FD" = "max" ] ; then
+ MAX_FD="$MAX_FD_LIMIT"
+ fi
+ ulimit -n $MAX_FD
+ if [ $? -ne 0 ] ; then
+ warn "Could not set maximum file descriptor limit: $MAX_FD"
+ fi
+ else
+ warn "Could not query maximum file descriptor limit: $MAX_FD_LIMIT"
+ fi
+fi
+
+# For Darwin, add options to specify how the application appears in the dock
+if $darwin; then
+ GRADLE_OPTS="$GRADLE_OPTS \"-Xdock:name=$APP_NAME\" \"-Xdock:icon=$APP_HOME/media/gradle.icns\""
+fi
+
+# For Cygwin or MSYS, switch paths to Windows format before running java
+if [ "$cygwin" = "true" -o "$msys" = "true" ] ; then
+ APP_HOME=`cygpath --path --mixed "$APP_HOME"`
+ CLASSPATH=`cygpath --path --mixed "$CLASSPATH"`
+
+ JAVACMD=`cygpath --unix "$JAVACMD"`
+
+ # We build the pattern for arguments to be converted via cygpath
+ ROOTDIRSRAW=`find -L / -maxdepth 1 -mindepth 1 -type d 2>/dev/null`
+ SEP=""
+ for dir in $ROOTDIRSRAW ; do
+ ROOTDIRS="$ROOTDIRS$SEP$dir"
+ SEP="|"
+ done
+ OURCYGPATTERN="(^($ROOTDIRS))"
+ # Add a user-defined pattern to the cygpath arguments
+ if [ "$GRADLE_CYGPATTERN" != "" ] ; then
+ OURCYGPATTERN="$OURCYGPATTERN|($GRADLE_CYGPATTERN)"
+ fi
+ # Now convert the arguments - kludge to limit ourselves to /bin/sh
+ i=0
+ for arg in "$@" ; do
+ CHECK=`echo "$arg"|egrep -c "$OURCYGPATTERN" -`
+ CHECK2=`echo "$arg"|egrep -c "^-"` ### Determine if an option
+
+ if [ $CHECK -ne 0 ] && [ $CHECK2 -eq 0 ] ; then ### Added a condition
+ eval `echo args$i`=`cygpath --path --ignore --mixed "$arg"`
+ else
+ eval `echo args$i`="\"$arg\""
+ fi
+ i=`expr $i + 1`
+ done
+ case $i in
+ 0) set -- ;;
+ 1) set -- "$args0" ;;
+ 2) set -- "$args0" "$args1" ;;
+ 3) set -- "$args0" "$args1" "$args2" ;;
+ 4) set -- "$args0" "$args1" "$args2" "$args3" ;;
+ 5) set -- "$args0" "$args1" "$args2" "$args3" "$args4" ;;
+ 6) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" ;;
+ 7) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" ;;
+ 8) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" "$args7" ;;
+ 9) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" "$args7" "$args8" ;;
+ esac
+fi
+
+# Escape application args
+save () {
+ for i do printf %s\\n "$i" | sed "s/'/'\\\\''/g;1s/^/'/;\$s/\$/' \\\\/" ; done
+ echo " "
+}
+APP_ARGS=`save "$@"`
+
+# Collect all arguments for the java command, following the shell quoting and substitution rules
+eval set -- $DEFAULT_JVM_OPTS $JAVA_OPTS $GRADLE_OPTS "\"-Dorg.gradle.appname=$APP_BASE_NAME\"" -classpath "\"$CLASSPATH\"" org.gradle.wrapper.GradleWrapperMain "$APP_ARGS"
+
+exec "$JAVACMD" "$@"
diff --git a/android/SherpaOnnxSpeakerDiarization/gradlew.bat b/android/SherpaOnnxSpeakerDiarization/gradlew.bat
new file mode 100644
index 00000000..ac1b06f9
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/gradlew.bat
@@ -0,0 +1,89 @@
+@rem
+@rem Copyright 2015 the original author or authors.
+@rem
+@rem Licensed under the Apache License, Version 2.0 (the "License");
+@rem you may not use this file except in compliance with the License.
+@rem You may obtain a copy of the License at
+@rem
+@rem https://www.apache.org/licenses/LICENSE-2.0
+@rem
+@rem Unless required by applicable law or agreed to in writing, software
+@rem distributed under the License is distributed on an "AS IS" BASIS,
+@rem WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+@rem See the License for the specific language governing permissions and
+@rem limitations under the License.
+@rem
+
+@if "%DEBUG%" == "" @echo off
+@rem ##########################################################################
+@rem
+@rem Gradle startup script for Windows
+@rem
+@rem ##########################################################################
+
+@rem Set local scope for the variables with windows NT shell
+if "%OS%"=="Windows_NT" setlocal
+
+set DIRNAME=%~dp0
+if "%DIRNAME%" == "" set DIRNAME=.
+set APP_BASE_NAME=%~n0
+set APP_HOME=%DIRNAME%
+
+@rem Resolve any "." and ".." in APP_HOME to make it shorter.
+for %%i in ("%APP_HOME%") do set APP_HOME=%%~fi
+
+@rem Add default JVM options here. You can also use JAVA_OPTS and GRADLE_OPTS to pass JVM options to this script.
+set DEFAULT_JVM_OPTS="-Xmx64m" "-Xms64m"
+
+@rem Find java.exe
+if defined JAVA_HOME goto findJavaFromJavaHome
+
+set JAVA_EXE=java.exe
+%JAVA_EXE% -version >NUL 2>&1
+if "%ERRORLEVEL%" == "0" goto execute
+
+echo.
+echo ERROR: JAVA_HOME is not set and no 'java' command could be found in your PATH.
+echo.
+echo Please set the JAVA_HOME variable in your environment to match the
+echo location of your Java installation.
+
+goto fail
+
+:findJavaFromJavaHome
+set JAVA_HOME=%JAVA_HOME:"=%
+set JAVA_EXE=%JAVA_HOME%/bin/java.exe
+
+if exist "%JAVA_EXE%" goto execute
+
+echo.
+echo ERROR: JAVA_HOME is set to an invalid directory: %JAVA_HOME%
+echo.
+echo Please set the JAVA_HOME variable in your environment to match the
+echo location of your Java installation.
+
+goto fail
+
+:execute
+@rem Setup the command line
+
+set CLASSPATH=%APP_HOME%\gradle\wrapper\gradle-wrapper.jar
+
+
+@rem Execute Gradle
+"%JAVA_EXE%" %DEFAULT_JVM_OPTS% %JAVA_OPTS% %GRADLE_OPTS% "-Dorg.gradle.appname=%APP_BASE_NAME%" -classpath "%CLASSPATH%" org.gradle.wrapper.GradleWrapperMain %*
+
+:end
+@rem End local scope for the variables with windows NT shell
+if "%ERRORLEVEL%"=="0" goto mainEnd
+
+:fail
+rem Set variable GRADLE_EXIT_CONSOLE if you need the _script_ return code instead of
+rem the _cmd.exe /c_ return code!
+if not "" == "%GRADLE_EXIT_CONSOLE%" exit 1
+exit /b 1
+
+:mainEnd
+if "%OS%"=="Windows_NT" endlocal
+
+:omega
diff --git a/android/SherpaOnnxSpeakerDiarization/settings.gradle.kts b/android/SherpaOnnxSpeakerDiarization/settings.gradle.kts
new file mode 100644
index 00000000..7226b549
--- /dev/null
+++ b/android/SherpaOnnxSpeakerDiarization/settings.gradle.kts
@@ -0,0 +1,23 @@
+pluginManagement {
+ repositories {
+ google {
+ content {
+ includeGroupByRegex("com\\.android.*")
+ includeGroupByRegex("com\\.google.*")
+ includeGroupByRegex("androidx.*")
+ }
+ }
+ mavenCentral()
+ gradlePluginPortal()
+ }
+}
+dependencyResolutionManagement {
+ repositoriesMode.set(RepositoriesMode.FAIL_ON_PROJECT_REPOS)
+ repositories {
+ google()
+ mavenCentral()
+ }
+}
+
+rootProject.name = "SherpaOnnxSpeakerDiarization"
+include(":app")
diff --git a/android/SherpaOnnxSpeakerIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/identification/SpeakerEmbeddingExtractorConfig.kt b/android/SherpaOnnxSpeakerIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/identification/SpeakerEmbeddingExtractorConfig.kt
new file mode 120000
index 00000000..9bab8fe8
--- /dev/null
+++ b/android/SherpaOnnxSpeakerIdentification/app/src/main/java/com/k2fsa/sherpa/onnx/speaker/identification/SpeakerEmbeddingExtractorConfig.kt
@@ -0,0 +1 @@
+../../../../../../../../../../../../sherpa-onnx/kotlin-api/SpeakerEmbeddingExtractorConfig.kt
\ No newline at end of file
diff --git a/kotlin-api-examples/SpeakerEmbeddingExtractorConfig.kt b/kotlin-api-examples/SpeakerEmbeddingExtractorConfig.kt
new file mode 120000
index 00000000..57faadba
--- /dev/null
+++ b/kotlin-api-examples/SpeakerEmbeddingExtractorConfig.kt
@@ -0,0 +1 @@
+../sherpa-onnx/kotlin-api/SpeakerEmbeddingExtractorConfig.kt
\ No newline at end of file
diff --git a/kotlin-api-examples/run.sh b/kotlin-api-examples/run.sh
index 50e7816f..a2adab41 100755
--- a/kotlin-api-examples/run.sh
+++ b/kotlin-api-examples/run.sh
@@ -48,6 +48,7 @@ function testSpeakerEmbeddingExtractor() {
test_speaker_id.kt \
OnlineStream.kt \
Speaker.kt \
+ SpeakerEmbeddingExtractorConfig.kt \
WaveReader.kt \
faked-asset-manager.kt \
faked-log.kt
@@ -305,6 +306,7 @@ function testOfflineSpeakerDiarization() {
test_offline_speaker_diarization.kt \
OfflineSpeakerDiarization.kt \
Speaker.kt \
+ SpeakerEmbeddingExtractorConfig.kt \
OnlineStream.kt \
WaveReader.kt \
faked-asset-manager.kt \
diff --git a/scripts/apk/build-apk-speaker-diarization.sh b/scripts/apk/build-apk-speaker-diarization.sh
new file mode 100755
index 00000000..04e294c6
--- /dev/null
+++ b/scripts/apk/build-apk-speaker-diarization.sh
@@ -0,0 +1,73 @@
+#!/usr/bin/env bash
+#
+# Please set the environment variable ANDROID_NDK
+# before running this script
+
+# Inside the $ANDROID_NDK directory, you can find a binary ndk-build
+# and some other files like the file "build/cmake/android.toolchain.cmake"
+
+set -ex
+
+log() {
+ # This function is from espnet
+ local fname=${BASH_SOURCE[1]##*/}
+ echo -e "$(date '+%Y-%m-%d %H:%M:%S') (${fname}:${BASH_LINENO[0]}:${FUNCNAME[1]}) $*"
+}
+
+SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" ./CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
+
+log "Building Speaker identification APK for sherpa-onnx v${SHERPA_ONNX_VERSION}"
+
+export SHERPA_ONNX_ENABLE_TTS=OFF
+
+log "====================arm64-v8a================="
+./build-android-arm64-v8a.sh
+log "====================armv7-eabi================"
+./build-android-armv7-eabi.sh
+log "====================x86-64===================="
+./build-android-x86-64.sh
+log "====================x86===================="
+./build-android-x86.sh
+
+mkdir -p apks
+
+pushd ./android/SherpaOnnxSpeakerDiarization/app/src/main/assets/
+
+curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/speaker-segmentation-models/sherpa-onnx-pyannote-segmentation-3-0.tar.bz2
+tar xvf sherpa-onnx-pyannote-segmentation-3-0.tar.bz2
+rm sherpa-onnx-pyannote-segmentation-3-0.tar.bz2
+mv sherpa-onnx-pyannote-segmentation-3-0/model.onnx segmentation.onnx
+rm -rf sherpa-onnx-pyannote-segmentation-3-0
+
+curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/speaker-recongition-models/3dspeaker_speech_eres2net_base_sv_zh-cn_3dspeaker_16k.onnx
+
+echo "pwd: $PWD"
+ls -lh
+
+popd
+
+for arch in arm64-v8a armeabi-v7a x86_64 x86; do
+ log "------------------------------------------------------------"
+ log "build speaker diarization apk for $arch"
+ log "------------------------------------------------------------"
+ src_arch=$arch
+ if [ $arch == "armeabi-v7a" ]; then
+ src_arch=armv7-eabi
+ elif [ $arch == "x86_64" ]; then
+ src_arch=x86-64
+ fi
+
+ ls -lh ./build-android-$src_arch/install/lib/*.so
+
+ cp -v ./build-android-$src_arch/install/lib/*.so ./android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/$arch/
+
+ pushd ./android/SherpaOnnxSpeakerDiarization
+ ./gradlew build
+ popd
+
+ mv android/SherpaOnnxSpeakerDiarization/app/build/outputs/apk/debug/app-debug.apk ./apks/sherpa-onnx-${SHERPA_ONNX_VERSION}-$arch-speaker-diarization-pyannote_audio-3dspeaker.apk
+ ls -lh apks
+ rm -v ./android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/$arch/*.so
+done
+
+ls -lh apks
diff --git a/sherpa-onnx/kotlin-api/OfflineSpeakerDiarization.kt b/sherpa-onnx/kotlin-api/OfflineSpeakerDiarization.kt
index de0a9dff..9190f8ae 100644
--- a/sherpa-onnx/kotlin-api/OfflineSpeakerDiarization.kt
+++ b/sherpa-onnx/kotlin-api/OfflineSpeakerDiarization.kt
@@ -34,7 +34,7 @@ data class OfflineSpeakerDiarizationSegment(
class OfflineSpeakerDiarization(
assetManager: AssetManager? = null,
- config: OfflineSpeakerDiarizationConfig,
+ val config: OfflineSpeakerDiarizationConfig,
) {
private var ptr: Long
@@ -64,7 +64,7 @@ class OfflineSpeakerDiarization(
fun process(samples: FloatArray) = process(ptr, samples)
fun processWithCallback(
- samples: FloatArray,
+ samples: FloatArray,
callback: (numProcessedChunks: Int, numTotalChunks: Int, arg: Long) -> Int,
arg: Long = 0,
) = processWithCallback(ptr, samples, callback, arg)
@@ -84,14 +84,17 @@ class OfflineSpeakerDiarization(
private external fun getSampleRate(ptr: Long): Int
- private external fun process(ptr: Long, samples: FloatArray): Array
+ private external fun process(
+ ptr: Long,
+ samples: FloatArray
+ ): Array
private external fun processWithCallback(
ptr: Long,
samples: FloatArray,
callback: (numProcessedChunks: Int, numTotalChunks: Int, arg: Long) -> Int,
arg: Long,
- ): Array
+ ): Array
companion object {
init {
diff --git a/sherpa-onnx/kotlin-api/Speaker.kt b/sherpa-onnx/kotlin-api/Speaker.kt
index 93b1b9e4..e148bba6 100644
--- a/sherpa-onnx/kotlin-api/Speaker.kt
+++ b/sherpa-onnx/kotlin-api/Speaker.kt
@@ -3,13 +3,6 @@ package com.k2fsa.sherpa.onnx
import android.content.res.AssetManager
import android.util.Log
-data class SpeakerEmbeddingExtractorConfig(
- val model: String,
- var numThreads: Int = 1,
- var debug: Boolean = false,
- var provider: String = "cpu",
-)
-
class SpeakerEmbeddingExtractor(
assetManager: AssetManager? = null,
config: SpeakerEmbeddingExtractorConfig,
diff --git a/sherpa-onnx/kotlin-api/SpeakerEmbeddingExtractorConfig.kt b/sherpa-onnx/kotlin-api/SpeakerEmbeddingExtractorConfig.kt
new file mode 100644
index 00000000..4977ac02
--- /dev/null
+++ b/sherpa-onnx/kotlin-api/SpeakerEmbeddingExtractorConfig.kt
@@ -0,0 +1,8 @@
+package com.k2fsa.sherpa.onnx
+
+data class SpeakerEmbeddingExtractorConfig(
+ val model: String,
+ var numThreads: Int = 1,
+ var debug: Boolean = false,
+ var provider: String = "cpu",
+)