Android demo for speaker diarization (#1423)
175
.github/workflows/apk-speaker-diarization.yaml
vendored
Normal file
@@ -0,0 +1,175 @@
|
|||||||
|
# Builds, signs and publishes the Android speaker diarization demo APKs.
name: apk-speaker-diarization

on:
  push:
    branches:
      - apk
      - android-demo-speaker-diarization-2

  workflow_dispatch:

# Only one run per ref; a newer push cancels the run in progress.
concurrency:
  group: apk-speaker-diarization-${{ github.ref }}
  cancel-in-progress: true

permissions:
  contents: write

jobs:
  apk_speaker_diarization:
    if: github.repository_owner == 'csukuangfj' || github.repository_owner == 'k2-fsa'
    runs-on: ${{ matrix.os }}
    name: apk for speaker diarization ${{ matrix.index }}/${{ matrix.total }}
    strategy:
      fail-fast: false
      matrix:
        os: [ubuntu-latest]
        total: ["1"]
        index: ["0"]

    steps:
      - uses: actions/checkout@v4
        with:
          fetch-depth: 0

      # https://github.com/actions/setup-java
      - uses: actions/setup-java@v4
        with:
          distribution: 'temurin' # See 'Supported distributions' for available options
          java-version: '21'

      - name: ccache
        uses: hendrikmuhs/ccache-action@v1.2
        with:
          key: ${{ matrix.os }}-android

      - name: Display NDK HOME
        shell: bash
        run: |
          echo "ANDROID_NDK_LATEST_HOME: ${ANDROID_NDK_LATEST_HOME}"
          ls -lh ${ANDROID_NDK_LATEST_HOME}

      - name: Install Python dependencies
        shell: bash
        run: |
          python3 -m pip install --upgrade pip jinja2

      # Exports BUILD_TOOL_VERSION, which the signing step consumes below.
      - name: Setup build tool version variable
        shell: bash
        run: |
          echo "---"
          ls -lh /usr/local/lib/android/
          echo "---"

          ls -lh /usr/local/lib/android/sdk
          echo "---"

          ls -lh /usr/local/lib/android/sdk/build-tools
          echo "---"

          # Use a version-aware sort so that the newest release is selected
          # even when a plain lexical ordering would rank it lower.
          BUILD_TOOL_VERSION=$(ls /usr/local/lib/android/sdk/build-tools/ | sort -V | tail -n 1)
          echo "BUILD_TOOL_VERSION=$BUILD_TOOL_VERSION" >> $GITHUB_ENV
          echo "Last build tool version is: $BUILD_TOOL_VERSION"

      # Moves the build script from scripts/apk to the repository root.
      - name: Generate build script
        shell: bash
        run: |
          cd scripts/apk

          chmod +x build-apk-speaker-diarization.sh
          mv -v ./build-apk-speaker-diarization.sh ../..

      - name: build APK
        shell: bash
        run: |
          export CMAKE_CXX_COMPILER_LAUNCHER=ccache
          export PATH="/usr/lib/ccache:/usr/local/opt/ccache/libexec:$PATH"
          cmake --version

          export ANDROID_NDK=$ANDROID_NDK_LATEST_HOME
          ./build-apk-speaker-diarization.sh

      - name: Display APK
        shell: bash
        run: |
          ls -lh ./apks/
          du -h -d1 .

      # https://github.com/marketplace/actions/sign-android-release
      - uses: r0adkll/sign-android-release@v1
        name: Sign app APK
        with:
          releaseDirectory: ./apks
          signingKeyBase64: ${{ secrets.ANDROID_SIGNING_KEY }}
          alias: ${{ secrets.ANDROID_SIGNING_KEY_ALIAS }}
          keyStorePassword: ${{ secrets.ANDROID_SIGNING_KEY_STORE_PASSWORD }}
        env:
          BUILD_TOOLS_VERSION: ${{ env.BUILD_TOOL_VERSION }}

      - name: Display APK after signing
        shell: bash
        run: |
          ls -lh ./apks/
          du -h -d1 .

      # Removes signing by-products and strips the "-signed" suffix from the APK names.
      - name: Rename APK after signing
        shell: bash
        run: |
          cd apks
          rm -fv signingKey.jks
          rm -fv *.apk.idsig
          rm -fv *-aligned.apk

          all_apks=$(ls -1 *-signed.apk)
          echo "----"
          echo $all_apks
          echo "----"
          for apk in ${all_apks[@]}; do
            n=$(echo $apk | sed -e s/-signed//)
            mv -v $apk $n
          done

          cd ..

          ls -lh ./apks/
          du -h -d1 .

      - name: Display APK after rename
        shell: bash
        run: |
          ls -lh ./apks/
          du -h -d1 .

      # Copies the APKs into speaker-diarization/<version>/ of the Hugging Face repo.
      # The whole command is retried from a fresh clone on failure.
      - name: Publish to huggingface
        env:
          HF_TOKEN: ${{ secrets.HF_TOKEN }}
        uses: nick-fields/retry@v3
        with:
          max_attempts: 20
          timeout_seconds: 200
          shell: bash
          command: |
            git config --global user.email "csukuangfj@gmail.com"
            git config --global user.name "Fangjun Kuang"

            rm -rf huggingface
            export GIT_LFS_SKIP_SMUDGE=1
            export GIT_CLONE_PROTECTION_ACTIVE=false

            SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" ./CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
            echo "SHERPA_ONNX_VERSION $SHERPA_ONNX_VERSION"

            git clone https://huggingface.co/csukuangfj/sherpa-onnx-apk huggingface
            cd huggingface
            git fetch
            git pull
            git merge -m "merge remote" --ff origin main

            d=speaker-diarization/$SHERPA_ONNX_VERSION
            mkdir -p $d/
            cp -v ../apks/*.apk $d/
            git status
            git lfs track "*.apk"
            git add .
            git commit -m "add more apks"
            git push https://csukuangfj:$HF_TOKEN@huggingface.co/csukuangfj/sherpa-onnx-apk main
|
||||||
@@ -53,6 +53,23 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
python3 -m pip install --upgrade pip jinja2
|
python3 -m pip install --upgrade pip jinja2
|
||||||
|
|
||||||
|
- name: Setup build tool version variable
|
||||||
|
shell: bash
|
||||||
|
run: |
|
||||||
|
echo "---"
|
||||||
|
ls -lh /usr/local/lib/android/
|
||||||
|
echo "---"
|
||||||
|
|
||||||
|
ls -lh /usr/local/lib/android/sdk
|
||||||
|
echo "---"
|
||||||
|
|
||||||
|
ls -lh /usr/local/lib/android/sdk/build-tools
|
||||||
|
echo "---"
|
||||||
|
|
||||||
|
BUILD_TOOL_VERSION=$(ls /usr/local/lib/android/sdk/build-tools/ | tail -n 1)
|
||||||
|
echo "BUILD_TOOL_VERSION=$BUILD_TOOL_VERSION" >> $GITHUB_ENV
|
||||||
|
echo "Last build tool version is: $BUILD_TOOL_VERSION"
|
||||||
|
|
||||||
- name: Generate build script
|
- name: Generate build script
|
||||||
shell: bash
|
shell: bash
|
||||||
run: |
|
run: |
|
||||||
@@ -82,6 +99,51 @@ jobs:
|
|||||||
ls -lh ./apks/
|
ls -lh ./apks/
|
||||||
du -h -d1 .
|
du -h -d1 .
|
||||||
|
|
||||||
|
# https://github.com/marketplace/actions/sign-android-release
|
||||||
|
- uses: r0adkll/sign-android-release@v1
|
||||||
|
name: Sign app APK
|
||||||
|
with:
|
||||||
|
releaseDirectory: ./apks
|
||||||
|
signingKeyBase64: ${{ secrets.ANDROID_SIGNING_KEY }}
|
||||||
|
alias: ${{ secrets.ANDROID_SIGNING_KEY_ALIAS }}
|
||||||
|
keyStorePassword: ${{ secrets.ANDROID_SIGNING_KEY_STORE_PASSWORD }}
|
||||||
|
env:
|
||||||
|
BUILD_TOOLS_VERSION: ${{ env.BUILD_TOOL_VERSION }}
|
||||||
|
|
||||||
|
- name: Display APK after signing
|
||||||
|
shell: bash
|
||||||
|
run: |
|
||||||
|
ls -lh ./apks/
|
||||||
|
du -h -d1 .
|
||||||
|
|
||||||
|
- name: Rename APK after signing
|
||||||
|
shell: bash
|
||||||
|
run: |
|
||||||
|
cd apks
|
||||||
|
rm -fv signingKey.jks
|
||||||
|
rm -fv *.apk.idsig
|
||||||
|
rm -fv *-aligned.apk
|
||||||
|
|
||||||
|
all_apks=$(ls -1 *-signed.apk)
|
||||||
|
echo "----"
|
||||||
|
echo $all_apks
|
||||||
|
echo "----"
|
||||||
|
for apk in ${all_apks[@]}; do
|
||||||
|
n=$(echo $apk | sed -e s/-signed//)
|
||||||
|
mv -v $apk $n
|
||||||
|
done
|
||||||
|
|
||||||
|
cd ..
|
||||||
|
|
||||||
|
ls -lh ./apks/
|
||||||
|
du -h -d1 .
|
||||||
|
|
||||||
|
- name: Display APK after rename
|
||||||
|
shell: bash
|
||||||
|
run: |
|
||||||
|
ls -lh ./apks/
|
||||||
|
du -h -d1 .
|
||||||
|
|
||||||
- name: Publish to huggingface
|
- name: Publish to huggingface
|
||||||
env:
|
env:
|
||||||
HF_TOKEN: ${{ secrets.HF_TOKEN }}
|
HF_TOKEN: ${{ secrets.HF_TOKEN }}
|
||||||
|
|||||||
2
.github/workflows/apk-vad.yaml
vendored
@@ -166,7 +166,7 @@ jobs:
|
|||||||
git pull
|
git pull
|
||||||
git merge -m "merge remote" --ff origin main
|
git merge -m "merge remote" --ff origin main
|
||||||
|
|
||||||
d=vad/SHERPA_ONNX_VERSION
|
d=vad/$SHERPA_ONNX_VERSION
|
||||||
mkdir -p $d
|
mkdir -p $d
|
||||||
cp -v ../apks/*.apk $d/
|
cp -v ../apks/*.apk $d/
|
||||||
git status
|
git status
|
||||||
|
|||||||
51
README.md
@@ -84,8 +84,9 @@ with the following APIs
|
|||||||
|
|
||||||
### Links for Huggingface Spaces
|
### Links for Huggingface Spaces
|
||||||
|
|
||||||
You can visit the following Huggingface spaces to try `sherpa-onnx` without
|
<details>
|
||||||
installing anything. All you need is a browser.
|
<summary>You can visit the following Huggingface spaces to try sherpa-onnx without
|
||||||
|
installing anything. All you need is a browser.</summary>
|
||||||
|
|
||||||
| Description | URL |
|
| Description | URL |
|
||||||
|-------------------------------------------------------|------------------------------------|
|
|-------------------------------------------------------|------------------------------------|
|
||||||
@@ -118,23 +119,34 @@ We also have spaces built using WebAssembly. They are listed below:
|
|||||||
|Speech synthesis (German) |[Click me][wasm-hf-tts-piper-de]| [地址][wasm-ms-tts-piper-de]|
|
|Speech synthesis (German) |[Click me][wasm-hf-tts-piper-de]| [地址][wasm-ms-tts-piper-de]|
|
||||||
|Speaker diarization |[Click me][wasm-hf-speaker-diarization]|[地址][wasm-ms-speaker-diarization]|
|
|Speaker diarization |[Click me][wasm-hf-speaker-diarization]|[地址][wasm-ms-speaker-diarization]|
|
||||||
|
|
||||||
|
</details>
|
||||||
|
|
||||||
### Links for pre-built Android APKs
|
### Links for pre-built Android APKs
|
||||||
|
|
||||||
| Description | URL | 中国用户 |
|
<details>
|
||||||
|----------------------------------------|------------------------------|-----------------------------|
|
|
||||||
| Streaming speech recognition | [Address][apk-streaming-asr] | [点此][apk-streaming-asr-cn]|
|
<summary>You can find pre-built Android APKs for this repository in the following table</summary>
|
||||||
| Text-to-speech | [Address][apk-tts] | [点此][apk-tts-cn] |
|
|
||||||
| Voice activity detection (VAD) | [Address][apk-vad] | [点此][apk-vad-cn] |
|
| Description | URL | 中国用户 |
|
||||||
| VAD + non-streaming speech recognition | [Address][apk-vad-asr] | [点此][apk-vad-asr-cn] |
|
|----------------------------------------|------------------------------------|-----------------------------------|
|
||||||
| Two-pass speech recognition | [Address][apk-2pass] | [点此][apk-2pass-cn] |
|
| Speaker diarization | [Address][apk-speaker-diarization] | [点此][apk-speaker-diarization-cn]|
|
||||||
| Audio tagging | [Address][apk-at] | [点此][apk-at-cn] |
|
| Streaming speech recognition | [Address][apk-streaming-asr] | [点此][apk-streaming-asr-cn] |
|
||||||
| Audio tagging (WearOS) | [Address][apk-at-wearos] | [点此][apk-at-wearos-cn] |
|
| Text-to-speech | [Address][apk-tts] | [点此][apk-tts-cn] |
|
||||||
| Speaker identification | [Address][apk-sid] | [点此][apk-sid-cn] |
|
| Voice activity detection (VAD) | [Address][apk-vad] | [点此][apk-vad-cn] |
|
||||||
| Spoken language identification | [Address][apk-slid] | [点此][apk-slid-cn] |
|
| VAD + non-streaming speech recognition | [Address][apk-vad-asr] | [点此][apk-vad-asr-cn] |
|
||||||
| Keyword spotting | [Address][apk-kws] | [点此][apk-kws-cn] |
|
| Two-pass speech recognition | [Address][apk-2pass] | [点此][apk-2pass-cn] |
|
||||||
|
| Audio tagging | [Address][apk-at] | [点此][apk-at-cn] |
|
||||||
|
| Audio tagging (WearOS) | [Address][apk-at-wearos] | [点此][apk-at-wearos-cn] |
|
||||||
|
| Speaker identification | [Address][apk-sid] | [点此][apk-sid-cn] |
|
||||||
|
| Spoken language identification | [Address][apk-slid] | [点此][apk-slid-cn] |
|
||||||
|
| Keyword spotting | [Address][apk-kws] | [点此][apk-kws-cn] |
|
||||||
|
|
||||||
|
</details>
|
||||||
|
|
||||||
### Links for pre-built Flutter APPs
|
### Links for pre-built Flutter APPs
|
||||||
|
|
||||||
|
<details>
|
||||||
|
|
||||||
#### Real-time speech recognition
|
#### Real-time speech recognition
|
||||||
|
|
||||||
| Description | URL | 中国用户 |
|
| Description | URL | 中国用户 |
|
||||||
@@ -153,17 +165,24 @@ We also have spaces built using WebAssembly. They are listed below:
|
|||||||
|
|
||||||
> Note: You need to build from source for iOS.
|
> Note: You need to build from source for iOS.
|
||||||
|
|
||||||
|
</details>
|
||||||
|
|
||||||
### Links for pre-built Lazarus APPs
|
### Links for pre-built Lazarus APPs
|
||||||
|
|
||||||
|
<details>
|
||||||
|
|
||||||
#### Generating subtitles
|
#### Generating subtitles
|
||||||
|
|
||||||
| Description | URL | 中国用户 |
|
| Description | URL | 中国用户 |
|
||||||
|--------------------------------|----------------------------|----------------------------|
|
|--------------------------------|----------------------------|----------------------------|
|
||||||
| Generate subtitles (生成字幕) | [Address][lazarus-subtitle]| [点此][lazarus-subtitle-cn]|
|
| Generate subtitles (生成字幕) | [Address][lazarus-subtitle]| [点此][lazarus-subtitle-cn]|
|
||||||
|
|
||||||
|
</details>
|
||||||
|
|
||||||
### Links for pre-trained models
|
### Links for pre-trained models
|
||||||
|
|
||||||
|
<details>
|
||||||
|
|
||||||
| Description | URL |
|
| Description | URL |
|
||||||
|---------------------------------------------|---------------------------------------------------------------------------------------|
|
|---------------------------------------------|---------------------------------------------------------------------------------------|
|
||||||
| Speech recognition (speech to text, ASR) | [Address][asr-models] |
|
| Speech recognition (speech to text, ASR) | [Address][asr-models] |
|
||||||
@@ -176,6 +195,8 @@ We also have spaces built using WebAssembly. They are listed below:
|
|||||||
| Punctuation | [Address][punct-models] |
|
| Punctuation | [Address][punct-models] |
|
||||||
| Speaker segmentation | [Address][speaker-segmentation-models] |
|
| Speaker segmentation | [Address][speaker-segmentation-models] |
|
||||||
|
|
||||||
|
</details>
|
||||||
|
|
||||||
### Useful links
|
### Useful links
|
||||||
|
|
||||||
- Documentation: https://k2-fsa.github.io/sherpa/onnx/
|
- Documentation: https://k2-fsa.github.io/sherpa/onnx/
|
||||||
@@ -265,6 +286,8 @@ Video demo in Chinese: [爆了!炫神教你开打字挂!真正影响胜率
|
|||||||
[wasm-ms-tts-piper-de]: https://modelscope.cn/studios/k2-fsa/web-assembly-tts-sherpa-onnx-de
|
[wasm-ms-tts-piper-de]: https://modelscope.cn/studios/k2-fsa/web-assembly-tts-sherpa-onnx-de
|
||||||
[wasm-hf-speaker-diarization]: https://huggingface.co/spaces/k2-fsa/web-assembly-speaker-diarization-sherpa-onnx
|
[wasm-hf-speaker-diarization]: https://huggingface.co/spaces/k2-fsa/web-assembly-speaker-diarization-sherpa-onnx
|
||||||
[wasm-ms-speaker-diarization]: https://www.modelscope.cn/studios/csukuangfj/web-assembly-speaker-diarization-sherpa-onnx
|
[wasm-ms-speaker-diarization]: https://www.modelscope.cn/studios/csukuangfj/web-assembly-speaker-diarization-sherpa-onnx
|
||||||
|
[apk-speaker-diarization]: https://k2-fsa.github.io/sherpa/onnx/speaker-diarization/apk.html
|
||||||
|
[apk-speaker-diarization-cn]: https://k2-fsa.github.io/sherpa/onnx/speaker-diarization/apk-cn.html
|
||||||
[apk-streaming-asr]: https://k2-fsa.github.io/sherpa/onnx/android/apk.html
|
[apk-streaming-asr]: https://k2-fsa.github.io/sherpa/onnx/android/apk.html
|
||||||
[apk-streaming-asr-cn]: https://k2-fsa.github.io/sherpa/onnx/android/apk-cn.html
|
[apk-streaming-asr-cn]: https://k2-fsa.github.io/sherpa/onnx/android/apk-cn.html
|
||||||
[apk-tts]: https://k2-fsa.github.io/sherpa/onnx/tts/apk-engine.html
|
[apk-tts]: https://k2-fsa.github.io/sherpa/onnx/tts/apk-engine.html
|
||||||
|
|||||||
@@ -4,6 +4,8 @@ Please refer to
|
|||||||
https://k2-fsa.github.io/sherpa/onnx/android/index.html
|
https://k2-fsa.github.io/sherpa/onnx/android/index.html
|
||||||
for usage.
|
for usage.
|
||||||
|
|
||||||
|
- [SherpaOnnxSpeakerDiarization](./SherpaOnnxSpeakerDiarization) It is for speaker diarization.
|
||||||
|
|
||||||
- [SherpaOnnx](./SherpaOnnx) It uses a streaming ASR model.
|
- [SherpaOnnx](./SherpaOnnx) It uses a streaming ASR model.
|
||||||
|
|
||||||
- [SherpaOnnx2Pass](./SherpaOnnx2Pass) It uses a streaming ASR model
|
- [SherpaOnnx2Pass](./SherpaOnnx2Pass) It uses a streaming ASR model
|
||||||
|
|||||||
15
android/SherpaOnnxSpeakerDiarization/.gitignore
vendored
Normal file
@@ -0,0 +1,15 @@
|
|||||||
|
*.iml
|
||||||
|
.gradle
|
||||||
|
/local.properties
|
||||||
|
/.idea/caches
|
||||||
|
/.idea/libraries
|
||||||
|
/.idea/modules.xml
|
||||||
|
/.idea/workspace.xml
|
||||||
|
/.idea/navEditor.xml
|
||||||
|
/.idea/assetWizardSettings.xml
|
||||||
|
.DS_Store
|
||||||
|
/build
|
||||||
|
/captures
|
||||||
|
.externalNativeBuild
|
||||||
|
.cxx
|
||||||
|
local.properties
|
||||||
1
android/SherpaOnnxSpeakerDiarization/app/.gitignore
vendored
Normal file
@@ -0,0 +1 @@
|
|||||||
|
/build
|
||||||
71
android/SherpaOnnxSpeakerDiarization/app/build.gradle.kts
Normal file
@@ -0,0 +1,71 @@
|
|||||||
|
// Gradle build script of the speaker diarization demo application module.
// Plugin and library coordinates are resolved through the `libs` version catalog.
plugins {
    alias(libs.plugins.android.application)
    alias(libs.plugins.jetbrains.kotlin.android)
}

android {
    namespace = "com.k2fsa.sherpa.onnx.speaker.diarization"
    compileSdk = 34

    defaultConfig {
        applicationId = "com.k2fsa.sherpa.onnx.speaker.diarization"
        minSdk = 21
        targetSdk = 34
        versionCode = 1
        versionName = "1.0"

        testInstrumentationRunner = "androidx.test.runner.AndroidJUnitRunner"
        vectorDrawables {
            useSupportLibrary = true
        }
    }

    buildTypes {
        release {
            // Code shrinking is switched off; the rule files are still registered.
            isMinifyEnabled = false
            proguardFiles(getDefaultProguardFile("proguard-android-optimize.txt"), "proguard-rules.pro")
        }
    }

    // Java and Kotlin both target JVM 1.8 bytecode.
    compileOptions {
        sourceCompatibility = JavaVersion.VERSION_1_8
        targetCompatibility = JavaVersion.VERSION_1_8
    }
    kotlinOptions {
        jvmTarget = "1.8"
    }

    // Jetpack Compose.
    buildFeatures {
        compose = true
    }
    composeOptions {
        kotlinCompilerExtensionVersion = "1.5.1"
    }

    packaging {
        resources {
            excludes += "/META-INF/{AL2.0,LGPL2.1}"
        }
    }
}

dependencies {
    // Runtime libraries
    implementation(libs.androidx.core.ktx)
    implementation(libs.androidx.lifecycle.runtime.ktx)
    implementation(libs.androidx.activity.compose)
    implementation(platform(libs.androidx.compose.bom))
    implementation(libs.androidx.ui)
    implementation(libs.androidx.ui.graphics)
    implementation(libs.androidx.ui.tooling.preview)
    implementation(libs.androidx.material3)
    implementation(libs.androidx.navigation.compose)
    implementation(libs.androidx.documentfile)

    // Local unit tests
    testImplementation(libs.junit)

    // Instrumented tests
    androidTestImplementation(libs.androidx.junit)
    androidTestImplementation(libs.androidx.espresso.core)
    androidTestImplementation(platform(libs.androidx.compose.bom))
    androidTestImplementation(libs.androidx.ui.test.junit4)

    // Debug-only tooling
    debugImplementation(libs.androidx.ui.tooling)
    debugImplementation(libs.androidx.ui.test.manifest)
}
|
||||||
21
android/SherpaOnnxSpeakerDiarization/app/proguard-rules.pro
vendored
Normal file
@@ -0,0 +1,21 @@
|
|||||||
|
# Add project specific ProGuard rules here.
|
||||||
|
# You can control the set of applied configuration files using the
|
||||||
|
# proguardFiles setting in build.gradle.
|
||||||
|
#
|
||||||
|
# For more details, see
|
||||||
|
# http://developer.android.com/guide/developing/tools/proguard.html
|
||||||
|
|
||||||
|
# If your project uses WebView with JS, uncomment the following
|
||||||
|
# and specify the fully qualified class name to the JavaScript interface
|
||||||
|
# class:
|
||||||
|
#-keepclassmembers class fqcn.of.javascript.interface.for.webview {
|
||||||
|
# public *;
|
||||||
|
#}
|
||||||
|
|
||||||
|
# Uncomment this to preserve the line number information for
|
||||||
|
# debugging stack traces.
|
||||||
|
#-keepattributes SourceFile,LineNumberTable
|
||||||
|
|
||||||
|
# If you keep the line number information, uncomment this to
|
||||||
|
# hide the original source file name.
|
||||||
|
#-renamesourcefileattribute SourceFile
|
||||||
@@ -0,0 +1,24 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization
|
||||||
|
|
||||||
|
import androidx.test.platform.app.InstrumentationRegistry
|
||||||
|
import androidx.test.ext.junit.runners.AndroidJUnit4
|
||||||
|
|
||||||
|
import org.junit.Test
|
||||||
|
import org.junit.runner.RunWith
|
||||||
|
|
||||||
|
import org.junit.Assert.*
|
||||||
|
|
||||||
|
/**
 * Instrumented test that executes on an Android device.
 *
 * See the [testing documentation](http://d.android.com/tools/testing).
 */
@RunWith(AndroidJUnit4::class)
class ExampleInstrumentedTest {
    /** Checks that the target context reports this application's package name. */
    @Test
    fun useAppContext() {
        val expectedPackage = "com.k2fsa.sherpa.onnx.speaker.diarization"

        // Context of the app under test.
        val targetContext = InstrumentationRegistry.getInstrumentation().targetContext

        assertEquals(expectedPackage, targetContext.packageName)
    }
}
|
||||||
@@ -0,0 +1,32 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?>
<manifest xmlns:android="http://schemas.android.com/apk/res/android"
    xmlns:tools="http://schemas.android.com/tools">

    <!-- Storage read permission, requested only up to SDK level 32. -->
    <uses-permission
        android:name="android.permission.READ_EXTERNAL_STORAGE"
        android:maxSdkVersion="32" />

    <application
        android:allowBackup="true"
        android:dataExtractionRules="@xml/data_extraction_rules"
        android:fullBackupContent="@xml/backup_rules"
        android:icon="@mipmap/ic_launcher"
        android:label="@string/app_name"
        android:roundIcon="@mipmap/ic_launcher_round"
        android:supportsRtl="true"
        android:theme="@style/Theme.SherpaOnnxSpeakerDiarization"
        tools:targetApi="31">

        <!-- Launcher activity of the application. -->
        <activity
            android:name=".MainActivity"
            android:exported="true"
            android:label="@string/app_name"
            android:theme="@style/Theme.SherpaOnnxSpeakerDiarization">
            <intent-filter>
                <action android:name="android.intent.action.MAIN" />

                <category android:name="android.intent.category.LAUNCHER" />
            </intent-filter>
        </activity>
    </application>

</manifest>
|
||||||
@@ -0,0 +1,13 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization
|
||||||
|
|
||||||
|
import androidx.compose.ui.graphics.vector.ImageVector
|
||||||
|
|
||||||
|
/**
 * One entry of the bottom navigation bar.
 *
 * @property title text shown for the entry
 * @property image icon shown for the entry; for available icons see
 *   https://www.composables.com/icons and
 *   https://developer.android.com/reference/kotlin/androidx/compose/material/icons/filled/package-summary
 * @property route navigation route opened when the entry is selected
 */
data class BarItem(
    val title: String,
    val image: ImageVector,
    val route: String,
)
|
||||||
@@ -0,0 +1,132 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization
|
||||||
|
|
||||||
|
import android.os.Bundle
|
||||||
|
import androidx.activity.ComponentActivity
|
||||||
|
import androidx.activity.compose.setContent
|
||||||
|
import androidx.activity.enableEdgeToEdge
|
||||||
|
import androidx.compose.foundation.layout.Column
|
||||||
|
import androidx.compose.foundation.layout.fillMaxSize
|
||||||
|
import androidx.compose.foundation.layout.padding
|
||||||
|
import androidx.compose.material3.CenterAlignedTopAppBar
|
||||||
|
import androidx.compose.material3.ExperimentalMaterial3Api
|
||||||
|
import androidx.compose.material3.Icon
|
||||||
|
import androidx.compose.material3.MaterialTheme
|
||||||
|
import androidx.compose.material3.NavigationBar
|
||||||
|
import androidx.compose.material3.NavigationBarItem
|
||||||
|
import androidx.compose.material3.Scaffold
|
||||||
|
import androidx.compose.material3.Surface
|
||||||
|
import androidx.compose.material3.Text
|
||||||
|
import androidx.compose.material3.TopAppBarDefaults
|
||||||
|
import androidx.compose.runtime.Composable
|
||||||
|
import androidx.compose.runtime.getValue
|
||||||
|
import androidx.compose.ui.Modifier
|
||||||
|
import androidx.compose.ui.text.font.FontWeight
|
||||||
|
import androidx.compose.ui.tooling.preview.Preview
|
||||||
|
import androidx.navigation.NavGraph.Companion.findStartDestination
|
||||||
|
import androidx.navigation.NavHostController
|
||||||
|
import androidx.navigation.compose.NavHost
|
||||||
|
import androidx.navigation.compose.composable
|
||||||
|
import androidx.navigation.compose.currentBackStackEntryAsState
|
||||||
|
import androidx.navigation.compose.rememberNavController
|
||||||
|
import com.k2fsa.sherpa.onnx.speaker.diarization.screens.HelpScreen
|
||||||
|
import com.k2fsa.sherpa.onnx.speaker.diarization.screens.HomeScreen
|
||||||
|
import com.k2fsa.sherpa.onnx.speaker.diarization.ui.theme.SherpaOnnxSpeakerDiarizationTheme
|
||||||
|
|
||||||
|
const val TAG = "sherpa-onnx-sd"
|
||||||
|
|
||||||
|
/**
 * Entry activity: installs the Compose UI and then initializes
 * [SpeakerDiarizationObject] with this activity's assets.
 */
class MainActivity : ComponentActivity() {
    override fun onCreate(savedInstanceState: Bundle?) {
        super.onCreate(savedInstanceState)
        enableEdgeToEdge()

        setContent {
            SherpaOnnxSpeakerDiarizationTheme {
                // Full-size surface painted with the theme's background color.
                Surface(
                    color = MaterialTheme.colorScheme.background,
                    modifier = Modifier.fillMaxSize(),
                    content = { MainScreen() },
                )
            }
        }

        // NOTE(review): presumably loads the diarization models from the APK
        // assets; the implementation is not part of this file.
        SpeakerDiarizationObject.initSpeakerDiarization(assets)
    }
}
|
||||||
|
|
||||||
|
/**
 * Root screen: a scaffold with a centered title bar, the navigation host as
 * content and the bottom navigation bar.
 *
 * @param modifier applied to the root [Scaffold] so that callers can size or
 *   decorate the whole screen
 */
@OptIn(ExperimentalMaterial3Api::class)
@Composable
fun MainScreen(modifier: Modifier = Modifier) {
    // A single controller is shared by the host and the bottom bar.
    val navController = rememberNavController()

    Scaffold(
        // Forward the caller's modifier; previously the parameter was ignored.
        modifier = modifier,
        topBar = {
            CenterAlignedTopAppBar(
                colors = TopAppBarDefaults.topAppBarColors(
                    containerColor = MaterialTheme.colorScheme.primaryContainer,
                    titleContentColor = MaterialTheme.colorScheme.primary,
                ),
                title = {
                    Text(
                        "Next-gen Kaldi: Speaker Diarization",
                        fontWeight = FontWeight.Bold,
                    )
                },
            )
        },
        content = { padding ->
            // Apply the scaffold's insets so the content is not drawn under the bars.
            Column(Modifier.padding(padding)) {
                NavigationHost(navController = navController)
            }
        },
        bottomBar = {
            BottomNavigationBar(navController = navController)
        },
    )
}
|
||||||
|
|
||||||
|
/**
 * Declares the navigation graph: the home route (start destination) shows
 * [HomeScreen] and the help route shows [HelpScreen].
 *
 * @param navController controller that drives this graph
 */
@Composable
fun NavigationHost(navController: NavHostController) {
    val startRoute = NavRoutes.Home.route

    NavHost(navController = navController, startDestination = startRoute) {
        composable(route = NavRoutes.Home.route) { HomeScreen() }
        composable(route = NavRoutes.Help.route) { HelpScreen() }
    }
}
|
||||||
|
|
||||||
|
/**
 * Bottom bar with one item per entry of [NavBarItems.BarItems]; the item whose
 * route equals the current destination's route is shown as selected.
 *
 * @param navController controller used to observe and change the destination
 */
@Composable
fun BottomNavigationBar(navController: NavHostController) {
    NavigationBar {
        val currentEntry by navController.currentBackStackEntryAsState()
        val activeRoute = currentEntry?.destination?.route

        for (item in NavBarItems.BarItems) {
            NavigationBarItem(
                selected = activeRoute == item.route,
                onClick = {
                    navController.navigate(item.route) {
                        // Pop back to the start destination, saving its state.
                        popUpTo(navController.graph.findStartDestination().id) {
                            saveState = true
                        }
                        launchSingleTop = true
                        restoreState = true
                    }
                },
                icon = { Icon(imageVector = item.image, contentDescription = item.title) },
                label = { Text(text = item.title) },
            )
        }
    }
}
|
||||||
|
|
||||||
|
/** Design-time preview of [MainScreen] inside the application theme. */
@Preview(showBackground = true)
@Composable
fun MainScreenPreview() {
    SherpaOnnxSpeakerDiarizationTheme(content = { MainScreen() })
}
|
||||||
@@ -0,0 +1,20 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization
|
||||||
|
|
||||||
|
import androidx.compose.material.icons.Icons
|
||||||
|
import androidx.compose.material.icons.filled.Home
|
||||||
|
import androidx.compose.material.icons.filled.Info
|
||||||
|
|
||||||
|
/**
 * Entries of the bottom navigation bar, in display order.
 *
 * Routes are taken from [NavRoutes] so that the bar and the navigation graph
 * cannot drift apart.
 */
object NavBarItems {
    val BarItems = listOf(
        BarItem(
            title = "Home",
            image = Icons.Filled.Home,
            route = NavRoutes.Home.route,
        ),
        BarItem(
            title = "Help",
            image = Icons.Filled.Info,
            route = NavRoutes.Help.route,
        ),
    )
}
|
||||||
@@ -0,0 +1,6 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization
|
||||||
|
|
||||||
|
/**
 * Closed set of navigation destinations of the application.
 *
 * @property route string that identifies the destination in the navigation graph
 */
sealed class NavRoutes(val route: String) {
    /** Destination identified by the route "home". */
    object Home : NavRoutes(route = "home")

    /** Destination identified by the route "help". */
    object Help : NavRoutes(route = "help")
}
|
||||||
@@ -0,0 +1 @@
|
|||||||
|
../../../../../../../../../../../../sherpa-onnx/kotlin-api/OfflineSpeakerDiarization.kt
|
||||||
@@ -0,0 +1,137 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization.screens
|
||||||
|
|
||||||
|
import android.content.Context
|
||||||
|
import android.media.AudioFormat
|
||||||
|
import android.media.MediaCodec
|
||||||
|
import android.media.MediaExtractor
|
||||||
|
import android.media.MediaFormat
|
||||||
|
import android.net.Uri
|
||||||
|
|
||||||
|
/**
 * Outcome of reading an audio file.
 *
 * A successful read carries [sampleRate] and [samples]; a failed read carries
 * only [msg].
 *
 * `equals` and `hashCode` are overridden because the ones generated for a data
 * class compare array properties by identity rather than by content.
 *
 * @property sampleRate sample rate of the decoded audio, or null on failure
 * @property samples decoded samples, or null on failure
 * @property msg description of the failure, or null on success
 */
data class WaveData(
    val sampleRate: Int? = null,
    val samples: FloatArray? = null,
    val msg: String? = null,
) {
    override fun equals(other: Any?): Boolean {
        if (this === other) return true
        if (other !is WaveData) return false
        return sampleRate == other.sampleRate &&
            samples.contentEquals(other.samples) &&
            msg == other.msg
    }

    override fun hashCode(): Int {
        var result = sampleRate ?: 0
        result = 31 * result + samples.contentHashCode()
        result = 31 * result + (msg?.hashCode() ?: 0)
        return result
    }
}
|
||||||
|
|
||||||
|
/**
 * Decodes the first audio track of [uri] into float samples.
 *
 * Only tracks whose format reports 16-bit PCM encoding are accepted; a track
 * without the PCM-encoding key is rejected as well.
 *
 * References
 *  - https://gist.github.com/a-m-s/1991ab18fbcb0fcc2cf9
 *  - https://github.com/taehwandev/MediaCodecExample/blob/master/app/src/main/java/tech/thdev/mediacodecexample/audio/AACAudioDecoderThread.kt
 *
 * @param context context used to resolve [uri]
 * @param uri location of the audio file
 * @return a [WaveData] with `sampleRate` and `samples` set on success, or with
 *   only `msg` set when the file has no audio track, is not 16-bit PCM, or
 *   yields no samples
 */
fun readUri(context: Context, uri: Uri): WaveData {
    val extractor = MediaExtractor()
    try {
        extractor.setDataSource(context, uri, null)

        for (i in 0 until extractor.trackCount) {
            val format = extractor.getTrackFormat(i)
            val mime = format.getString(MediaFormat.KEY_MIME)
            if (mime?.startsWith("audio/") != true) continue

            extractor.selectTrack(i)

            // The key is optional; a missing or mistyped value is treated as "not 16-bit".
            val encoding = try {
                format.getInteger(MediaFormat.KEY_PCM_ENCODING)
            } catch (_: Exception) {
                -1
            }
            if (encoding != AudioFormat.ENCODING_PCM_16BIT) {
                return WaveData(msg = "We support only 16-bit encoded wave files")
            }

            val sampleRate = format.getInteger(MediaFormat.KEY_SAMPLE_RATE)
            val samples = decodeAudioTrack(extractor, format, mime)
            return if (samples.isEmpty()) {
                WaveData(msg = "Failed to read selected file")
            } else {
                WaveData(sampleRate = sampleRate, samples = samples)
            }
        }

        return WaveData(msg = "not an audio file")
    } finally {
        // Runs on every exit path, including early returns and exceptions.
        extractor.release()
    }
}

/**
 * Pumps the selected track of [extractor] through a decoder for [mime] and
 * returns all decoded samples concatenated into one array.
 */
private fun decodeAudioTrack(
    extractor: MediaExtractor,
    format: MediaFormat,
    mime: String
): FloatArray {
    val timeoutUs = 10000L
    val decoder = MediaCodec.createDecoderByType(mime)
    try {
        decoder.configure(format, null, null, 0)
        decoder.start()

        val chunks = ArrayList<FloatArray>()
        val info = MediaCodec.BufferInfo()
        var inputDone = false

        while (true) {
            if (!inputDone) {
                val inIndex = decoder.dequeueInputBuffer(timeoutUs)
                // Index 0 is a valid buffer; only negative values mean "none available".
                if (inIndex >= 0) {
                    val inBuffer = checkNotNull(decoder.getInputBuffer(inIndex)) {
                        "MediaCodec returned no buffer for dequeued input index $inIndex"
                    }
                    val size = extractor.readSampleData(inBuffer, 0)
                    if (size < 0) {
                        decoder.queueInputBuffer(
                            inIndex, 0, 0, 0, MediaCodec.BUFFER_FLAG_END_OF_STREAM
                        )
                        inputDone = true
                    } else {
                        decoder.queueInputBuffer(inIndex, 0, size, extractor.sampleTime, 0)
                        extractor.advance()
                    }
                }
            }

            val outIndex = decoder.dequeueOutputBuffer(info, timeoutUs)
            // Negative values are status codes (try again, format changed, ...).
            if (outIndex < 0) continue

            if (info.size > 0) {
                decoder.getOutputBuffer(outIndex)?.let { outBuffer ->
                    // Valid data occupies [offset, offset + size) of the buffer.
                    outBuffer.position(info.offset)
                    outBuffer.limit(info.offset + info.size)
                    val bytes = ByteArray(info.size)
                    outBuffer.get(bytes)
                    chunks.add(pcm16LittleEndianToFloat(bytes))
                }
            }
            decoder.releaseOutputBuffer(outIndex, false)

            // Test the end-of-stream bit only; other flags must not stop decoding.
            if ((info.flags and MediaCodec.BUFFER_FLAG_END_OF_STREAM) != 0) break
        }

        decoder.stop()

        val merged = FloatArray(chunks.sumOf { it.size })
        var offset = 0
        for (chunk in chunks) {
            chunk.copyInto(merged, offset)
            offset += chunk.size
        }
        return merged
    } finally {
        decoder.release()
    }
}

/**
 * Converts little-endian signed 16-bit PCM bytes to floats by dividing each
 * sample by 32768. A trailing odd byte, if any, is ignored.
 *
 * NOTE(review): samples are converted in stream order with no channel
 * handling, so multi-channel input presumably stays interleaved - confirm
 * callers only pass mono audio.
 */
private fun pcm16LittleEndianToFloat(bytes: ByteArray): FloatArray =
    FloatArray(bytes.size / 2) { k ->
        // The low byte must be read as unsigned; only the high byte carries the sign.
        val low = bytes[2 * k].toInt() and 0xFF
        val high = bytes[2 * k + 1].toInt()
        ((high shl 8) or low) / 32768.0f
    }
|
||||||
@@ -0,0 +1,66 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization
|
||||||
|
|
||||||
|
import android.content.res.AssetManager
|
||||||
|
import android.util.Log
|
||||||
|
import com.k2fsa.sherpa.onnx.FastClusteringConfig
|
||||||
|
import com.k2fsa.sherpa.onnx.OfflineSpeakerDiarization
|
||||||
|
import com.k2fsa.sherpa.onnx.OfflineSpeakerDiarizationConfig
|
||||||
|
import com.k2fsa.sherpa.onnx.OfflineSpeakerSegmentationModelConfig
|
||||||
|
import com.k2fsa.sherpa.onnx.OfflineSpeakerSegmentationPyannoteModelConfig
|
||||||
|
import com.k2fsa.sherpa.onnx.SpeakerEmbeddingExtractorConfig
|
||||||
|
|
||||||
|
// Please download
|
||||||
|
// https://github.com/k2-fsa/sherpa-onnx/releases/download/speaker-segmentation-models/sherpa-onnx-pyannote-segmentation-3-0.tar.bz2
|
||||||
|
// then extract it, rename model.onnx to segmentation.onnx, and move
|
||||||
|
// segmentation.onnx to the assets folder
|
||||||
|
// File name of the segmentation model in the assets folder; passed to
// OfflineSpeakerSegmentationPyannoteModelConfig by SpeakerDiarizationObject.
val segmentationModel = "segmentation.onnx"
|
||||||
|
|
||||||
|
// please download it from
|
||||||
|
// https://github.com/k2-fsa/sherpa-onnx/releases/download/speaker-recongition-models/3dspeaker_speech_eres2net_base_sv_zh-cn_3dspeaker_16k.onnx
|
||||||
|
// and move it to the assets folder
|
||||||
|
// File name of the speaker embedding model in the assets folder; used as the
// `model` of SpeakerEmbeddingExtractorConfig by SpeakerDiarizationObject.
val embeddingModel = "3dspeaker_speech_eres2net_base_sv_zh-cn_3dspeaker_16k.onnx"
|
||||||
|
|
||||||
|
// in the end, your assets folder should look like below
|
||||||
|
/*
|
||||||
|
(py38) fangjuns-MacBook-Pro:assets fangjun$ pwd
|
||||||
|
/Users/fangjun/open-source/sherpa-onnx/android/SherpaOnnxSpeakerDiarization/app/src/main/assets
|
||||||
|
(py38) fangjuns-MacBook-Pro:assets fangjun$ ls -lh
|
||||||
|
total 89048
|
||||||
|
-rw-r--r-- 1 fangjun staff 38M Oct 12 20:28 3dspeaker_speech_eres2net_base_sv_zh-cn_3dspeaker_16k.onnx
|
||||||
|
-rw-r--r-- 1 fangjun staff 5.7M Oct 12 20:28 segmentation.onnx
|
||||||
|
*/
|
||||||
|
|
||||||
|
/**
 * Singleton that owns the [OfflineSpeakerDiarization] instance used by the app.
 *
 * Call [initSpeakerDiarization] once before reading [sd].
 */
object SpeakerDiarizationObject {
    // Backing storage; remains null until initSpeakerDiarization() has completed.
    var _sd: OfflineSpeakerDiarization? = null

    // Non-null accessor; throws NullPointerException when read before initialization.
    val sd: OfflineSpeakerDiarization
        get() = _sd!!

    /**
     * Builds the diarization engine on first call; later calls are no-ops.
     *
     * @param assetManager forwarded unchanged to [OfflineSpeakerDiarization]
     */
    fun initSpeakerDiarization(assetManager: AssetManager? = null) {
        synchronized(this) {
            if (_sd == null) {
                Log.i(TAG, "Initializing sherpa-onnx speaker diarization")

                val segmentationConfig = OfflineSpeakerSegmentationModelConfig(
                    pyannote = OfflineSpeakerSegmentationPyannoteModelConfig(segmentationModel),
                    debug = true,
                )
                val embeddingConfig = SpeakerEmbeddingExtractorConfig(
                    model = embeddingModel,
                    debug = true,
                    numThreads = 2,
                )
                val clusteringConfig = FastClusteringConfig(numClusters = -1, threshold = 0.5f)

                val diarizationConfig = OfflineSpeakerDiarizationConfig(
                    segmentation = segmentationConfig,
                    embedding = embeddingConfig,
                    clustering = clusteringConfig,
                    minDurationOn = 0.2f,
                    minDurationOff = 0.5f,
                )

                _sd = OfflineSpeakerDiarization(
                    assetManager = assetManager,
                    config = diarizationConfig,
                )
            }
        }
    }
}
|
||||||
@@ -0,0 +1 @@
|
|||||||
|
../../../../../../../../../../../../sherpa-onnx/kotlin-api/SpeakerEmbeddingExtractorConfig.kt
|
||||||
@@ -0,0 +1,38 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization.screens
|
||||||
|
|
||||||
|
import androidx.compose.foundation.layout.Box
|
||||||
|
import androidx.compose.foundation.layout.Column
|
||||||
|
import androidx.compose.foundation.layout.Spacer
|
||||||
|
import androidx.compose.foundation.layout.fillMaxSize
|
||||||
|
import androidx.compose.foundation.layout.height
|
||||||
|
import androidx.compose.foundation.layout.padding
|
||||||
|
import androidx.compose.material3.Text
|
||||||
|
import androidx.compose.runtime.Composable
|
||||||
|
import androidx.compose.ui.Modifier
|
||||||
|
import androidx.compose.ui.unit.dp
|
||||||
|
import androidx.compose.ui.unit.sp
|
||||||
|
|
||||||
|
/**
 * Static help page: usage notes, model credits, and a link to the project.
 */
@Composable
fun HelpScreen() {
    val usageText =
        "This app accepts only 16kHz 16-bit 1-channel *.wav files. " +
            "It has two arguments: Number of speakers and clustering threshold. " +
            "If you know the actual number of speakers in the file, please set it. " +
            "Otherwise, please set it to 0. In that case, you have to set the threshold. " +
            "A larger threshold leads to fewer segmented speakers."
    val creditsText =
        "The speaker segmentation model is from " +
            "pyannote-audio (https://huggingface.co/pyannote/segmentation-3.0), " +
            "whereas the embedding extractor model is from 3D-Speaker (https://github.com/modelscope/3D-Speaker)"

    // The same vertical gap separates every paragraph.
    val paragraphGap = Modifier.height(5.dp)

    Box(modifier = Modifier.fillMaxSize()) {
        Column(modifier = Modifier.padding(8.dp)) {
            Text(text = usageText)
            Spacer(modifier = paragraphGap)
            Text(text = creditsText)
            Spacer(modifier = paragraphGap)
            Text(text = "Please see http://github.com/k2-fsa/sherpa-onnx ")
            Spacer(modifier = paragraphGap)
            Text(text = "Everything is open-sourced!", fontSize = 20.sp)
        }
    }
}
|
||||||
@@ -0,0 +1,210 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization.screens
|
||||||
|
|
||||||
|
import android.util.Log
|
||||||
|
import androidx.activity.compose.rememberLauncherForActivityResult
|
||||||
|
import androidx.activity.result.contract.ActivityResultContracts
|
||||||
|
import androidx.compose.foundation.layout.Arrangement
|
||||||
|
import androidx.compose.foundation.layout.Column
|
||||||
|
import androidx.compose.foundation.layout.Row
|
||||||
|
import androidx.compose.foundation.layout.Spacer
|
||||||
|
import androidx.compose.foundation.layout.fillMaxWidth
|
||||||
|
import androidx.compose.foundation.layout.padding
|
||||||
|
import androidx.compose.foundation.layout.size
|
||||||
|
import androidx.compose.foundation.rememberScrollState
|
||||||
|
import androidx.compose.foundation.verticalScroll
|
||||||
|
import androidx.compose.material3.Button
|
||||||
|
import androidx.compose.material3.OutlinedTextField
|
||||||
|
import androidx.compose.material3.Text
|
||||||
|
import androidx.compose.runtime.Composable
|
||||||
|
import androidx.compose.runtime.getValue
|
||||||
|
import androidx.compose.runtime.mutableStateOf
|
||||||
|
import androidx.compose.runtime.remember
|
||||||
|
import androidx.compose.runtime.setValue
|
||||||
|
import androidx.compose.ui.Alignment
|
||||||
|
import androidx.compose.ui.Modifier
|
||||||
|
import androidx.compose.ui.platform.LocalClipboardManager
|
||||||
|
import androidx.compose.ui.platform.LocalContext
|
||||||
|
import androidx.compose.ui.text.AnnotatedString
|
||||||
|
import androidx.compose.ui.unit.dp
|
||||||
|
import androidx.compose.ui.unit.sp
|
||||||
|
import androidx.documentfile.provider.DocumentFile
|
||||||
|
import com.k2fsa.sherpa.onnx.speaker.diarization.SpeakerDiarizationObject
|
||||||
|
import com.k2fsa.sherpa.onnx.speaker.diarization.TAG
|
||||||
|
import kotlin.concurrent.thread
|
||||||
|
|
||||||
|
|
||||||
|
// Decoded audio of the most recently accepted file. Written by the file-picker
// callback in HomeScreen and read when the Start button is pressed. This is a
// plain file-level variable, not Compose state.
private var samples: FloatArray? = null
|
||||||
|
|
||||||
|
/**
 * Main screen: lets the user pick an audio file, set the number of speakers
 * and the clustering threshold, run speaker diarization on a background
 * thread, and copy the resulting segment list to the clipboard.
 *
 * NOTE(review): readUri is called directly inside the document-picker result
 * callback, so decoding appears to run on the thread that delivers the result
 * (presumably the UI thread) - consider moving it off-thread for large files.
 */
@Composable
fun HomeScreen() {
    val context = LocalContext.current
    val clipboardManager = LocalClipboardManager.current

    var filename by remember { mutableStateOf("") }
    var status by remember { mutableStateOf("") }
    var progress by remember { mutableStateOf("") }
    var done by remember { mutableStateOf(false) }
    var fileIsOk by remember { mutableStateOf(false) }
    var started by remember { mutableStateOf(false) }
    var numSpeakers by remember { mutableStateOf(0) }
    var threshold by remember { mutableStateOf(0.5f) }

    // Progress callback passed to processWithCallback: publishes the
    // percentage of processed chunks and always returns 0.
    val callback = here@{ numProcessedChunks: Int, numTotalChunks: Int, arg: Long ->
        val percent = 100.0 * numProcessedChunks / numTotalChunks
        progress = "%.2f%%".format(percent)
        Log.i(TAG, progress)
        return@here 0
    }

    val launcher =
        rememberLauncherForActivityResult(ActivityResultContracts.OpenDocument()) { uri ->
            if (uri != null) {
                filename = DocumentFile.fromSingleUri(context, uri)?.name ?: ""

                // A new selection invalidates any previous run.
                progress = ""
                done = false
                fileIsOk = false

                if (filename.isNotEmpty()) {
                    val data = readUri(context, uri)
                    Log.i(TAG, "sample rate: ${data.sampleRate}")
                    Log.i(TAG, "numSamples: ${data.samples?.size ?: 0}")

                    val audio = data.samples
                    when {
                        data.msg != null -> {
                            Log.i(TAG, "failed to read $filename")
                            status = data.msg
                        }

                        data.sampleRate != SpeakerDiarizationObject.sd.sampleRate() -> {
                            status =
                                "Expected sample rate: ${SpeakerDiarizationObject.sd.sampleRate()}. Given wave file with sample rate: ${data.sampleRate}"
                        }

                        // Defensive: no error message was reported but no samples either.
                        audio == null -> {
                            status = "Failed to read selected file"
                        }

                        else -> {
                            samples = audio
                            fileIsOk = true
                        }
                    }
                }
            }
        }

    Column(
        modifier = Modifier.padding(10.dp),
        verticalArrangement = Arrangement.Top,
    ) {
        Row(
            modifier = Modifier.fillMaxWidth(),
            horizontalArrangement = Arrangement.SpaceEvenly,
            verticalAlignment = Alignment.CenterVertically
        ) {
            Button(onClick = {
                launcher.launch(arrayOf("audio/*"))
            }) {
                Text("Select a .wav file")
            }

            Button(
                enabled = fileIsOk && !started,
                onClick = {
                    // Capture the audio before starting, so the worker keeps
                    // using this array even if another file is selected meanwhile.
                    val audio = checkNotNull(samples) {
                        "Start is enabled only after a file has been loaded"
                    }

                    Log.i(TAG, "started")
                    Log.i(TAG, "num samples: ${audio.size}")
                    started = true
                    progress = ""

                    val config = SpeakerDiarizationObject.sd.config
                    config.clustering.numClusters = numSpeakers
                    config.clustering.threshold = threshold
                    SpeakerDiarizationObject.sd.setConfig(config)

                    thread(true) {
                        done = false
                        status = "Started! Please wait"

                        val segments = SpeakerDiarizationObject.sd.processWithCallback(
                            audio,
                            callback = callback,
                        )

                        // Build the report once instead of appending to the
                        // observable state for every segment.
                        val report = buildString {
                            for (s in segments) {
                                val start = "%.2f".format(s.start)
                                val end = "%.2f".format(s.end)
                                val speaker = "speaker_%02d".format(s.speaker)
                                val line = "$start -- $end $speaker"
                                append(line).append('\n')
                                Log.i(TAG, line)
                            }
                        }

                        status = report
                        done = true
                        started = false

                        Log.i(TAG, status)
                    }
                },
            ) {
                Text("Start")
            }

            if (progress.isNotEmpty()) {
                Text(progress, fontSize = 25.sp)
            }
        }

        Row(
            modifier = Modifier.fillMaxWidth(),
            horizontalArrangement = Arrangement.SpaceEvenly,
            verticalAlignment = Alignment.CenterVertically
        ) {
            OutlinedTextField(
                value = numSpeakers.toString(),
                // Blank or non-numeric input falls back to 0.
                onValueChange = { numSpeakers = it.toIntOrNull() ?: 0 },
                label = {
                    Text("Number of Speakers")
                },
            )
        }

        Row(
            modifier = Modifier.fillMaxWidth(),
            horizontalArrangement = Arrangement.SpaceEvenly,
            verticalAlignment = Alignment.CenterVertically
        ) {
            OutlinedTextField(
                value = threshold.toString(),
                // Blank or non-numeric input falls back to the default 0.5.
                onValueChange = { threshold = it.toFloatOrNull() ?: 0.5f },
                label = {
                    Text("Clustering threshold")
                },
            )
        }

        if (filename.isNotEmpty()) {
            Text(text = "Selected $filename")
            Spacer(Modifier.size(20.dp))
        }

        if (done) {
            Button(onClick = {
                clipboardManager.setText(AnnotatedString(status))
                progress = "Copied!"
            }) {
                Text("Copy result")
            }
            Spacer(Modifier.size(20.dp))
        }

        if (status.isNotEmpty()) {
            Text(
                status,
                modifier = Modifier.verticalScroll(rememberScrollState()),
            )
        }
    }
}
|
||||||
@@ -0,0 +1,11 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization.ui.theme
|
||||||
|
|
||||||
|
import androidx.compose.ui.graphics.Color
|
||||||
|
|
||||||
|
// Colours used as primary / secondary / tertiary of the dark colour scheme.
val Purple80: Color = Color(0xFFD0BCFF)
val PurpleGrey80: Color = Color(0xFFCCC2DC)
val Pink80: Color = Color(0xFFEFB8C8)

// Colours used as primary / secondary / tertiary of the light colour scheme.
val Purple40: Color = Color(0xFF6650A4)
val PurpleGrey40: Color = Color(0xFF625B71)
val Pink40: Color = Color(0xFF7D5260)
|
||||||
@@ -0,0 +1,58 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization.ui.theme
|
||||||
|
|
||||||
|
import android.app.Activity
|
||||||
|
import android.os.Build
|
||||||
|
import androidx.compose.foundation.isSystemInDarkTheme
|
||||||
|
import androidx.compose.material3.MaterialTheme
|
||||||
|
import androidx.compose.material3.darkColorScheme
|
||||||
|
import androidx.compose.material3.dynamicDarkColorScheme
|
||||||
|
import androidx.compose.material3.dynamicLightColorScheme
|
||||||
|
import androidx.compose.material3.lightColorScheme
|
||||||
|
import androidx.compose.runtime.Composable
|
||||||
|
import androidx.compose.ui.platform.LocalContext
|
||||||
|
|
||||||
|
// Static dark palette, used when dynamic colour is not applied.
private val DarkColorScheme =
    darkColorScheme(primary = Purple80, secondary = PurpleGrey80, tertiary = Pink80)
|
||||||
|
|
||||||
|
// Static light palette, used when dynamic colour is not applied.
//
// Other default colours that can be overridden here:
//   background = Color(0xFFFFFBFE),
//   surface = Color(0xFFFFFBFE),
//   onPrimary = Color.White,
//   onSecondary = Color.White,
//   onTertiary = Color.White,
//   onBackground = Color(0xFF1C1B1F),
//   onSurface = Color(0xFF1C1B1F),
private val LightColorScheme =
    lightColorScheme(primary = Purple40, secondary = PurpleGrey40, tertiary = Pink40)
|
||||||
|
|
||||||
|
/**
 * App theme wrapper around [MaterialTheme].
 *
 * @param darkTheme whether to use a dark palette; defaults to the system setting
 * @param dynamicColor whether to use dynamic colour schemes; only honoured when
 *   the device runs Android S (API 31) or newer
 * @param content the composable hierarchy to theme
 */
@Composable
fun SherpaOnnxSpeakerDiarizationTheme(
    darkTheme: Boolean = isSystemInDarkTheme(),
    dynamicColor: Boolean = true,
    content: @Composable () -> Unit
) {
    val colorScheme =
        if (dynamicColor && Build.VERSION.SDK_INT >= Build.VERSION_CODES.S) {
            val context = LocalContext.current
            if (darkTheme) {
                dynamicDarkColorScheme(context)
            } else {
                dynamicLightColorScheme(context)
            }
        } else if (darkTheme) {
            DarkColorScheme
        } else {
            LightColorScheme
        }

    MaterialTheme(
        colorScheme = colorScheme,
        typography = Typography,
        content = content
    )
}
|
||||||
@@ -0,0 +1,34 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization.ui.theme
|
||||||
|
|
||||||
|
import androidx.compose.material3.Typography
|
||||||
|
import androidx.compose.ui.text.TextStyle
|
||||||
|
import androidx.compose.ui.text.font.FontFamily
|
||||||
|
import androidx.compose.ui.text.font.FontWeight
|
||||||
|
import androidx.compose.ui.unit.sp
|
||||||
|
|
||||||
|
// Material typography for the app. Only bodyLarge is customised.
//
// Other default text styles that can be overridden here:
//   titleLarge = TextStyle(
//       fontFamily = FontFamily.Default,
//       fontWeight = FontWeight.Normal,
//       fontSize = 22.sp,
//       lineHeight = 28.sp,
//       letterSpacing = 0.sp
//   ),
//   labelSmall = TextStyle(
//       fontFamily = FontFamily.Default,
//       fontWeight = FontWeight.Medium,
//       fontSize = 11.sp,
//       lineHeight = 16.sp,
//       letterSpacing = 0.5.sp
//   )
val Typography = Typography(
    bodyLarge = TextStyle(
        fontSize = 16.sp,
        lineHeight = 24.sp,
        letterSpacing = 0.5.sp,
        fontWeight = FontWeight.Normal,
        fontFamily = FontFamily.Default,
    )
)
|
||||||
@@ -0,0 +1,30 @@
|
|||||||
|
<vector xmlns:android="http://schemas.android.com/apk/res/android"
|
||||||
|
xmlns:aapt="http://schemas.android.com/aapt"
|
||||||
|
android:width="108dp"
|
||||||
|
android:height="108dp"
|
||||||
|
android:viewportWidth="108"
|
||||||
|
android:viewportHeight="108">
|
||||||
|
<path android:pathData="M31,63.928c0,0 6.4,-11 12.1,-13.1c7.2,-2.6 26,-1.4 26,-1.4l38.1,38.1L107,108.928l-32,-1L31,63.928z">
|
||||||
|
<aapt:attr name="android:fillColor">
|
||||||
|
<gradient
|
||||||
|
android:endX="85.84757"
|
||||||
|
android:endY="92.4963"
|
||||||
|
android:startX="42.9492"
|
||||||
|
android:startY="49.59793"
|
||||||
|
android:type="linear">
|
||||||
|
<item
|
||||||
|
android:color="#44000000"
|
||||||
|
android:offset="0.0" />
|
||||||
|
<item
|
||||||
|
android:color="#00000000"
|
||||||
|
android:offset="1.0" />
|
||||||
|
</gradient>
|
||||||
|
</aapt:attr>
|
||||||
|
</path>
|
||||||
|
<path
|
||||||
|
android:fillColor="#FFFFFF"
|
||||||
|
android:fillType="nonZero"
|
||||||
|
android:pathData="M65.3,45.828l3.8,-6.6c0.2,-0.4 0.1,-0.9 -0.3,-1.1c-0.4,-0.2 -0.9,-0.1 -1.1,0.3l-3.9,6.7c-6.3,-2.8 -13.4,-2.8 -19.7,0l-3.9,-6.7c-0.2,-0.4 -0.7,-0.5 -1.1,-0.3C38.8,38.328 38.7,38.828 38.9,39.228l3.8,6.6C36.2,49.428 31.7,56.028 31,63.928h46C76.3,56.028 71.8,49.428 65.3,45.828zM43.4,57.328c-0.8,0 -1.5,-0.5 -1.8,-1.2c-0.3,-0.7 -0.1,-1.5 0.4,-2.1c0.5,-0.5 1.4,-0.7 2.1,-0.4c0.7,0.3 1.2,1 1.2,1.8C45.3,56.528 44.5,57.328 43.4,57.328L43.4,57.328zM64.6,57.328c-0.8,0 -1.5,-0.5 -1.8,-1.2s-0.1,-1.5 0.4,-2.1c0.5,-0.5 1.4,-0.7 2.1,-0.4c0.7,0.3 1.2,1 1.2,1.8C66.5,56.528 65.6,57.328 64.6,57.328L64.6,57.328z"
|
||||||
|
android:strokeWidth="1"
|
||||||
|
android:strokeColor="#00000000" />
|
||||||
|
</vector>
|
||||||
@@ -0,0 +1,170 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?>
|
||||||
|
<vector xmlns:android="http://schemas.android.com/apk/res/android"
|
||||||
|
android:width="108dp"
|
||||||
|
android:height="108dp"
|
||||||
|
android:viewportWidth="108"
|
||||||
|
android:viewportHeight="108">
|
||||||
|
<path
|
||||||
|
android:fillColor="#3DDC84"
|
||||||
|
android:pathData="M0,0h108v108h-108z" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M9,0L9,108"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M19,0L19,108"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M29,0L29,108"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M39,0L39,108"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M49,0L49,108"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M59,0L59,108"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M69,0L69,108"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M79,0L79,108"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M89,0L89,108"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M99,0L99,108"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M0,9L108,9"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M0,19L108,19"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M0,29L108,29"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M0,39L108,39"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M0,49L108,49"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M0,59L108,59"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M0,69L108,69"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M0,79L108,79"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M0,89L108,89"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M0,99L108,99"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M19,29L89,29"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M19,39L89,39"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M19,49L89,49"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M19,59L89,59"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M19,69L89,69"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M19,79L89,79"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M29,19L29,89"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M39,19L39,89"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M49,19L49,89"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M59,19L59,89"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M69,19L69,89"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
<path
|
||||||
|
android:fillColor="#00000000"
|
||||||
|
android:pathData="M79,19L79,89"
|
||||||
|
android:strokeWidth="0.8"
|
||||||
|
android:strokeColor="#33FFFFFF" />
|
||||||
|
</vector>
|
||||||
@@ -0,0 +1,6 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?>
|
||||||
|
<adaptive-icon xmlns:android="http://schemas.android.com/apk/res/android">
|
||||||
|
<background android:drawable="@drawable/ic_launcher_background" />
|
||||||
|
<foreground android:drawable="@drawable/ic_launcher_foreground" />
|
||||||
|
<monochrome android:drawable="@drawable/ic_launcher_foreground" />
|
||||||
|
</adaptive-icon>
|
||||||
@@ -0,0 +1,6 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?>
|
||||||
|
<adaptive-icon xmlns:android="http://schemas.android.com/apk/res/android">
|
||||||
|
<background android:drawable="@drawable/ic_launcher_background" />
|
||||||
|
<foreground android:drawable="@drawable/ic_launcher_foreground" />
|
||||||
|
<monochrome android:drawable="@drawable/ic_launcher_foreground" />
|
||||||
|
</adaptive-icon>
|
||||||
|
After Width: | Height: | Size: 1.4 KiB |
|
After Width: | Height: | Size: 2.8 KiB |
|
After Width: | Height: | Size: 982 B |
|
After Width: | Height: | Size: 1.7 KiB |
|
After Width: | Height: | Size: 1.9 KiB |
|
After Width: | Height: | Size: 3.8 KiB |
|
After Width: | Height: | Size: 2.8 KiB |
|
After Width: | Height: | Size: 5.8 KiB |
|
After Width: | Height: | Size: 3.8 KiB |
|
After Width: | Height: | Size: 7.6 KiB |
@@ -0,0 +1,10 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?>
|
||||||
|
<resources>
|
||||||
|
<color name="purple_200">#FFBB86FC</color>
|
||||||
|
<color name="purple_500">#FF6200EE</color>
|
||||||
|
<color name="purple_700">#FF3700B3</color>
|
||||||
|
<color name="teal_200">#FF03DAC5</color>
|
||||||
|
<color name="teal_700">#FF018786</color>
|
||||||
|
<color name="black">#FF000000</color>
|
||||||
|
<color name="white">#FFFFFFFF</color>
|
||||||
|
</resources>
|
||||||
@@ -0,0 +1,3 @@
|
|||||||
|
<resources>
|
||||||
|
<string name="app_name">SherpaOnnxSpeakerDiarization</string>
|
||||||
|
</resources>
|
||||||
@@ -0,0 +1,5 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?>
|
||||||
|
<resources>
|
||||||
|
|
||||||
|
<style name="Theme.SherpaOnnxSpeakerDiarization" parent="android:Theme.Material.Light.NoActionBar" />
|
||||||
|
</resources>
|
||||||
@@ -0,0 +1,13 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?><!--
|
||||||
|
Sample backup rules file; uncomment and customize as necessary.
|
||||||
|
See https://developer.android.com/guide/topics/data/autobackup
|
||||||
|
for details.
|
||||||
|
Note: This file is ignored for devices older than API 31
|
||||||
|
See https://developer.android.com/about/versions/12/backup-restore
|
||||||
|
-->
|
||||||
|
<full-backup-content>
|
||||||
|
<!--
|
||||||
|
<include domain="sharedpref" path="."/>
|
||||||
|
<exclude domain="sharedpref" path="device.xml"/>
|
||||||
|
-->
|
||||||
|
</full-backup-content>
|
||||||
@@ -0,0 +1,19 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?><!--
|
||||||
|
Sample data extraction rules file; uncomment and customize as necessary.
|
||||||
|
See https://developer.android.com/about/versions/12/backup-restore#xml-changes
|
||||||
|
for details.
|
||||||
|
-->
|
||||||
|
<data-extraction-rules>
|
||||||
|
<cloud-backup>
|
||||||
|
<!-- TODO: Use <include> and <exclude> to control what is backed up.
|
||||||
|
<include .../>
|
||||||
|
<exclude .../>
|
||||||
|
-->
|
||||||
|
</cloud-backup>
|
||||||
|
<!--
|
||||||
|
<device-transfer>
|
||||||
|
<include .../>
|
||||||
|
<exclude .../>
|
||||||
|
</device-transfer>
|
||||||
|
-->
|
||||||
|
</data-extraction-rules>
|
||||||
@@ -0,0 +1,17 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx.speaker.diarization
|
||||||
|
|
||||||
|
import org.junit.Test
|
||||||
|
|
||||||
|
import org.junit.Assert.*
|
||||||
|
|
||||||
|
/**
 * Sample local unit test; it runs on the development machine (host) rather
 * than on a device.
 *
 * See [testing documentation](http://d.android.com/tools/testing).
 */
class ExampleUnitTest {
    // Sanity check that the test runner is wired up.
    @Test
    fun addition_isCorrect() {
        val sum = 2 + 2
        assertEquals(4, sum)
    }
}
|
||||||
5
android/SherpaOnnxSpeakerDiarization/build.gradle.kts
Normal file
@@ -0,0 +1,5 @@
|
|||||||
|
// Top-level build file where you can add configuration options common to all sub-projects/modules.
|
||||||
|
plugins {
|
||||||
|
alias(libs.plugins.android.application) apply false
|
||||||
|
alias(libs.plugins.jetbrains.kotlin.android) apply false
|
||||||
|
}
|
||||||
23
android/SherpaOnnxSpeakerDiarization/gradle.properties
Normal file
@@ -0,0 +1,23 @@
|
|||||||
|
# Project-wide Gradle settings.
|
||||||
|
# IDE (e.g. Android Studio) users:
|
||||||
|
# Gradle settings configured through the IDE *will override*
|
||||||
|
# any settings specified in this file.
|
||||||
|
# For more details on how to configure your build environment visit
|
||||||
|
# http://www.gradle.org/docs/current/userguide/build_environment.html
|
||||||
|
# Specifies the JVM arguments used for the daemon process.
|
||||||
|
# The setting is particularly useful for tweaking memory settings.
|
||||||
|
org.gradle.jvmargs=-Xmx2048m -Dfile.encoding=UTF-8
|
||||||
|
# When configured, Gradle will run in incubating parallel mode.
|
||||||
|
# This option should only be used with decoupled projects. For more details, visit
|
||||||
|
# https://developer.android.com/r/tools/gradle-multi-project-decoupled-projects
|
||||||
|
# org.gradle.parallel=true
|
||||||
|
# AndroidX package structure to make it clearer which packages are bundled with the
|
||||||
|
# Android operating system, and which are packaged with your app's APK
|
||||||
|
# https://developer.android.com/topic/libraries/support-library/androidx-rn
|
||||||
|
android.useAndroidX=true
|
||||||
|
# Kotlin code style for this project: "official" or "obsolete":
|
||||||
|
kotlin.code.style=official
|
||||||
|
# Enables namespacing of each library's R class so that its R class includes only the
|
||||||
|
# resources declared in the library itself and none from the library's dependencies,
|
||||||
|
# thereby reducing the size of the R class for that library
|
||||||
|
android.nonTransitiveRClass=true
|
||||||
@@ -0,0 +1,35 @@
|
|||||||
|
[versions]
|
||||||
|
agp = "8.4.0"
|
||||||
|
kotlin = "1.9.0"
|
||||||
|
coreKtx = "1.10.1"
|
||||||
|
junit = "4.13.2"
|
||||||
|
junitVersion = "1.1.5"
|
||||||
|
espressoCore = "3.5.1"
|
||||||
|
lifecycleRuntimeKtx = "2.6.1"
|
||||||
|
activityCompose = "1.8.0"
|
||||||
|
composeBom = "2023.08.00"
|
||||||
|
navigationCompose = "2.8.2"
|
||||||
|
documentfile = "1.0.1"
|
||||||
|
|
||||||
|
[libraries]
|
||||||
|
androidx-core-ktx = { group = "androidx.core", name = "core-ktx", version.ref = "coreKtx" }
|
||||||
|
junit = { group = "junit", name = "junit", version.ref = "junit" }
|
||||||
|
androidx-junit = { group = "androidx.test.ext", name = "junit", version.ref = "junitVersion" }
|
||||||
|
androidx-espresso-core = { group = "androidx.test.espresso", name = "espresso-core", version.ref = "espressoCore" }
|
||||||
|
androidx-lifecycle-runtime-ktx = { group = "androidx.lifecycle", name = "lifecycle-runtime-ktx", version.ref = "lifecycleRuntimeKtx" }
|
||||||
|
androidx-activity-compose = { group = "androidx.activity", name = "activity-compose", version.ref = "activityCompose" }
|
||||||
|
androidx-compose-bom = { group = "androidx.compose", name = "compose-bom", version.ref = "composeBom" }
|
||||||
|
androidx-ui = { group = "androidx.compose.ui", name = "ui" }
|
||||||
|
androidx-ui-graphics = { group = "androidx.compose.ui", name = "ui-graphics" }
|
||||||
|
androidx-ui-tooling = { group = "androidx.compose.ui", name = "ui-tooling" }
|
||||||
|
androidx-ui-tooling-preview = { group = "androidx.compose.ui", name = "ui-tooling-preview" }
|
||||||
|
androidx-ui-test-manifest = { group = "androidx.compose.ui", name = "ui-test-manifest" }
|
||||||
|
androidx-ui-test-junit4 = { group = "androidx.compose.ui", name = "ui-test-junit4" }
|
||||||
|
androidx-material3 = { group = "androidx.compose.material3", name = "material3" }
|
||||||
|
androidx-navigation-compose = { group = "androidx.navigation", name = "navigation-compose", version.ref = "navigationCompose" }
|
||||||
|
androidx-documentfile = { group = "androidx.documentfile", name = "documentfile", version.ref = "documentfile" }
|
||||||
|
|
||||||
|
[plugins]
|
||||||
|
android-application = { id = "com.android.application", version.ref = "agp" }
|
||||||
|
jetbrains-kotlin-android = { id = "org.jetbrains.kotlin.android", version.ref = "kotlin" }
|
||||||
|
|
||||||
BIN
android/SherpaOnnxSpeakerDiarization/gradle/wrapper/gradle-wrapper.jar
vendored
Normal file
6
android/SherpaOnnxSpeakerDiarization/gradle/wrapper/gradle-wrapper.properties
vendored
Normal file
@@ -0,0 +1,6 @@
|
|||||||
|
#Sat Oct 12 14:27:04 CST 2024
|
||||||
|
distributionBase=GRADLE_USER_HOME
|
||||||
|
distributionPath=wrapper/dists
|
||||||
|
distributionUrl=https\://services.gradle.org/distributions/gradle-8.6-bin.zip
|
||||||
|
zipStoreBase=GRADLE_USER_HOME
|
||||||
|
zipStorePath=wrapper/dists
|
||||||
185
android/SherpaOnnxSpeakerDiarization/gradlew
vendored
Executable file
@@ -0,0 +1,185 @@
|
|||||||
|
#!/usr/bin/env sh
|
||||||
|
|
||||||
|
#
|
||||||
|
# Copyright 2015 the original author or authors.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# https://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
#
|
||||||
|
|
||||||
|
##############################################################################
|
||||||
|
##
|
||||||
|
## Gradle start up script for UN*X
|
||||||
|
##
|
||||||
|
##############################################################################
|
||||||
|
|
||||||
|
# Attempt to set APP_HOME
|
||||||
|
# Resolve links: $0 may be a link
|
||||||
|
PRG="$0"
|
||||||
|
# Need this for relative symlinks.
|
||||||
|
while [ -h "$PRG" ] ; do
|
||||||
|
ls=`ls -ld "$PRG"`
|
||||||
|
link=`expr "$ls" : '.*-> \(.*\)$'`
|
||||||
|
if expr "$link" : '/.*' > /dev/null; then
|
||||||
|
PRG="$link"
|
||||||
|
else
|
||||||
|
PRG=`dirname "$PRG"`"/$link"
|
||||||
|
fi
|
||||||
|
done
|
||||||
|
SAVED="`pwd`"
|
||||||
|
cd "`dirname \"$PRG\"`/" >/dev/null
|
||||||
|
APP_HOME="`pwd -P`"
|
||||||
|
cd "$SAVED" >/dev/null
|
||||||
|
|
||||||
|
APP_NAME="Gradle"
|
||||||
|
APP_BASE_NAME=`basename "$0"`
|
||||||
|
|
||||||
|
# Add default JVM options here. You can also use JAVA_OPTS and GRADLE_OPTS to pass JVM options to this script.
|
||||||
|
DEFAULT_JVM_OPTS='"-Xmx64m" "-Xms64m"'
|
||||||
|
|
||||||
|
# Use the maximum available, or set MAX_FD != -1 to use that value.
|
||||||
|
MAX_FD="maximum"
|
||||||
|
|
||||||
|
warn () {
|
||||||
|
echo "$*"
|
||||||
|
}
|
||||||
|
|
||||||
|
die () {
|
||||||
|
echo
|
||||||
|
echo "$*"
|
||||||
|
echo
|
||||||
|
exit 1
|
||||||
|
}
|
||||||
|
|
||||||
|
# OS specific support (must be 'true' or 'false').
|
||||||
|
cygwin=false
|
||||||
|
msys=false
|
||||||
|
darwin=false
|
||||||
|
nonstop=false
|
||||||
|
case "`uname`" in
|
||||||
|
CYGWIN* )
|
||||||
|
cygwin=true
|
||||||
|
;;
|
||||||
|
Darwin* )
|
||||||
|
darwin=true
|
||||||
|
;;
|
||||||
|
MINGW* )
|
||||||
|
msys=true
|
||||||
|
;;
|
||||||
|
NONSTOP* )
|
||||||
|
nonstop=true
|
||||||
|
;;
|
||||||
|
esac
|
||||||
|
|
||||||
|
CLASSPATH=$APP_HOME/gradle/wrapper/gradle-wrapper.jar
|
||||||
|
|
||||||
|
|
||||||
|
# Determine the Java command to use to start the JVM.
|
||||||
|
if [ -n "$JAVA_HOME" ] ; then
|
||||||
|
if [ -x "$JAVA_HOME/jre/sh/java" ] ; then
|
||||||
|
# IBM's JDK on AIX uses strange locations for the executables
|
||||||
|
JAVACMD="$JAVA_HOME/jre/sh/java"
|
||||||
|
else
|
||||||
|
JAVACMD="$JAVA_HOME/bin/java"
|
||||||
|
fi
|
||||||
|
if [ ! -x "$JAVACMD" ] ; then
|
||||||
|
die "ERROR: JAVA_HOME is set to an invalid directory: $JAVA_HOME
|
||||||
|
|
||||||
|
Please set the JAVA_HOME variable in your environment to match the
|
||||||
|
location of your Java installation."
|
||||||
|
fi
|
||||||
|
else
|
||||||
|
JAVACMD="java"
|
||||||
|
which java >/dev/null 2>&1 || die "ERROR: JAVA_HOME is not set and no 'java' command could be found in your PATH.
|
||||||
|
|
||||||
|
Please set the JAVA_HOME variable in your environment to match the
|
||||||
|
location of your Java installation."
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Increase the maximum file descriptors if we can.
|
||||||
|
if [ "$cygwin" = "false" -a "$darwin" = "false" -a "$nonstop" = "false" ] ; then
|
||||||
|
MAX_FD_LIMIT=`ulimit -H -n`
|
||||||
|
if [ $? -eq 0 ] ; then
|
||||||
|
if [ "$MAX_FD" = "maximum" -o "$MAX_FD" = "max" ] ; then
|
||||||
|
MAX_FD="$MAX_FD_LIMIT"
|
||||||
|
fi
|
||||||
|
ulimit -n $MAX_FD
|
||||||
|
if [ $? -ne 0 ] ; then
|
||||||
|
warn "Could not set maximum file descriptor limit: $MAX_FD"
|
||||||
|
fi
|
||||||
|
else
|
||||||
|
warn "Could not query maximum file descriptor limit: $MAX_FD_LIMIT"
|
||||||
|
fi
|
||||||
|
fi
|
||||||
|
|
||||||
|
# For Darwin, add options to specify how the application appears in the dock
|
||||||
|
if $darwin; then
|
||||||
|
GRADLE_OPTS="$GRADLE_OPTS \"-Xdock:name=$APP_NAME\" \"-Xdock:icon=$APP_HOME/media/gradle.icns\""
|
||||||
|
fi
|
||||||
|
|
||||||
|
# For Cygwin or MSYS, switch paths to Windows format before running java
|
||||||
|
if [ "$cygwin" = "true" -o "$msys" = "true" ] ; then
|
||||||
|
APP_HOME=`cygpath --path --mixed "$APP_HOME"`
|
||||||
|
CLASSPATH=`cygpath --path --mixed "$CLASSPATH"`
|
||||||
|
|
||||||
|
JAVACMD=`cygpath --unix "$JAVACMD"`
|
||||||
|
|
||||||
|
# We build the pattern for arguments to be converted via cygpath
|
||||||
|
ROOTDIRSRAW=`find -L / -maxdepth 1 -mindepth 1 -type d 2>/dev/null`
|
||||||
|
SEP=""
|
||||||
|
for dir in $ROOTDIRSRAW ; do
|
||||||
|
ROOTDIRS="$ROOTDIRS$SEP$dir"
|
||||||
|
SEP="|"
|
||||||
|
done
|
||||||
|
OURCYGPATTERN="(^($ROOTDIRS))"
|
||||||
|
# Add a user-defined pattern to the cygpath arguments
|
||||||
|
if [ "$GRADLE_CYGPATTERN" != "" ] ; then
|
||||||
|
OURCYGPATTERN="$OURCYGPATTERN|($GRADLE_CYGPATTERN)"
|
||||||
|
fi
|
||||||
|
# Now convert the arguments - kludge to limit ourselves to /bin/sh
|
||||||
|
i=0
|
||||||
|
for arg in "$@" ; do
|
||||||
|
CHECK=`echo "$arg"|egrep -c "$OURCYGPATTERN" -`
|
||||||
|
CHECK2=`echo "$arg"|egrep -c "^-"` ### Determine if an option
|
||||||
|
|
||||||
|
if [ $CHECK -ne 0 ] && [ $CHECK2 -eq 0 ] ; then ### Added a condition
|
||||||
|
eval `echo args$i`=`cygpath --path --ignore --mixed "$arg"`
|
||||||
|
else
|
||||||
|
eval `echo args$i`="\"$arg\""
|
||||||
|
fi
|
||||||
|
i=`expr $i + 1`
|
||||||
|
done
|
||||||
|
case $i in
|
||||||
|
0) set -- ;;
|
||||||
|
1) set -- "$args0" ;;
|
||||||
|
2) set -- "$args0" "$args1" ;;
|
||||||
|
3) set -- "$args0" "$args1" "$args2" ;;
|
||||||
|
4) set -- "$args0" "$args1" "$args2" "$args3" ;;
|
||||||
|
5) set -- "$args0" "$args1" "$args2" "$args3" "$args4" ;;
|
||||||
|
6) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" ;;
|
||||||
|
7) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" ;;
|
||||||
|
8) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" "$args7" ;;
|
||||||
|
9) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" "$args7" "$args8" ;;
|
||||||
|
esac
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Escape application args
|
||||||
|
save () {
|
||||||
|
for i do printf %s\\n "$i" | sed "s/'/'\\\\''/g;1s/^/'/;\$s/\$/' \\\\/" ; done
|
||||||
|
echo " "
|
||||||
|
}
|
||||||
|
APP_ARGS=`save "$@"`
|
||||||
|
|
||||||
|
# Collect all arguments for the java command, following the shell quoting and substitution rules
|
||||||
|
eval set -- $DEFAULT_JVM_OPTS $JAVA_OPTS $GRADLE_OPTS "\"-Dorg.gradle.appname=$APP_BASE_NAME\"" -classpath "\"$CLASSPATH\"" org.gradle.wrapper.GradleWrapperMain "$APP_ARGS"
|
||||||
|
|
||||||
|
exec "$JAVACMD" "$@"
|
||||||
89
android/SherpaOnnxSpeakerDiarization/gradlew.bat
vendored
Normal file
@@ -0,0 +1,89 @@
|
|||||||
|
@rem
|
||||||
|
@rem Copyright 2015 the original author or authors.
|
||||||
|
@rem
|
||||||
|
@rem Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
@rem you may not use this file except in compliance with the License.
|
||||||
|
@rem You may obtain a copy of the License at
|
||||||
|
@rem
|
||||||
|
@rem https://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
@rem
|
||||||
|
@rem Unless required by applicable law or agreed to in writing, software
|
||||||
|
@rem distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
@rem WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
@rem See the License for the specific language governing permissions and
|
||||||
|
@rem limitations under the License.
|
||||||
|
@rem
|
||||||
|
|
||||||
|
@if "%DEBUG%" == "" @echo off
|
||||||
|
@rem ##########################################################################
|
||||||
|
@rem
|
||||||
|
@rem Gradle startup script for Windows
|
||||||
|
@rem
|
||||||
|
@rem ##########################################################################
|
||||||
|
|
||||||
|
@rem Set local scope for the variables with windows NT shell
|
||||||
|
if "%OS%"=="Windows_NT" setlocal
|
||||||
|
|
||||||
|
set DIRNAME=%~dp0
|
||||||
|
if "%DIRNAME%" == "" set DIRNAME=.
|
||||||
|
set APP_BASE_NAME=%~n0
|
||||||
|
set APP_HOME=%DIRNAME%
|
||||||
|
|
||||||
|
@rem Resolve any "." and ".." in APP_HOME to make it shorter.
|
||||||
|
for %%i in ("%APP_HOME%") do set APP_HOME=%%~fi
|
||||||
|
|
||||||
|
@rem Add default JVM options here. You can also use JAVA_OPTS and GRADLE_OPTS to pass JVM options to this script.
|
||||||
|
set DEFAULT_JVM_OPTS="-Xmx64m" "-Xms64m"
|
||||||
|
|
||||||
|
@rem Find java.exe
|
||||||
|
if defined JAVA_HOME goto findJavaFromJavaHome
|
||||||
|
|
||||||
|
set JAVA_EXE=java.exe
|
||||||
|
%JAVA_EXE% -version >NUL 2>&1
|
||||||
|
if "%ERRORLEVEL%" == "0" goto execute
|
||||||
|
|
||||||
|
echo.
|
||||||
|
echo ERROR: JAVA_HOME is not set and no 'java' command could be found in your PATH.
|
||||||
|
echo.
|
||||||
|
echo Please set the JAVA_HOME variable in your environment to match the
|
||||||
|
echo location of your Java installation.
|
||||||
|
|
||||||
|
goto fail
|
||||||
|
|
||||||
|
:findJavaFromJavaHome
|
||||||
|
set JAVA_HOME=%JAVA_HOME:"=%
|
||||||
|
set JAVA_EXE=%JAVA_HOME%/bin/java.exe
|
||||||
|
|
||||||
|
if exist "%JAVA_EXE%" goto execute
|
||||||
|
|
||||||
|
echo.
|
||||||
|
echo ERROR: JAVA_HOME is set to an invalid directory: %JAVA_HOME%
|
||||||
|
echo.
|
||||||
|
echo Please set the JAVA_HOME variable in your environment to match the
|
||||||
|
echo location of your Java installation.
|
||||||
|
|
||||||
|
goto fail
|
||||||
|
|
||||||
|
:execute
|
||||||
|
@rem Setup the command line
|
||||||
|
|
||||||
|
set CLASSPATH=%APP_HOME%\gradle\wrapper\gradle-wrapper.jar
|
||||||
|
|
||||||
|
|
||||||
|
@rem Execute Gradle
|
||||||
|
"%JAVA_EXE%" %DEFAULT_JVM_OPTS% %JAVA_OPTS% %GRADLE_OPTS% "-Dorg.gradle.appname=%APP_BASE_NAME%" -classpath "%CLASSPATH%" org.gradle.wrapper.GradleWrapperMain %*
|
||||||
|
|
||||||
|
:end
|
||||||
|
@rem End local scope for the variables with windows NT shell
|
||||||
|
if "%ERRORLEVEL%"=="0" goto mainEnd
|
||||||
|
|
||||||
|
:fail
|
||||||
|
rem Set variable GRADLE_EXIT_CONSOLE if you need the _script_ return code instead of
|
||||||
|
rem the _cmd.exe /c_ return code!
|
||||||
|
if not "" == "%GRADLE_EXIT_CONSOLE%" exit 1
|
||||||
|
exit /b 1
|
||||||
|
|
||||||
|
:mainEnd
|
||||||
|
if "%OS%"=="Windows_NT" endlocal
|
||||||
|
|
||||||
|
:omega
|
||||||
23
android/SherpaOnnxSpeakerDiarization/settings.gradle.kts
Normal file
@@ -0,0 +1,23 @@
|
|||||||
|
pluginManagement {
|
||||||
|
repositories {
|
||||||
|
google {
|
||||||
|
content {
|
||||||
|
includeGroupByRegex("com\\.android.*")
|
||||||
|
includeGroupByRegex("com\\.google.*")
|
||||||
|
includeGroupByRegex("androidx.*")
|
||||||
|
}
|
||||||
|
}
|
||||||
|
mavenCentral()
|
||||||
|
gradlePluginPortal()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
dependencyResolutionManagement {
|
||||||
|
repositoriesMode.set(RepositoriesMode.FAIL_ON_PROJECT_REPOS)
|
||||||
|
repositories {
|
||||||
|
google()
|
||||||
|
mavenCentral()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
rootProject.name = "SherpaOnnxSpeakerDiarization"
|
||||||
|
include(":app")
|
||||||
@@ -0,0 +1 @@
|
|||||||
|
../../../../../../../../../../../../sherpa-onnx/kotlin-api/SpeakerEmbeddingExtractorConfig.kt
|
||||||
1
kotlin-api-examples/SpeakerEmbeddingExtractorConfig.kt
Symbolic link
@@ -0,0 +1 @@
|
|||||||
|
../sherpa-onnx/kotlin-api/SpeakerEmbeddingExtractorConfig.kt
|
||||||
@@ -48,6 +48,7 @@ function testSpeakerEmbeddingExtractor() {
|
|||||||
test_speaker_id.kt \
|
test_speaker_id.kt \
|
||||||
OnlineStream.kt \
|
OnlineStream.kt \
|
||||||
Speaker.kt \
|
Speaker.kt \
|
||||||
|
SpeakerEmbeddingExtractorConfig.kt \
|
||||||
WaveReader.kt \
|
WaveReader.kt \
|
||||||
faked-asset-manager.kt \
|
faked-asset-manager.kt \
|
||||||
faked-log.kt
|
faked-log.kt
|
||||||
@@ -305,6 +306,7 @@ function testOfflineSpeakerDiarization() {
|
|||||||
test_offline_speaker_diarization.kt \
|
test_offline_speaker_diarization.kt \
|
||||||
OfflineSpeakerDiarization.kt \
|
OfflineSpeakerDiarization.kt \
|
||||||
Speaker.kt \
|
Speaker.kt \
|
||||||
|
SpeakerEmbeddingExtractorConfig.kt \
|
||||||
OnlineStream.kt \
|
OnlineStream.kt \
|
||||||
WaveReader.kt \
|
WaveReader.kt \
|
||||||
faked-asset-manager.kt \
|
faked-asset-manager.kt \
|
||||||
|
|||||||
73
scripts/apk/build-apk-speaker-diarization.sh
Executable file
@@ -0,0 +1,73 @@
|
|||||||
|
#!/usr/bin/env bash
|
||||||
|
#
|
||||||
|
# Please set the environment variable ANDROID_NDK
|
||||||
|
# before running this script
|
||||||
|
|
||||||
|
# Inside the $ANDROID_NDK directory, you can find a binary ndk-build
|
||||||
|
# and some other files like the file "build/cmake/android.toolchain.cmake"
|
||||||
|
|
||||||
|
set -ex
|
||||||
|
|
||||||
|
# Print a timestamped message tagged with the caller's file name, the line
# number of the call, and the name of the calling function.
# This function is from espnet.
#
# Arguments: the message; all arguments are expanded with "$*" and printed
# through `echo -e`, so backslash escapes inside the message are interpreted.
log() {
  local caller_file=${BASH_SOURCE[1]##*/}  # strip the directory part
  local caller_line=${BASH_LINENO[0]}
  local caller_func=${FUNCNAME[1]}
  echo -e "$(date '+%Y-%m-%d %H:%M:%S') (${caller_file}:${caller_line}:${caller_func}) $*"
}
|
||||||
|
|
||||||
|
SHERPA_ONNX_VERSION=$(grep "SHERPA_ONNX_VERSION" ./CMakeLists.txt | cut -d " " -f 2 | cut -d '"' -f 2)
|
||||||
|
|
||||||
|
# Announce what is being built. This script produces the speaker diarization
# demo APK, so the banner must say so (it previously said "identification").
log "Building speaker diarization APK for sherpa-onnx v${SHERPA_ONNX_VERSION}"
|
||||||
|
|
||||||
|
export SHERPA_ONNX_ENABLE_TTS=OFF
|
||||||
|
|
||||||
|
log "====================arm64-v8a================="
|
||||||
|
./build-android-arm64-v8a.sh
|
||||||
|
log "====================armv7-eabi================"
|
||||||
|
./build-android-armv7-eabi.sh
|
||||||
|
log "====================x86-64===================="
|
||||||
|
./build-android-x86-64.sh
|
||||||
|
log "====================x86===================="
|
||||||
|
./build-android-x86.sh
|
||||||
|
|
||||||
|
mkdir -p apks
|
||||||
|
|
||||||
|
pushd ./android/SherpaOnnxSpeakerDiarization/app/src/main/assets/
|
||||||
|
|
||||||
|
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/speaker-segmentation-models/sherpa-onnx-pyannote-segmentation-3-0.tar.bz2
|
||||||
|
tar xvf sherpa-onnx-pyannote-segmentation-3-0.tar.bz2
|
||||||
|
rm sherpa-onnx-pyannote-segmentation-3-0.tar.bz2
|
||||||
|
mv sherpa-onnx-pyannote-segmentation-3-0/model.onnx segmentation.onnx
|
||||||
|
rm -rf sherpa-onnx-pyannote-segmentation-3-0
|
||||||
|
|
||||||
|
curl -SL -O https://github.com/k2-fsa/sherpa-onnx/releases/download/speaker-recongition-models/3dspeaker_speech_eres2net_base_sv_zh-cn_3dspeaker_16k.onnx
|
||||||
|
|
||||||
|
echo "pwd: $PWD"
|
||||||
|
ls -lh
|
||||||
|
|
||||||
|
popd
|
||||||
|
|
||||||
|
# Build one debug APK per Android ABI: copy that ABI's prebuilt shared
# libraries into the app's jniLibs directory, run the Gradle build, move the
# resulting APK into ./apks under a versioned name, then delete the copied
# libraries again (presumably so each APK bundles only its own ABI's libs).
for arch in arm64-v8a armeabi-v7a x86_64 x86; do
  log "------------------------------------------------------------"
  log "build speaker diarization apk for $arch"
  log "------------------------------------------------------------"

  # Two native build directories are spelled differently from the ABI name.
  case $arch in
    armeabi-v7a) src_arch=armv7-eabi ;;
    x86_64) src_arch=x86-64 ;;
    *) src_arch=$arch ;;
  esac

  native_libs=./build-android-$src_arch/install/lib
  jni_libs=./android/SherpaOnnxSpeakerDiarization/app/src/main/jniLibs/$arch

  ls -lh $native_libs/*.so

  cp -v $native_libs/*.so $jni_libs/

  pushd ./android/SherpaOnnxSpeakerDiarization
  ./gradlew build
  popd

  apk_name=sherpa-onnx-${SHERPA_ONNX_VERSION}-$arch-speaker-diarization-pyannote_audio-3dspeaker.apk
  mv android/SherpaOnnxSpeakerDiarization/app/build/outputs/apk/debug/app-debug.apk ./apks/$apk_name
  ls -lh apks
  rm -v $jni_libs/*.so
done
|
||||||
|
|
||||||
|
ls -lh apks
|
||||||
@@ -34,7 +34,7 @@ data class OfflineSpeakerDiarizationSegment(
|
|||||||
|
|
||||||
class OfflineSpeakerDiarization(
|
class OfflineSpeakerDiarization(
|
||||||
assetManager: AssetManager? = null,
|
assetManager: AssetManager? = null,
|
||||||
config: OfflineSpeakerDiarizationConfig,
|
val config: OfflineSpeakerDiarizationConfig,
|
||||||
) {
|
) {
|
||||||
private var ptr: Long
|
private var ptr: Long
|
||||||
|
|
||||||
@@ -84,14 +84,17 @@ class OfflineSpeakerDiarization(
|
|||||||
|
|
||||||
private external fun getSampleRate(ptr: Long): Int
|
private external fun getSampleRate(ptr: Long): Int
|
||||||
|
|
||||||
private external fun process(ptr: Long, samples: FloatArray): Array<OfflineSpeakerDiarizationSegment>
|
private external fun process(
|
||||||
|
ptr: Long,
|
||||||
|
samples: FloatArray
|
||||||
|
): Array<OfflineSpeakerDiarizationSegment>
|
||||||
|
|
||||||
private external fun processWithCallback(
|
private external fun processWithCallback(
|
||||||
ptr: Long,
|
ptr: Long,
|
||||||
samples: FloatArray,
|
samples: FloatArray,
|
||||||
callback: (numProcessedChunks: Int, numTotalChunks: Int, arg: Long) -> Int,
|
callback: (numProcessedChunks: Int, numTotalChunks: Int, arg: Long) -> Int,
|
||||||
arg: Long,
|
arg: Long,
|
||||||
): Array<OfflineSpeakerDiarizationSegment>
|
): Array<OfflineSpeakerDiarizationSegment>
|
||||||
|
|
||||||
companion object {
|
companion object {
|
||||||
init {
|
init {
|
||||||
|
|||||||
@@ -3,13 +3,6 @@ package com.k2fsa.sherpa.onnx
|
|||||||
import android.content.res.AssetManager
|
import android.content.res.AssetManager
|
||||||
import android.util.Log
|
import android.util.Log
|
||||||
|
|
||||||
data class SpeakerEmbeddingExtractorConfig(
|
|
||||||
val model: String,
|
|
||||||
var numThreads: Int = 1,
|
|
||||||
var debug: Boolean = false,
|
|
||||||
var provider: String = "cpu",
|
|
||||||
)
|
|
||||||
|
|
||||||
class SpeakerEmbeddingExtractor(
|
class SpeakerEmbeddingExtractor(
|
||||||
assetManager: AssetManager? = null,
|
assetManager: AssetManager? = null,
|
||||||
config: SpeakerEmbeddingExtractorConfig,
|
config: SpeakerEmbeddingExtractorConfig,
|
||||||
|
|||||||
@@ -0,0 +1,8 @@
|
|||||||
|
package com.k2fsa.sherpa.onnx
|
||||||
|
|
||||||
|
/**
 * Configuration values for a speaker embedding extractor.
 *
 * @property model The model to use, given as a string — presumably a path or
 *   asset name of the model file; confirm against callers.
 * @property numThreads Thread-count setting; defaults to `1`.
 * @property debug Debug flag; defaults to `false`.
 * @property provider Provider name; defaults to `"cpu"` — presumably the
 *   execution backend, confirm against the native side.
 */
data class SpeakerEmbeddingExtractorConfig(
    val model: String,
    var numThreads: Int = 1,
    var debug: Boolean = false,
    var provider: String = "cpu",
)
|
||||||