Support passing TTS callback in Swift API (#1218)
This commit is contained in:
@@ -757,6 +757,14 @@ class SherpaOnnxGeneratedAudioWrapper {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Optional C function pointer used as the TTS generation callback that also
/// receives a caller-supplied context pointer.
///
/// Parameters of the callback, in order:
///   1. `UnsafePointer<Float>?`     - `const float* samples`
///   2. `Int32`                     - `int32_t n`
///   3. `UnsafeMutableRawPointer?`  - `void *arg`
///
/// The callback returns an `Int32`.
typealias TtsCallbackWithArg =
  (@convention(c) (UnsafePointer<Float>?, Int32, UnsafeMutableRawPointer?) -> Int32)?
|
||||||
|
|
||||||
class SherpaOnnxOfflineTtsWrapper {
|
class SherpaOnnxOfflineTtsWrapper {
|
||||||
/// A pointer to the underlying counterpart in C
|
/// A pointer to the underlying counterpart in C
|
||||||
let tts: OpaquePointer!
|
let tts: OpaquePointer!
|
||||||
@@ -780,6 +788,17 @@ class SherpaOnnxOfflineTtsWrapper {
|
|||||||
|
|
||||||
return SherpaOnnxGeneratedAudioWrapper(audio: audio)
|
return SherpaOnnxGeneratedAudioWrapper(audio: audio)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Generates audio for `text` by calling
/// `SherpaOnnxOfflineTtsGenerateWithCallbackWithArg` and wraps the result.
///
/// - Parameters:
///   - text: The text handed to the underlying C API (converted via `toCPointer`).
///   - callback: C callback forwarded unchanged to the C API.
///   - arg: Opaque pointer forwarded unchanged to the C API
///     (presumably passed back as the callback's `arg` - confirm against the C header).
///   - sid: Converted to `Int32` and forwarded (presumably the speaker ID - confirm).
///   - speed: Forwarded unchanged to the C API.
/// - Returns: A `SherpaOnnxGeneratedAudioWrapper` built from the pointer the C API returns.
func generateWithCallbackWithArg(
  text: String, callback: TtsCallbackWithArg, arg: UnsafeMutableRawPointer, sid: Int = 0,
  speed: Float = 1.0
) -> SherpaOnnxGeneratedAudioWrapper {
  let speakerIndex = Int32(sid)
  let generated: UnsafePointer<SherpaOnnxGeneratedAudio>? =
    SherpaOnnxOfflineTtsGenerateWithCallbackWithArg(
      tts, toCPointer(text), speakerIndex, speed, callback, arg)
  return SherpaOnnxGeneratedAudioWrapper(audio: generated)
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// spoken language identification
|
// spoken language identification
|
||||||
|
|||||||
@@ -1,3 +1,9 @@
|
|||||||
|
/// Minimal receiver object used by the example: it is handed to the TTS
/// callback through an opaque pointer and gets each batch of samples.
class MyClass {
  /// Reports how many samples were received by printing a line to stdout.
  ///
  /// - Parameter samples: The samples delivered for this invocation.
  func playSamples(samples: [Float]) {
    let message = "Play \(samples.count) samples"
    print(message)
  }
}
|
||||||
|
|
||||||
func run() {
|
func run() {
|
||||||
let model = "./vits-piper-en_US-amy-low/en_US-amy-low.onnx"
|
let model = "./vits-piper-en_US-amy-low/en_US-amy-low.onnx"
|
||||||
let tokens = "./vits-piper-en_US-amy-low/tokens.txt"
|
let tokens = "./vits-piper-en_US-amy-low/tokens.txt"
|
||||||
@@ -11,6 +17,27 @@ func run() {
|
|||||||
let modelConfig = sherpaOnnxOfflineTtsModelConfig(vits: vits)
|
let modelConfig = sherpaOnnxOfflineTtsModelConfig(vits: vits)
|
||||||
var ttsConfig = sherpaOnnxOfflineTtsConfig(model: modelConfig)
|
var ttsConfig = sherpaOnnxOfflineTtsConfig(model: modelConfig)
|
||||||
|
|
||||||
|
let myClass = MyClass()
|
||||||
|
|
||||||
|
// We use Unretained here, so myClass must be kept alive for as long as the callback may be invoked
|
||||||
|
//
|
||||||
|
// See also
|
||||||
|
// https://medium.com/codex/swift-c-callback-interoperability-6d57da6c8ee6
|
||||||
|
let arg = Unmanaged<MyClass>.passUnretained(myClass).toOpaque()
|
||||||
|
|
||||||
|
// C-compatible callback handed to the TTS engine. Because it is converted to
// a @convention(c) function pointer it cannot capture Swift context, so the
// MyClass receiver is recovered from the opaque `arg` pointer instead.
//
//   samples - pointer to the generated samples (may be nil)
//   n       - number of samples available at `samples`
//   arg     - opaque pointer created with Unmanaged<MyClass>.passUnretained
//
// Returns 1 to continue generating.
let callback: TtsCallbackWithArg = { samples, n, arg in
  // Without the context pointer there is no receiver to deliver audio to.
  // NOTE(review): 0 is assumed to tell the engine to stop generating -
  // confirm against the C API header.
  guard let arg = arg else {
    return 0
  }

  // Unretained: the caller is responsible for keeping the object alive.
  let o = Unmanaged<MyClass>.fromOpaque(arg).takeUnretainedValue()

  // Copy the samples into a Swift array in one bulk operation. A nil pointer
  // or a non-positive count yields an empty array instead of trapping.
  let savedSamples: [Float]
  if let samples = samples, n > 0 {
    savedSamples = Array(UnsafeBufferPointer(start: samples, count: Int(n)))
  } else {
    savedSamples = []
  }

  o.playSamples(samples: savedSamples)

  // return 1 so that it continues generating
  return 1
}
|
||||||
|
|
||||||
let tts = SherpaOnnxOfflineTtsWrapper(config: &ttsConfig)
|
let tts = SherpaOnnxOfflineTtsWrapper(config: &ttsConfig)
|
||||||
|
|
||||||
let text =
|
let text =
|
||||||
@@ -18,11 +45,15 @@ func run() {
|
|||||||
let sid = 99
|
let sid = 99
|
||||||
let speed: Float = 1.0
|
let speed: Float = 1.0
|
||||||
|
|
||||||
let audio = tts.generate(text: text, sid: sid, speed: speed)
|
let audio = tts.generateWithCallbackWithArg(
|
||||||
|
text: text, callback: callback, arg: arg, sid: sid, speed: speed)
|
||||||
let filename = "test.wav"
|
let filename = "test.wav"
|
||||||
audio.save(filename: filename)
|
let ok = audio.save(filename: filename)
|
||||||
|
if ok == 1 {
|
||||||
print("\nSaved to:\n\(filename)")
|
print("\nSaved to:\(filename)")
|
||||||
|
} else {
|
||||||
|
print("Failed to save to \(filename)")
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@main
|
@main
|
||||||
|
|||||||
Reference in New Issue
Block a user