// wasm/sherpa-onnx-wasm-main-tts.cc // // Copyright (c) 2024 Xiaomi Corporation #include #include #include #include "sherpa-onnx/c-api/c-api.h" // see also // https://emscripten.org/docs/porting/connecting_cpp_and_javascript/Interacting-with-code.html extern "C" { static_assert(sizeof(SherpaOnnxOfflineTtsVitsModelConfig) == 8 * 4, ""); static_assert(sizeof(SherpaOnnxOfflineTtsMatchaModelConfig) == 8 * 4, ""); static_assert(sizeof(SherpaOnnxOfflineTtsKokoroModelConfig) == 5 * 4, ""); static_assert(sizeof(SherpaOnnxOfflineTtsModelConfig) == sizeof(SherpaOnnxOfflineTtsVitsModelConfig) + sizeof(SherpaOnnxOfflineTtsMatchaModelConfig) + sizeof(SherpaOnnxOfflineTtsKokoroModelConfig) + 3 * 4, ""); static_assert(sizeof(SherpaOnnxOfflineTtsConfig) == sizeof(SherpaOnnxOfflineTtsModelConfig) + 3 * 4, ""); void MyPrint(SherpaOnnxOfflineTtsConfig *tts_config) { auto tts_model_config = &tts_config->model; auto vits_model_config = &tts_model_config->vits; auto matcha_model_config = &tts_model_config->matcha; auto kokoro = &tts_model_config->kokoro; fprintf(stdout, "----------vits model config----------\n"); fprintf(stdout, "model: %s\n", vits_model_config->model); fprintf(stdout, "lexicon: %s\n", vits_model_config->lexicon); fprintf(stdout, "tokens: %s\n", vits_model_config->tokens); fprintf(stdout, "data_dir: %s\n", vits_model_config->data_dir); fprintf(stdout, "noise scale: %.3f\n", vits_model_config->noise_scale); fprintf(stdout, "noise scale w: %.3f\n", vits_model_config->noise_scale_w); fprintf(stdout, "length scale: %.3f\n", vits_model_config->length_scale); fprintf(stdout, "dict_dir: %s\n", vits_model_config->dict_dir); fprintf(stdout, "----------matcha model config----------\n"); fprintf(stdout, "acoustic_model: %s\n", matcha_model_config->acoustic_model); fprintf(stdout, "vocoder: %s\n", matcha_model_config->vocoder); fprintf(stdout, "lexicon: %s\n", matcha_model_config->lexicon); fprintf(stdout, "tokens: %s\n", matcha_model_config->tokens); fprintf(stdout, "data_dir: %s\n", matcha_model_config->data_dir); fprintf(stdout, "noise scale: %.3f\n", matcha_model_config->noise_scale); fprintf(stdout, "length scale: %.3f\n", matcha_model_config->length_scale); fprintf(stdout, "dict_dir: %s\n", matcha_model_config->dict_dir); fprintf(stdout, "----------kokoro model config----------\n"); fprintf(stdout, "model: %s\n", kokoro->model); fprintf(stdout, "voices: %s\n", kokoro->voices); fprintf(stdout, "tokens: %s\n", kokoro->tokens); fprintf(stdout, "data_dir: %s\n", kokoro->data_dir); fprintf(stdout, "length scale: %.3f\n", kokoro->length_scale); fprintf(stdout, "----------tts model config----------\n"); fprintf(stdout, "num threads: %d\n", tts_model_config->num_threads); fprintf(stdout, "debug: %d\n", tts_model_config->debug); fprintf(stdout, "provider: %s\n", tts_model_config->provider); fprintf(stdout, "----------tts config----------\n"); fprintf(stdout, "rule_fsts: %s\n", tts_config->rule_fsts); fprintf(stdout, "rule_fars: %s\n", tts_config->rule_fars); fprintf(stdout, "max num sentences: %d\n", tts_config->max_num_sentences); } void CopyHeap(const char *src, int32_t num_bytes, char *dst) { std::copy(src, src + num_bytes, dst); } }