// sherpa-onnx/csrc/offline-fire-red-asr-model.h // // Copyright (c) 2025 Xiaomi Corporation #ifndef SHERPA_ONNX_CSRC_OFFLINE_FIRE_RED_ASR_MODEL_H_ #define SHERPA_ONNX_CSRC_OFFLINE_FIRE_RED_ASR_MODEL_H_ #include #include #include #include #include #include #include "onnxruntime_cxx_api.h" // NOLINT #include "sherpa-onnx/csrc/offline-fire-red-asr-model-meta-data.h" #include "sherpa-onnx/csrc/offline-model-config.h" namespace sherpa_onnx { class OfflineFireRedAsrModel { public: explicit OfflineFireRedAsrModel(const OfflineModelConfig &config); template OfflineFireRedAsrModel(Manager *mgr, const OfflineModelConfig &config); ~OfflineFireRedAsrModel(); /** Run the encoder model. * * @param features A tensor of shape (N, T, C). * @param features_len A tensor of shape (N,) with dtype int64. * * @return Return a pair containing: * - n_layer_cross_k: A 4-D tensor of shape * (num_decoder_layers, N, T, d_model) * - n_layer_cross_v: A 4-D tensor of shape * (num_decoder_layers, N, T, d_model) */ std::pair ForwardEncoder( Ort::Value features, Ort::Value features_length) const; /** Run the decoder model. * * @param tokens A int64 tensor of shape (N, num_words) * @param n_layer_self_k_cache A 5-D tensor of shape * (num_decoder_layers, N, max_len, num_head, head_dim). * @param n_layer_self_v_cache A 5-D tensor of shape * (num_decoder_layers, N, max_len, num_head, head_dim). * @param n_layer_cross_k A 5-D tensor of shape * (num_decoder_layers, N, T, d_model). * @param n_layer_cross_v A 5-D tensor of shape * (num_decoder_layers, N, T, d_model). * @param offset A int64 tensor of shape (N,) * * @return Return a tuple containing 6 tensors: * * - logits A 3-D tensor of shape (N, num_words, vocab_size) * - out_n_layer_self_k_cache Same shape as n_layer_self_k_cache * - out_n_layer_self_v_cache Same shape as n_layer_self_v_cache * - out_n_layer_cross_k Same as n_layer_cross_k * - out_n_layer_cross_v Same as n_layer_cross_v * - out_offset Same as offset */ std::tuple ForwardDecoder(Ort::Value tokens, Ort::Value n_layer_self_k_cache, Ort::Value n_layer_self_v_cache, Ort::Value n_layer_cross_k, Ort::Value n_layer_cross_v, Ort::Value offset) const; /** Return the initial self kv cache in a pair * - n_layer_self_k_cache A 5-D tensor of shape * (num_decoder_layers, N, max_len, num_head, head_dim). * - n_layer_self_v_cache A 5-D tensor of shape * (num_decoder_layers, N, max_len, num_head, head_dim). */ std::pair GetInitialSelfKVCache() const; const OfflineFireRedAsrModelMetaData &GetModelMetadata() const; /** Return an allocator for allocating memory */ OrtAllocator *Allocator() const; private: class Impl; std::unique_ptr impl_; }; } // namespace sherpa_onnx #endif // SHERPA_ONNX_CSRC_OFFLINE_FIRE_RED_ASR_MODEL_H_