// sherpa-onnx/csrc/offline-ctc-decoder.h // // Copyright (c) 2023 Xiaomi Corporation #ifndef SHERPA_ONNX_CSRC_OFFLINE_CTC_DECODER_H_ #define SHERPA_ONNX_CSRC_OFFLINE_CTC_DECODER_H_ #include #include "onnxruntime_cxx_api.h" // NOLINT namespace sherpa_onnx { struct OfflineCtcDecoderResult { /// The decoded token IDs std::vector tokens; /// timestamps[i] contains the output frame index where tokens[i] is decoded. /// Note: The index is after subsampling std::vector timestamps; }; class OfflineCtcDecoder { public: virtual ~OfflineCtcDecoder() = default; /** Run CTC decoding given the output from the encoder model. * * @param log_probs A 3-D tensor of shape (N, T, vocab_size) containing * lob_probs. * @param log_probs_length A 1-D tensor of shape (N,) containing number * of valid frames in log_probs before padding. * * @return Return a vector of size `N` containing the decoded results. */ virtual std::vector Decode( Ort::Value log_probs, Ort::Value log_probs_length) = 0; }; } // namespace sherpa_onnx #endif // SHERPA_ONNX_CSRC_OFFLINE_CTC_DECODER_H_