Re-implement LM rescore for online transducer (#1231)

Co-authored-by: Martins Kronis <martins.kuznecovs@tilde.lv>
This commit is contained in:
SilverSulfide
2024-09-06 05:01:25 +03:00
committed by GitHub
parent 1f29e4a1a9
commit 888f74bf3c
11 changed files with 175 additions and 31 deletions

View File

@@ -21,13 +21,17 @@ class OnlineLM {
static std::unique_ptr<OnlineLM> Create(const OnlineLMConfig &config);
virtual std::pair<Ort::Value, std::vector<Ort::Value>> GetInitStates() = 0;
// init states for classic rescore
virtual std::vector<Ort::Value> GetInitStates() = 0;
/** ScoreToken a batch of sentences.
// init states for shallow fusion
virtual std::pair<Ort::Value, std::vector<Ort::Value>> GetInitStatesSF() = 0;
/** ScoreToken a batch of sentences (shallow fusion).
*
* @param x A 2-D tensor of shape (N, 1) with data type int64.
* @param states It contains the states for the LM model
* @return Return a pair containingo
* @return Return a pair containing
* - log_prob of NN LM
* - updated states
*
@@ -35,13 +39,23 @@ class OnlineLM {
virtual std::pair<Ort::Value, std::vector<Ort::Value>> ScoreToken(
Ort::Value x, std::vector<Ort::Value> states) = 0;
/** This function updates lm_lob_prob and nn_lm_scores of hyp
/** This function updates hyp.lm_log_prob of hyps (classic rescore).
*
* @param scale LM score
* @param context_size Context size of the transducer decoder model
* @param hyps It is changed in-place.
*
*/
virtual void ComputeLMScore(float scale, int32_t context_size,
std::vector<Hypotheses> *hyps) = 0;
/** This function updates lm_log_prob and nn_lm_scores of hyp (shallow fusion).
*
* @param scale LM score
* @param hyps It is changed in-place.
*
*/
virtual void ComputeLMScore(float scale, Hypothesis *hyp) = 0;
virtual void ComputeLMScoreSF(float scale, Hypothesis *hyp) = 0;
};
} // namespace sherpa_onnx