[310P]: add torch chunk gated delta rule and 910b parity ut (#7594)
### What this PR does / why we need it?

RFC: https://github.com/vllm-project/vllm-ascend/issues/7394

Add a PyTorch implementation of the chunk gated delta rule on 310P.

### Does this PR introduce _any_ user-facing change?

No.

### How was this patch tested?

Unit tests (UT).

---------

Signed-off-by: Tflowers-0129 <2906339855@qq.com>
This commit is contained in:
@@ -1,7 +1,9 @@
|
||||
from .chunk_gated_delta_rule import chunk_gated_delta_rule_pytorch
|
||||
from .fused_gdn_gating import fused_gdn_gating_pytorch
|
||||
from .fused_recurrent_gated_delta_rule import fused_recurrent_gated_delta_rule_pytorch
|
||||
|
||||
__all__ = [
|
||||
"fused_gdn_gating_pytorch",
|
||||
"fused_recurrent_gated_delta_rule_pytorch",
|
||||
"chunk_gated_delta_rule_pytorch",
|
||||
]
|
||||
|
||||
Reference in New Issue
Block a user