[Bugfix] fix kv buffer register & dp attention & deepepmoe (#9327)
This commit is contained in:
@@ -23,9 +23,7 @@ class AscendKVManager(MooncakeKVManager):
|
||||
)
|
||||
|
||||
def register_buffer_to_engine(self):
|
||||
self.engine.register(
|
||||
self.kv_args.kv_data_ptrs[0], sum(self.kv_args.kv_data_lens)
|
||||
)
|
||||
self.engine.batch_register(self.kv_args.kv_data_ptrs, self.kv_args.kv_data_lens)
|
||||
# The Ascend backend optimize batch registration for small memory blocks.
|
||||
self.engine.batch_register(
|
||||
self.kv_args.aux_data_ptrs, self.kv_args.aux_data_lens
|
||||
|
||||
Reference in New Issue
Block a user