provide an e2e guide for execute duration profiling (#1113)
### What this PR does / why we need it?

Provide an e2e guide for execute duration profiling.

Signed-off-by: depeng1994 <depengzhang@foxmail.com>
This commit is contained in:
@@ -1317,8 +1317,8 @@ class NPUModelRunner(LoRAModelRunnerMixin):
|
||||
for tag, duration in durations.items()
|
||||
]
|
||||
captured_name = "Decode" if self.attn_state == AscendAttentionState.DecodeOnly else "Prefill"
|
||||
print(f"Profile execute duration [{captured_name}]:",
|
||||
" ".join(dr_str))
|
||||
logger.info("Profile execute duration [%s]:%s", captured_name,
|
||||
" ".join(dr_str))
|
||||
|
||||
return model_runner_output
|
||||
|
||||
|
||||
Reference in New Issue
Block a user