diff --git a/docs/source/tutorials.md b/docs/source/tutorials.md index b3bda7f..b907c02 100644 --- a/docs/source/tutorials.md +++ b/docs/source/tutorials.md @@ -237,7 +237,10 @@ docker run \ ``` Choose one machine as head node, the other are worker nodes, then start ray on each machine: -:::{note} Check out your `nic_name` by command `ip addr` ::: + +:::{note} +Find your `nic_name` by running the `ip addr` command. +::: ```shell # Head node diff --git a/vllm_ascend/model_runner.py b/vllm_ascend/model_runner.py index 3376384..1cf06dd 100644 --- a/vllm_ascend/model_runner.py +++ b/vllm_ascend/model_runner.py @@ -1113,8 +1113,8 @@ class NPUModelRunner(NPUModelRunnerBase[ModelInputForNPUWithSamplingMetadata]): if (self.observability_config is not None and self.observability_config.collect_model_forward_time): - model_forward_start = torch.cuda.Event(enable_timing=True) - model_forward_end = torch.cuda.Event(enable_timing=True) + model_forward_start = torch_npu.npu.Event(enable_timing=True) + model_forward_end = torch_npu.npu.Event(enable_timing=True) model_forward_start.record() if not bypass_model_exec: