[Misc] Adjust the default profiler configuration (#1097)
### What this PR does / why we need it? When profiling, it is often necessary to disable the call stack to reduce profiling overhead, and adjust the profiler_level to level1 to obtain more detailed operator and communication information. Therefore, it is recommended to modify the default profiling configuration. ### Does this PR introduce _any_ user-facing change? No ### How was this patch tested? No Signed-off-by: ApsarasX <apsarax@outlook.com>
This commit is contained in:
@@ -140,7 +140,7 @@ class NPUWorker(LocalOrDistributedWorkerBase):
|
|||||||
|
|
||||||
experimental_config = torch_npu.profiler._ExperimentalConfig(
|
experimental_config = torch_npu.profiler._ExperimentalConfig(
|
||||||
export_type=torch_npu.profiler.ExportType.Text,
|
export_type=torch_npu.profiler.ExportType.Text,
|
||||||
profiler_level=torch_npu.profiler.ProfilerLevel.Level0,
|
profiler_level=torch_npu.profiler.ProfilerLevel.Level1,
|
||||||
msprof_tx=False,
|
msprof_tx=False,
|
||||||
aic_metrics=torch_npu.profiler.AiCMetrics.AiCoreNone,
|
aic_metrics=torch_npu.profiler.AiCMetrics.AiCoreNone,
|
||||||
l2_cache=False,
|
l2_cache=False,
|
||||||
@@ -155,9 +155,9 @@ class NPUWorker(LocalOrDistributedWorkerBase):
|
|||||||
torch_npu.profiler.ProfilerActivity.CPU,
|
torch_npu.profiler.ProfilerActivity.CPU,
|
||||||
torch_npu.profiler.ProfilerActivity.NPU,
|
torch_npu.profiler.ProfilerActivity.NPU,
|
||||||
],
|
],
|
||||||
with_stack=True,
|
with_stack=False,
|
||||||
profile_memory=True,
|
profile_memory=False,
|
||||||
with_modules=True,
|
with_modules=False,
|
||||||
experimental_config=experimental_config,
|
experimental_config=experimental_config,
|
||||||
on_trace_ready=torch_npu.profiler.tensorboard_trace_handler(
|
on_trace_ready=torch_npu.profiler.tensorboard_trace_handler(
|
||||||
torch_profiler_trace_dir))
|
torch_profiler_trace_dir))
|
||||||
|
|||||||
@@ -275,7 +275,7 @@ class NPUWorker(WorkerBase):
|
|||||||
|
|
||||||
experimental_config = torch_npu.profiler._ExperimentalConfig(
|
experimental_config = torch_npu.profiler._ExperimentalConfig(
|
||||||
export_type=torch_npu.profiler.ExportType.Text,
|
export_type=torch_npu.profiler.ExportType.Text,
|
||||||
profiler_level=torch_npu.profiler.ProfilerLevel.Level0,
|
profiler_level=torch_npu.profiler.ProfilerLevel.Level1,
|
||||||
msprof_tx=False,
|
msprof_tx=False,
|
||||||
aic_metrics=torch_npu.profiler.AiCMetrics.AiCoreNone,
|
aic_metrics=torch_npu.profiler.AiCMetrics.AiCoreNone,
|
||||||
l2_cache=False,
|
l2_cache=False,
|
||||||
@@ -290,9 +290,9 @@ class NPUWorker(WorkerBase):
|
|||||||
torch_npu.profiler.ProfilerActivity.CPU,
|
torch_npu.profiler.ProfilerActivity.CPU,
|
||||||
torch_npu.profiler.ProfilerActivity.NPU,
|
torch_npu.profiler.ProfilerActivity.NPU,
|
||||||
],
|
],
|
||||||
with_stack=True,
|
with_stack=False,
|
||||||
profile_memory=True,
|
profile_memory=False,
|
||||||
with_modules=True,
|
with_modules=False,
|
||||||
experimental_config=experimental_config,
|
experimental_config=experimental_config,
|
||||||
on_trace_ready=torch_npu.profiler.tensorboard_trace_handler(
|
on_trace_ready=torch_npu.profiler.tensorboard_trace_handler(
|
||||||
torch_profiler_trace_dir))
|
torch_profiler_trace_dir))
|
||||||
|
|||||||
Reference in New Issue
Block a user