Skip to content

Commit 3f75181

Browse files
committed
opti profiler default param
Signed-off-by: zzzzwwjj <[email protected]>
1 parent 7271f0d commit 3f75181

File tree

3 files changed

+30
-3
lines changed

3 files changed

+30
-3
lines changed

tests/ut/worker/test_worker_v1.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -520,7 +520,7 @@ def test_init_profiler_enabled(
520520
# Set enum mocks
521521
mock_export_type.Text = "Text"
522522
mock_profiler_level.Level1 = "Level1"
523-
mock_aic_metrics.AiCoreNone = "AiCoreNone"
523+
mock_aic_metrics.PipeUtilization = "PipeUtilization"
524524
mock_profiler_activity.CPU = "CPU"
525525
mock_profiler_activity.NPU = "NPU"
526526

@@ -554,7 +554,7 @@ def test_init_profiler_enabled(
554554
"export_type": "Text",
555555
"profiler_level": "Level1",
556556
"msprof_tx": False,
557-
"aic_metrics": "AiCoreNone",
557+
"aic_metrics": "PipeUtilization",
558558
"l2_cache": False,
559559
"op_attr": False,
560560
"data_simplification": False,

vllm_ascend/envs.py

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -176,6 +176,20 @@
176176
# Whether to enable dynamic EPLB
177177
"DYNAMIC_EPLB":
178178
lambda: os.getenv("DYNAMIC_EPLB", "false").lower(),
179+
# Select which AI Core metrics the torch_npu profiler collects. The following integer values can be configured:
180+
# 0: torch_npu.profiler.AiCMetrics.AiCoreNone;
181+
# 1: torch_npu.profiler.AiCMetrics.PipeUtilization;
182+
# 2: torch_npu.profiler.AiCMetrics.ArithmeticUtilization;
183+
# 3: torch_npu.profiler.AiCMetrics.Memory;
184+
# 4: torch_npu.profiler.AiCMetrics.MemoryL0;
185+
# 5: torch_npu.profiler.AiCMetrics.ResourceConflictRatio;
186+
# 6: torch_npu.profiler.AiCMetrics.MemoryUB;
187+
# 7: torch_npu.profiler.AiCMetrics.L2Cache;
188+
# 8: torch_npu.profiler.AiCMetrics.MemoryAccess;
189+
# If not set, it defaults to 1 (torch_npu.profiler.AiCMetrics.PipeUtilization).
190+
# For the meaning of each option, refer to: https://www.hiascend.com/document/detail/zh/Pytorch/720/apiref/torchnpuCustomsapi/context/torch_npu-profiler-AiCMetrics.md
191+
"VLLM_ASCEND_PROFILER_AIC_METRICS":
192+
lambda: int(os.getenv("VLLM_ASCEND_PROFILER_AIC_METRICS", 1)),
179193
}
180194

181195
# end-env-vars-definition

vllm_ascend/worker/worker_v1.py

Lines changed: 14 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -430,11 +430,24 @@ def _init_profiler(self):
430430
logger.info("Profiling enabled. Traces will be saved to: %s",
431431
torch_profiler_trace_dir)
432432

433+
aic_metrics_list = [
434+
torch_npu.profiler.AiCMetrics.AiCoreNone,
435+
torch_npu.profiler.AiCMetrics.PipeUtilization,
436+
torch_npu.profiler.AiCMetrics.ArithmeticUtilization,
437+
torch_npu.profiler.AiCMetrics.Memory,
438+
torch_npu.profiler.AiCMetrics.MemoryL0,
439+
torch_npu.profiler.AiCMetrics.ResourceConflictRatio,
440+
torch_npu.profiler.AiCMetrics.MemoryUB,
441+
torch_npu.profiler.AiCMetrics.L2Cache,
442+
torch_npu.profiler.AiCMetrics.MemoryAccess
443+
]
444+
433445
experimental_config = torch_npu.profiler._ExperimentalConfig(
434446
export_type=torch_npu.profiler.ExportType.Text,
435447
profiler_level=torch_npu.profiler.ProfilerLevel.Level1,
436448
msprof_tx=False,
437-
aic_metrics=torch_npu.profiler.AiCMetrics.AiCoreNone,
449+
aic_metrics=aic_metrics_list[
450+
envs_ascend.VLLM_ASCEND_PROFILER_AIC_METRICS],
438451
l2_cache=False,
439452
op_attr=False,
440453
data_simplification=False,

0 commit comments

Comments
 (0)