Skip to content

Commit 28de9a8

Browse files
authored
enable metrics by default (#4108)
* enable metrics by default
* fix according to reviewer comments
1 parent 4d1eebd commit 28de9a8

File tree

3 files changed

+13
-10
lines changed

3 files changed

+13
-10
lines changed

lmdeploy/cli/serve.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -110,7 +110,7 @@ def add_parser_api_server():
110110
quant_policy = ArgumentHelper.quant_policy(pt_group)
111111
model_format = ArgumentHelper.model_format(pt_group)
112112
hf_overrides = ArgumentHelper.hf_overrides(pt_group)
113-
enable_metrics = ArgumentHelper.enable_metrics(pt_group)
113+
disable_metrics = ArgumentHelper.disable_metrics(pt_group)
114114
ArgumentHelper.dp(pt_group)
115115
ArgumentHelper.ep(pt_group)
116116
ArgumentHelper.enable_microbatch(pt_group)
@@ -135,7 +135,7 @@ def add_parser_api_server():
135135
tb_group._group_actions.append(quant_policy)
136136
tb_group._group_actions.append(model_format)
137137
tb_group._group_actions.append(hf_overrides)
138-
tb_group._group_actions.append(enable_metrics)
138+
tb_group._group_actions.append(disable_metrics)
139139
ArgumentHelper.rope_scaling_factor(tb_group)
140140
ArgumentHelper.num_tokens_per_iter(tb_group)
141141
ArgumentHelper.max_prefill_iters(tb_group)
@@ -217,7 +217,7 @@ def api_server(args):
217217
max_prefill_token_num=args.max_prefill_token_num,
218218
enable_microbatch=args.enable_microbatch,
219219
enable_eplb=args.enable_eplb,
220-
enable_metrics=args.enable_metrics,
220+
enable_metrics=not args.disable_metrics,
221221
role=EngineRole[args.role],
222222
migration_backend=MigrationBackend[args.migration_backend],
223223
model_format=args.model_format,
@@ -245,7 +245,7 @@ def api_server(args):
245245
num_tokens_per_iter=args.num_tokens_per_iter,
246246
max_prefill_iters=args.max_prefill_iters,
247247
communicator=args.communicator,
248-
enable_metrics=args.enable_metrics,
248+
enable_metrics=not args.disable_metrics,
249249
hf_overrides=args.hf_overrides)
250250
chat_template_config = get_chat_template(args.chat_template, args.model_path)
251251

lmdeploy/cli/utils.py

Lines changed: 7 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -594,9 +594,12 @@ def enable_eplb(parser):
594594
return parser.add_argument('--enable-eplb', action='store_true', help='enable eplb for specified model')
595595

596596
@staticmethod
597-
def enable_metrics(parser):
598-
"""Add argument enable_metrics to parser."""
599-
return parser.add_argument('--enable-metrics', action='store_true', default=False, help='enable metrics system')
597+
def disable_metrics(parser):
598+
"""Add argument disable_metrics to parser."""
599+
return parser.add_argument('--disable-metrics',
600+
action='store_true',
601+
default=False,
602+
help='disable metrics system')
600603

601604
# For Disaggregation
602605
@staticmethod
@@ -623,7 +626,7 @@ def disable_vision_encoder(parser):
623626
return parser.add_argument('--disable-vision-encoder',
624627
action='store_true',
625628
default=False,
626-
help='enable metrics system')
629+
help='disable multimodal encoder')
627630

628631
@staticmethod
629632
def logprobs_mode(parser):

lmdeploy/messages.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -259,7 +259,7 @@ class TurbomindEngineConfig:
259259
empty_init: bool = False
260260
communicator: str = 'nccl'
261261
hf_overrides: Optional[Dict[str, Any]] = None
262-
enable_metrics: bool = False
262+
enable_metrics: bool = True
263263

264264
def __post_init__(self):
265265
"""Check input validation."""
@@ -372,7 +372,7 @@ class PytorchEngineConfig:
372372
enable_mp_engine: bool = False
373373
mp_engine_backend: str = 'mp'
374374
model_format: str = None
375-
enable_metrics: bool = False
375+
enable_metrics: bool = True
376376
hf_overrides: Optional[Dict[str, Any]] = None
377377
disable_vision_encoder: bool = False
378378
logprobs_mode: str = None

0 commit comments

Comments
 (0)