@@ -110,7 +110,7 @@ def add_parser_api_server():
110110 quant_policy = ArgumentHelper .quant_policy (pt_group )
111111 model_format = ArgumentHelper .model_format (pt_group )
112112 hf_overrides = ArgumentHelper .hf_overrides (pt_group )
113- enable_metrics = ArgumentHelper .enable_metrics (pt_group )
113+ disable_metrics = ArgumentHelper .disable_metrics (pt_group )
114114 ArgumentHelper .dp (pt_group )
115115 ArgumentHelper .ep (pt_group )
116116 ArgumentHelper .enable_microbatch (pt_group )
@@ -135,7 +135,7 @@ def add_parser_api_server():
135135 tb_group ._group_actions .append (quant_policy )
136136 tb_group ._group_actions .append (model_format )
137137 tb_group ._group_actions .append (hf_overrides )
138- tb_group ._group_actions .append (enable_metrics )
138+ tb_group ._group_actions .append (disable_metrics )
139139 ArgumentHelper .rope_scaling_factor (tb_group )
140140 ArgumentHelper .num_tokens_per_iter (tb_group )
141141 ArgumentHelper .max_prefill_iters (tb_group )
@@ -217,7 +217,7 @@ def api_server(args):
217217 max_prefill_token_num = args .max_prefill_token_num ,
218218 enable_microbatch = args .enable_microbatch ,
219219 enable_eplb = args .enable_eplb ,
220- enable_metrics = args .enable_metrics ,
220+ enable_metrics = not args .disable_metrics ,
221221 role = EngineRole [args .role ],
222222 migration_backend = MigrationBackend [args .migration_backend ],
223223 model_format = args .model_format ,
@@ -245,7 +245,7 @@ def api_server(args):
245245 num_tokens_per_iter = args .num_tokens_per_iter ,
246246 max_prefill_iters = args .max_prefill_iters ,
247247 communicator = args .communicator ,
248- enable_metrics = args .enable_metrics ,
248+ enable_metrics = not args .disable_metrics ,
249249 hf_overrides = args .hf_overrides )
250250 chat_template_config = get_chat_template (args .chat_template , args .model_path )
251251
0 commit comments