10
10
import torch
11
11
12
12
import vllm .envs as envs
13
+ from vllm import version
13
14
from vllm .config import (CacheConfig , CompilationConfig , ConfigFormat ,
14
15
DecodingConfig , DeviceConfig , HfOverrides ,
15
16
KVTransferConfig , LoadConfig , LoadFormat , LoRAConfig ,
@@ -188,6 +189,7 @@ class EngineArgs:
188
189
qlora_adapter_name_or_path : Optional [str ] = None
189
190
disable_logprobs_during_spec_decoding : Optional [bool ] = None
190
191
192
+ show_hidden_metrics_for_version : Optional [str ] = None
191
193
otlp_traces_endpoint : Optional [str ] = None
192
194
collect_detailed_traces : Optional [str ] = None
193
195
disable_async_output_proc : bool = False
@@ -909,6 +911,18 @@ def add_cli_args(parser: FlexibleArgumentParser) -> FlexibleArgumentParser:
909
911
default = None ,
910
912
help = 'Name or path of the QLoRA adapter.' )
911
913
914
+ parser .add_argument ('--show-hidden-metrics-for-version' ,
915
+ type = str ,
916
+ default = None ,
917
+ help = 'Enable deprecated Prometheus metrics that '
918
+ 'have been hidden since the specified version. '
919
+ 'For example, if a previously deprecated metric '
920
+ 'has been hidden since the v0.7.0 release, you '
921
+ 'use --show-hidden-metrics-for-version=0.7 as a '
922
+ 'temporary escape hatch while you migrate to new '
923
+ 'metrics. The metric is likely to be removed '
924
+ 'completely in an upcoming release.' )
925
+
912
926
parser .add_argument (
913
927
'--otlp-traces-endpoint' ,
914
928
type = str ,
@@ -1317,6 +1331,11 @@ def create_engine_config(self,
1317
1331
decoding_config = DecodingConfig (
1318
1332
guided_decoding_backend = self .guided_decoding_backend )
1319
1333
1334
+ show_hidden_metrics = False
1335
+ if self .show_hidden_metrics_for_version is not None :
1336
+ show_hidden_metrics = version ._prev_minor_version_was (
1337
+ self .show_hidden_metrics_for_version )
1338
+
1320
1339
detailed_trace_modules = []
1321
1340
if self .collect_detailed_traces is not None :
1322
1341
detailed_trace_modules = self .collect_detailed_traces .split ("," )
@@ -1326,6 +1345,7 @@ def create_engine_config(self,
1326
1345
f"Invalid module { m } in collect_detailed_traces. "
1327
1346
f"Valid modules are { ALLOWED_DETAILED_TRACE_MODULES } " )
1328
1347
observability_config = ObservabilityConfig (
1348
+ show_hidden_metrics = show_hidden_metrics ,
1329
1349
otlp_traces_endpoint = self .otlp_traces_endpoint ,
1330
1350
collect_model_forward_time = "model" in detailed_trace_modules
1331
1351
or "all" in detailed_trace_modules ,
0 commit comments