diff --git a/vllm/engine/arg_utils.py b/vllm/engine/arg_utils.py index cc7c99e50ac4d..04629b7ffe977 100644 --- a/vllm/engine/arg_utils.py +++ b/vllm/engine/arg_utils.py @@ -1289,7 +1289,7 @@ def _override_v1_engine_args(self, usage_context: UsageContext) -> None: # context. # Use different default values for different hardware. from vllm.platforms import current_platform - device_name = current_platform.get_device_name().lower() + device_name = str(current_platform.get_device_name().lower()) if "h100" in device_name or "h200" in device_name: # For H100 and H200, we use larger default values. default_max_num_batched_tokens = {