diff --git a/vllm/engine/arg_utils.py b/vllm/engine/arg_utils.py index b0383c95e5cb7..03c73686b8ee1 100644 --- a/vllm/engine/arg_utils.py +++ b/vllm/engine/arg_utils.py @@ -571,10 +571,10 @@ def create_engine_config(self, ) -> EngineConfig: self.code_revision, self.rope_scaling, self.tokenizer_revision, self.max_model_len, self.quantization, self.quantization_param_path, self.quantization_weights_path, - self.enforce_eager, - self.max_context_len_to_capture, self.max_seq_len_to_capture, - self.max_logprobs, self.disable_sliding_window, - self.skip_tokenizer_init, self.served_model_name) + self.enforce_eager, self.max_context_len_to_capture, + self.max_seq_len_to_capture, self.max_logprobs, + self.disable_sliding_window, self.skip_tokenizer_init, + self.served_model_name) cache_config = CacheConfig(self.block_size, self.gpu_memory_utilization, self.swap_space, self.kv_cache_dtype,