diff --git a/vllm/engine/llm_engine.py b/vllm/engine/llm_engine.py index 0f6e34ab5142d..e5458b3759b5d 100644 --- a/vllm/engine/llm_engine.py +++ b/vllm/engine/llm_engine.py @@ -256,25 +256,39 @@ def __init__( "use_async_output_proc=%s, use_cached_outputs=%s, " "mm_processor_kwargs=%s, " "pooling_config_type=%s, normalize=%s)", VLLM_VERSION, - model_config.model, speculative_config, model_config.tokenizer, - model_config.skip_tokenizer_init, model_config.tokenizer_mode, - model_config.revision, model_config.override_neuron_config, - model_config.rope_scaling, model_config.rope_theta, - model_config.tokenizer_revision, model_config.trust_remote_code, - model_config.dtype, model_config.max_model_len, - load_config.download_dir, load_config.load_format, + model_config.model, + speculative_config, + model_config.tokenizer, + model_config.skip_tokenizer_init, + model_config.tokenizer_mode, + model_config.revision, + model_config.override_neuron_config, + model_config.rope_scaling, + model_config.rope_theta, + model_config.tokenizer_revision, + model_config.trust_remote_code, + model_config.dtype, + model_config.max_model_len, + load_config.download_dir, + load_config.load_format, parallel_config.tensor_parallel_size, parallel_config.pipeline_parallel_size, parallel_config.disable_custom_all_reduce, - model_config.quantization, model_config.enforce_eager, - cache_config.cache_dtype, model_config.quantization_param_path, - device_config.device, decoding_config, observability_config, - model_config.seed, model_config.served_model_name, + model_config.quantization, + model_config.enforce_eager, + cache_config.cache_dtype, + model_config.quantization_param_path, + device_config.device, + decoding_config, + observability_config, + model_config.seed, + model_config.served_model_name, scheduler_config.num_scheduler_steps, scheduler_config.chunked_prefill_enabled, scheduler_config.multi_step_stream_outputs, cache_config.enable_prefix_caching, - model_config.use_async_output_proc, use_cached_outputs, + model_config.use_async_output_proc, + use_cached_outputs, model_config.mm_processor_kwargs, model_config.pooling_config.pooling_type, model_config.pooling_config.normalize)