# Patch summary (commentary only; text before the "diff --git" header is not part of the patch).
#
# Target file: tests/models/decoder_only/vision_language/test_models.py
# Single hunk (@@ -291,6 +291,15 @@): 6 context lines are kept and 9 lines are added.
#
# The added lines register a new "pixtral_hf" VLMTestInfo entry, placed right after the
# tail of a commented-out entry (the one referencing phi3v_vllm_to_hf_output) and right
# before the existing "qwen" entry. The new entry sets:
#   - models:            ["nm-testing/pixtral-12b-FP8-dynamic"]
#   - test_type:         (VLMTestType.IMAGE, VLMTestType.MULTI_IMAGE)
#   - prompt_formatter:  wraps the image prompt as "[INST]{img_prompt}[/INST]"
#   - img_idx_to_prompt: returns the literal "[IMG]" and does not use its idx argument
#   - max_model_len:     8192
#   - max_num_seqs:      2
#   - auto_cls:          AutoModelForVision2Seq
#
# NOTE(review): AutoModelForVision2Seq must already be imported in the target file; the
# import is not visible in this hunk -- confirm before applying.
# NOTE(review): the patch text below is stored collapsed onto one physical line; the
# original line breaks and indentation must be restored before it can be applied.
diff --git a/tests/models/decoder_only/vision_language/test_models.py b/tests/models/decoder_only/vision_language/test_models.py index d738647c91b66..e49ea6f98324d 100644 --- a/tests/models/decoder_only/vision_language/test_models.py +++ b/tests/models/decoder_only/vision_language/test_models.py @@ -291,6 +291,15 @@ # vllm_output_post_proc=model_utils.phi3v_vllm_to_hf_output, # num_logprobs=10, # ), + "pixtral_hf": VLMTestInfo( + models=["nm-testing/pixtral-12b-FP8-dynamic"], + test_type=(VLMTestType.IMAGE, VLMTestType.MULTI_IMAGE), + prompt_formatter=lambda img_prompt: f"[INST]{img_prompt}[/INST]", + img_idx_to_prompt=lambda idx: "[IMG]", + max_model_len=8192, + max_num_seqs=2, + auto_cls=AutoModelForVision2Seq, + ), "qwen": VLMTestInfo( models=["Qwen/Qwen-VL"], test_type=(VLMTestType.IMAGE, VLMTestType.MULTI_IMAGE),