|
|
|
@ -5,6 +5,7 @@ from typing import Optional, overload
|
|
|
|
|
|
|
|
|
|
import pytest
|
|
|
|
|
import torch
|
|
|
|
|
from packaging.version import Version
|
|
|
|
|
from transformers import AutoConfig, AutoModelForImageTextToText, AutoTokenizer
|
|
|
|
|
from transformers import __version__ as TRANSFORMERS_VERSION
|
|
|
|
|
|
|
|
|
@ -287,8 +288,8 @@ def clear_cache():
|
|
|
|
|
@pytest.mark.parametrize("num_logprobs", [5])
|
|
|
|
|
@pytest.mark.parametrize("attn_backend", LIST_ENC_DEC_SUPPORTED_BACKENDS)
|
|
|
|
|
@pytest.mark.skipif(
|
|
|
|
|
TRANSFORMERS_VERSION == "4.55.0",
|
|
|
|
|
reason="Transformers v4.55.0 has a regression issue on mllama, "
|
|
|
|
|
Version(TRANSFORMERS_VERSION) <= Version("4.55.2"),
|
|
|
|
|
reason="Transformers v4.55 has a regression issue on mllama, "
|
|
|
|
|
"see: https://github.com/huggingface/transformers/pull/40083")
|
|
|
|
|
def test_models_single_leading_image(hf_runner, vllm_runner, image_assets,
|
|
|
|
|
model, sizes, dtype, max_tokens,
|
|
|
|
@ -319,8 +320,8 @@ def test_models_single_leading_image(hf_runner, vllm_runner, image_assets,
|
|
|
|
|
@pytest.mark.parametrize("num_logprobs", [5])
|
|
|
|
|
@pytest.mark.parametrize("attn_backend", LIST_ENC_DEC_SUPPORTED_BACKENDS)
|
|
|
|
|
@pytest.mark.skipif(
|
|
|
|
|
TRANSFORMERS_VERSION == "4.55.0",
|
|
|
|
|
reason="Transformers v4.55.0 has a regression issue on mllama, "
|
|
|
|
|
Version(TRANSFORMERS_VERSION) <= Version("4.55.2"),
|
|
|
|
|
reason="Transformers v4.55 has a regression issue on mllama, "
|
|
|
|
|
"see: https://github.com/huggingface/transformers/pull/40083")
|
|
|
|
|
def test_models_multi_leading_images(hf_runner, vllm_runner, image_assets,
|
|
|
|
|
model, dtype, max_tokens, num_logprobs,
|
|
|
|
@ -372,8 +373,8 @@ def test_models_multi_leading_images(hf_runner, vllm_runner, image_assets,
|
|
|
|
|
@pytest.mark.parametrize("num_logprobs", [5])
|
|
|
|
|
@pytest.mark.parametrize("attn_backend", LIST_ENC_DEC_SUPPORTED_BACKENDS)
|
|
|
|
|
@pytest.mark.skipif(
|
|
|
|
|
TRANSFORMERS_VERSION == "4.55.0",
|
|
|
|
|
reason="Transformers v4.55.0 has a regression issue on mllama, "
|
|
|
|
|
Version(TRANSFORMERS_VERSION) <= Version("4.55.2"),
|
|
|
|
|
reason="Transformers v4.55 has a regression issue on mllama, "
|
|
|
|
|
"see: https://github.com/huggingface/transformers/pull/40083")
|
|
|
|
|
def test_models_interleaved_images(hf_runner, vllm_runner, image_assets, model,
|
|
|
|
|
dtype, max_tokens, num_logprobs,
|
|
|
|
@ -416,8 +417,8 @@ def test_models_interleaved_images(hf_runner, vllm_runner, image_assets, model,
|
|
|
|
|
@pytest.mark.parametrize("max_tokens", [64])
|
|
|
|
|
@pytest.mark.parametrize("num_logprobs", [5])
|
|
|
|
|
@pytest.mark.skipif(
|
|
|
|
|
TRANSFORMERS_VERSION == "4.55.0",
|
|
|
|
|
reason="Transformers v4.55.0 has a regression issue on mllama, "
|
|
|
|
|
Version(TRANSFORMERS_VERSION) <= Version("4.55.2"),
|
|
|
|
|
reason="Transformers v4.55 has a regression issue on mllama, "
|
|
|
|
|
"see: https://github.com/huggingface/transformers/pull/40083")
|
|
|
|
|
def test_models_distributed(
|
|
|
|
|
hf_runner,
|
|
|
|
|