from typing import List, Optional, Tuple, Type, overload import pytest import transformers from transformers import (AutoConfig, AutoModelForVision2Seq, AutoTokenizer, BatchEncoding) from vllm.multimodal.utils import (rescale_image_size, rescale_video_size, resize_video, sample_frames_from_video) from vllm.sequence import SampleLogprobs from vllm.utils import STR_DTYPE_TO_TORCH_DTYPE from ....conftest import (VIDEO_ASSETS, HfRunner, PromptImageInput, VllmRunner, _VideoAssets) from ...utils import check_logprobs_close # Video test HF_VIDEO_PROMPTS = VIDEO_ASSETS.prompts({ "sample_demo_1": "<|im_start|>user