Skip to content

Commit 737e0ea

Browse files
author
litianjian
committed
update
1 parent ba8ac97 commit 737e0ea

File tree

2 files changed

+10
-8
lines changed

2 files changed

+10
-8
lines changed

tests/models/decoder_only/vision_language/test_llava_onevision.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -9,8 +9,8 @@
99
from vllm.sequence import SampleLogprobs
1010
from vllm.utils import STR_DTYPE_TO_TORCH_DTYPE
1111

12-
from ....conftest import (VIDEO_ASSETS, HfRunner, PromptImageInput, VllmRunner,
13-
_VideoAssets)
12+
from ....conftest import (VIDEO_ASSETS, HfRunner, PromptImageInput, PromptVideoInput,
13+
VllmRunner, _VideoAssets)
1414
from ....utils import large_gpu_test
1515
from ...utils import check_logprobs_close
1616

vllm/model_executor/models/llava_onevision.py

Lines changed: 8 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -348,18 +348,18 @@ def input_processor_when_multimodal_input_video(ctx: InputContext,
348348
tokenizer = cached_get_tokenizer(model_config.tokenizer)
349349
new_prompt, new_token_ids = repeat_and_pad_placeholder_tokens(
350350
tokenizer,
351-
llm_inputs.get("prompt"),
352-
llm_inputs["prompt_token_ids"],
351+
inputs.get("prompt"),
352+
inputs["prompt_token_ids"],
353353
placeholder_token_id=hf_config.video_token_index,
354354
repeat_count=video_feature_size,
355355
)
356-
return LLMInputs(prompt_token_ids=new_token_ids,
357-
prompt=new_prompt,
358-
multi_modal_data=multi_modal_data)
356+
return token_inputs(prompt_token_ids=new_token_ids,
357+
prompt=new_prompt,
358+
multi_modal_data=multi_modal_data)
359359
else:
360360
raise TypeError(f"Invalid video type: {type(video_data)}")
361361

362-
msg = f"Unsupported vision config: {type(vision_config)}"
362+
msg = f"Unsupported video type: {type(video_data)}"
363363
raise NotImplementedError(msg)
364364

365365

@@ -841,6 +841,8 @@ def forward(
841841
batch.
842842
pixel_values_videos: Pixels in each frame of each input video.
843843
"""
844+
# import pdb; pdb.set_trace()
845+
844846
if intermediate_tensors is not None:
845847
input_ids = None
846848
inputs_embeds = None

0 commit comments

Comments
 (0)