Skip to content
Merged
Show file tree
Hide file tree
Changes from 3 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion vllm/model_executor/models/hunyuan_vision.py
Original file line number Diff line number Diff line change
Expand Up @@ -847,7 +847,7 @@ def get_xdrope_input_positions(
.expand(-1, llm_grid_w + 1)
.reshape(-1)
)
- h_index[pos : pos + token_num] = 0
+ t_index[pos : pos + token_num] = image_index

if xd_num == 4:
llm_positions = torch.stack([p_index, w_index, h_index, t_index])
Expand Down
6 changes: 3 additions & 3 deletions vllm/transformers_utils/processors/hunyuan_vl_image.py
Original file line number Diff line number Diff line change
Expand Up @@ -195,9 +195,9 @@ def _preprocess(
processed_images = []
for image in images:
if do_resize:
- resized_width, resized_height = smart_resize(
- width,
- height,
+ resized_height, resized_width = smart_resize(
+ height=height,
+ width=width,
factor=patch_size * merge_size,
min_pixels=self.min_pixels,
max_pixels=self.max_pixels,
Expand Down