Skip to content

Commit babad6e

Browse files
[Misc] Move DP for ViT code inside model executor dir (#25459)
Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
1 parent 9383cd6 commit babad6e

File tree

13 files changed

+721
-730
lines changed

13 files changed

+721
-730
lines changed

tests/models/test_vision.py

Lines changed: 423 additions & 1 deletion
Large diffs are not rendered by default.

tests/multimodal/test_utils.py

Lines changed: 1 addition & 425 deletions
Large diffs are not rendered by default.

vllm/model_executor/models/glm4_1v.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -69,7 +69,6 @@
6969
BaseProcessingInfo, PromptReplacement,
7070
PromptUpdate, PromptUpdateDetails)
7171
from vllm.multimodal.profiling import BaseDummyInputsBuilder
72-
from vllm.multimodal.utils import run_dp_sharded_mrope_vision_model
7372
from vllm.platforms import _Backend
7473
from vllm.sequence import IntermediateTensors
7574
from vllm.transformers_utils.config import uses_mrope
@@ -83,7 +82,7 @@
8382
from .utils import (AutoWeightsLoader, WeightsMapper,
8483
init_vllm_registered_model, maybe_prefix,
8584
merge_multimodal_embeddings)
86-
from .vision import get_vit_attn_backend
85+
from .vision import get_vit_attn_backend, run_dp_sharded_mrope_vision_model
8786

8887
logger = init_logger(__name__)
8988

vllm/model_executor/models/idefics2_vision_model.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -34,7 +34,8 @@
3434
RowParallelLinear)
3535
from vllm.model_executor.layers.quantization import QuantizationConfig
3636
from vllm.model_executor.model_loader.weight_utils import default_weight_loader
37-
from vllm.multimodal.utils import run_dp_sharded_vision_model
37+
38+
from .vision import run_dp_sharded_vision_model
3839

3940

4041
class Idefics2VisionEmbeddings(nn.Module):

vllm/model_executor/models/intern_vit.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -28,7 +28,8 @@
2828
RowParallelLinear)
2929
from vllm.model_executor.layers.quantization import QuantizationConfig
3030
from vllm.model_executor.model_loader.weight_utils import default_weight_loader
31-
from vllm.multimodal.utils import run_dp_sharded_vision_model
31+
32+
from .vision import run_dp_sharded_vision_model
3233

3334
NORM2FN = {
3435
'rms_norm': RMSNorm,

vllm/model_executor/models/kimi_vl.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -76,13 +76,13 @@
7676
BaseProcessingInfo, PromptReplacement,
7777
PromptUpdate)
7878
from vllm.multimodal.profiling import BaseDummyInputsBuilder
79-
from vllm.multimodal.utils import run_dp_sharded_mrope_vision_model
8079
from vllm.sequence import IntermediateTensors
8180
from vllm.transformers_utils.configs import KimiVLConfig, MoonViTConfig
8281
from vllm.transformers_utils.configs.deepseek_vl2 import DeepseekV2Config
8382
from vllm.utils.tensor_schema import TensorSchema, TensorShape
8483

8584
from .utils import PPMissingLayer, is_pp_missing_parameter, maybe_prefix
85+
from .vision import run_dp_sharded_mrope_vision_model
8686

8787

8888
# For dummy input only

vllm/model_executor/models/mllama4.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -50,14 +50,14 @@
5050
BaseProcessingInfo, PromptReplacement,
5151
PromptUpdate, PromptUpdateDetails)
5252
from vllm.multimodal.profiling import BaseDummyInputsBuilder
53-
from vllm.multimodal.utils import run_dp_sharded_vision_model
5453
from vllm.sequence import IntermediateTensors
5554
from vllm.utils.tensor_schema import TensorSchema, TensorShape
5655

5756
from .interfaces import MultiModalEmbeddings, SupportsMultiModal, SupportsPP
5857
from .llama4 import Llama4ForCausalLM
5958
from .utils import (AutoWeightsLoader, flatten_bn, maybe_prefix,
6059
merge_multimodal_embeddings)
60+
from .vision import run_dp_sharded_vision_model
6161

6262

6363
class Llama4ImagePatchInputs(TensorSchema):

vllm/model_executor/models/qwen2_5_vl.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -59,7 +59,6 @@
5959
from vllm.model_executor.models.module_mapping import MultiModelKeys
6060
from vllm.multimodal import MULTIMODAL_REGISTRY
6161
from vllm.multimodal.inputs import MultiModalFieldConfig
62-
from vllm.multimodal.utils import run_dp_sharded_mrope_vision_model
6362
from vllm.platforms import _Backend
6463
from vllm.sequence import IntermediateTensors
6564
from vllm.transformers_utils.config import uses_mrope
@@ -74,7 +73,7 @@
7473
from .utils import (AutoWeightsLoader, WeightsMapper, cast_overflow_tensors,
7574
init_vllm_registered_model, maybe_prefix,
7675
merge_multimodal_embeddings)
77-
from .vision import get_vit_attn_backend
76+
from .vision import get_vit_attn_backend, run_dp_sharded_mrope_vision_model
7877

7978
logger = init_logger(__name__)
8079

vllm/model_executor/models/qwen2_vl.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -66,7 +66,6 @@
6666
BaseProcessingInfo, PromptReplacement,
6767
PromptUpdate)
6868
from vllm.multimodal.profiling import BaseDummyInputsBuilder
69-
from vllm.multimodal.utils import run_dp_sharded_mrope_vision_model
7069
from vllm.platforms import _Backend, current_platform
7170
from vllm.sequence import IntermediateTensors
7271
from vllm.transformers_utils.config import uses_mrope
@@ -78,7 +77,7 @@
7877
from .utils import (AutoWeightsLoader, WeightsMapper,
7978
init_vllm_registered_model, maybe_prefix,
8079
merge_multimodal_embeddings)
81-
from .vision import get_vit_attn_backend
80+
from .vision import get_vit_attn_backend, run_dp_sharded_mrope_vision_model
8281

8382
logger = init_logger(__name__)
8483

vllm/model_executor/models/qwen3_vl.py

Lines changed: 1 addition & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -83,7 +83,7 @@
8383
from .qwen3 import Qwen3ForCausalLM, Qwen3Model
8484
from .utils import (AutoWeightsLoader, PPMissingLayer, WeightsMapper,
8585
maybe_prefix, merge_multimodal_embeddings)
86-
from .vision import get_vit_attn_backend
86+
from .vision import get_vit_attn_backend, run_dp_sharded_mrope_vision_model
8787

8888
logger = init_logger(__name__)
8989

@@ -1214,8 +1214,6 @@ def _process_image_input(
12141214
else:
12151215
pixel_values = image_input["pixel_values"].type(self.visual.dtype)
12161216
if self.use_data_parallel:
1217-
from vllm.multimodal.utils import (
1218-
run_dp_sharded_mrope_vision_model)
12191217
return run_dp_sharded_mrope_vision_model(self.visual,
12201218
pixel_values,
12211219
grid_thw_list,
@@ -1245,8 +1243,6 @@ def _process_video_input(
12451243
pixel_values_videos = video_input["pixel_values_videos"].type(
12461244
self.visual.dtype)
12471245
if self.use_data_parallel:
1248-
from vllm.multimodal.utils import (
1249-
run_dp_sharded_mrope_vision_model)
12501246
return run_dp_sharded_mrope_vision_model(self.visual,
12511247
pixel_values_videos,
12521248
grid_thw_list,

0 commit comments

Comments
 (0)