Skip to content

Commit 13e44df

Browse files
committed
Use as many batch operations as possible
Signed-off-by: wang.yuqi <noooop@126.com>
1 parent 8ff2418 commit 13e44df

File tree

1 file changed

+8
-0
lines changed

1 file changed

+8
-0
lines changed

vllm/model_executor/layers/pooler.py

Lines changed: 8 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -469,6 +469,10 @@ def forward(self, pooled_data: Union[list[torch.Tensor], torch.Tensor],
469 469

470 470
pooling_params = get_pooling_params(pooling_metadata)
471 471

472+
if isinstance(pooled_data, list):
473+
pooled_data = torch.stack(pooled_data)
474+
# pooled_data shape: [batchsize, embedding_dimension]
475+
472 476
# for matryoshka representation
473 477
dimensions_list = [
474 478
pooling_param.dimensions for pooling_param in pooling_params
@@ -659,6 +663,10 @@ def forward(
659 663
) -> PoolerOutput:
660 664
pooled_data = self.pooling(hidden_states, pooling_metadata)
661 665

666+
if isinstance(pooled_data, list):
667+
pooled_data = torch.stack(pooled_data)
668+
# pooled_data shape: [batchsize, hidden_size]
669+
662 670
if self.classifier is not None:
663 671
# apply classifier once on the full batch if possible
664 672
if isinstance(pooled_data, torch.Tensor):

0 commit comments

Comments
 (0)