We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 837d9c9 commit 1f14355Copy full SHA for 1f14355
vllm/model_executor/models/utils.py
@@ -508,7 +508,9 @@ def merge_multimodal_embeddings(
508
"""
509
if isinstance(placeholder_token_id, list):
510
placeholder_token_id = torch.tensor(placeholder_token_id,
511
- device=input_ids.device)
+ pin_memory=True).to(
512
+ device=input_ids.device,
513
+ non_blocking=True)
514
return _merge_multimodal_embeddings(
515
inputs_embeds,
516
torch.isin(input_ids, placeholder_token_id),
0 commit comments