Skip to content

Commit

Permalink
restore Pooling name
Browse files Browse the repository at this point in the history
  • Loading branch information
Yehoshua Cohen committed Dec 3, 2024
1 parent b5d4368 commit 1475d21
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions vllm/worker/pooling_model_runner.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,12 +21,12 @@
@dataclasses.dataclass(frozen=True)
class ModelInputForGPUWithPoolingMetadata(ModelInputForGPU):
"""
- Used by the EmbeddingModelRunner.
+ Used by the PoolingModelRunner.
"""
pooling_metadata: Optional["PoolingMetadata"] = None


- class EmbeddingModelRunner(
+ class PoolingModelRunner(
GPUModelRunnerBase[ModelInputForGPUWithPoolingMetadata]):
_model_input_cls: Type[ModelInputForGPUWithPoolingMetadata] = (
ModelInputForGPUWithPoolingMetadata)
Expand All @@ -52,7 +52,7 @@ def execute_model(
) -> Optional[Union[List[PoolerOutput], IntermediateTensors]]:
if num_steps > 1:
raise ValueError(
- "EmbeddingModelRunner does not support multi-step execution.")
+ "PoolingModelRunner does not support multi-step execution.")

if self.lora_config:
assert model_input.lora_requests is not None
Expand Down

0 comments on commit 1475d21

Please sign in to comment.