Skip to content

Commit

Permalink
catch up vllm main
Browse files Browse the repository at this point in the history
  • Loading branch information
noooop committed Sep 29, 2024
1 parent 653da13 commit 653794e
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions vllm/wde/prefill_only/runner/model_runner.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
import torch.nn as nn

from vllm.logger import init_logger
-from vllm.utils import CudaMemoryProfiler, is_pin_memory_available
+from vllm.utils import DeviceMemoryProfiler, is_pin_memory_available
from vllm.wde.core.config import DeviceConfig, LoadConfig, ModelConfig
from vllm.wde.core.layers.attention import AttentionBackend
from vllm.wde.prefill_only.config import PrefillOnlySchedulerConfig
Expand Down Expand Up @@ -37,7 +37,7 @@ def load_model(self) -> None:
initialize_model)

logger.info("Starting to load model %s...", self.model_config.model)
-with CudaMemoryProfiler() as m:
+with DeviceMemoryProfiler() as m:
loader = get_model_loader(self.load_config)
self.model = initialize_model(model_config=self.model_config,
load_config=self.load_config,
Expand Down

0 comments on commit 653794e

Please sign in to comment.