diff --git a/vllm_neuron/worker/neuronx_distributed_model_loader.py b/vllm_neuron/worker/neuronx_distributed_model_loader.py index 6d76487..f170375 100644 --- a/vllm_neuron/worker/neuronx_distributed_model_loader.py +++ b/vllm_neuron/worker/neuronx_distributed_model_loader.py @@ -51,7 +51,7 @@ ) from vllm.model_executor.layers.logits_processor import LogitsProcessor from vllm.v1.outputs import SamplerOutput -from vllm.v1.sample import sampler as Sampler +from vllm.v1.sample.sampler import Sampler from vllm_neuron.worker.constants import ( NEURON_MULTI_MODAL_MODELS,