We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent d465e7c, commit 2cac2cd (Copy full SHA for 2cac2cd)
vllm_ascend/worker/multi_step_runner.py
@@ -14,7 +14,6 @@
14
from vllm.model_executor.model_loader.tensorizer import TensorizerConfig
15
from vllm.sequence import (CompletionSequenceGroupOutput, IntermediateTensors,
16
Logprob, SequenceGroupMetadata, SequenceOutput)
17
-from vllm_ascend.utils import current_stream
18
from vllm.worker.model_runner_base import (
19
_init_attn_metadata_from_tensor_dict,
20
_init_frozen_model_input_from_tensor_dict,
@@ -23,6 +22,7 @@
23
22
PythonizationCache,
24
StatefulModelInput)
25
+from vllm_ascend.utils import current_stream
26
from vllm_ascend.worker.model_runner import (
27
ModelInputForNPUWithSamplingMetadata, NPUModelRunnerBase)
28
0 commit comments