Skip to content

Commit 24235b4

Browse files
committed
update
Signed-off-by: shen-shanshan <467638484@qq.com>
1 parent 719519e commit 24235b4

File tree

2 files changed

+6
-3
lines changed

2 files changed

+6
-3
lines changed

vllm_ascend/torchair/torchair_attention.py

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -164,11 +164,16 @@ def build(self,
               num_reqs,
               num_actual_tokens,
               max_query_len,
-              graph_pad_size: int = -1,
               enable_dbo_across_dp: bool = False,
+              is_only_prefill: bool = False,
               *args,
               **kwargs):
 
+        if 'graph_pad_size' in kwargs:
+            graph_pad_size = kwargs['graph_pad_size']
+        else:
+            graph_pad_size = -1 # default value
+
         device = self.runner.device
 
         block_table = self.runner.input_batch.block_table[0].get_device_tensor(

vllm_ascend/worker/model_runner_v1.py

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -84,8 +84,6 @@
 from vllm_ascend.platform import NPUPlatform
 from vllm_ascend.sample.rejection_sampler import AscendRejectionSampler
 from vllm_ascend.torchair.torchair_attention import AscendTorchairMetadata
-from vllm_ascend.torchair.utils import (check_torchair_cache_exist,
-                                        write_kv_cache_bytes_to_file)
 from vllm_ascend.utils import (ACL_FORMAT_FRACTAL_ND, ACL_FORMAT_FRACTAL_NZ,
                                ProfileExecuteDuration, is_310p,
                                maybe_converting_weight_acl_format,

0 commit comments

Comments
 (0)