Skip to content

Commit 5f5f356

Browse files
committed
update
Signed-off-by: shen-shanshan <467638484@qq.com>
1 parent 6af2e13 commit 5f5f356

File tree

2 files changed

+6
-3
lines changed

2 files changed

+6
-3
lines changed

vllm_ascend/torchair/torchair_attention.py

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -164,11 +164,16 @@ def build(self,
164 164   num_reqs,
165 165   num_actual_tokens,
166 166   max_query_len,
167     - graph_pad_size: int = -1,
168 167   enable_dbo_across_dp: bool = False,
    168 + is_only_prefill: bool = False,
169 169   *args,
170 170   **kwargs):
171 171
    172 + if 'graph_pad_size' in kwargs:
    173 + graph_pad_size = kwargs['graph_pad_size']
    174 + else:
    175 + graph_pad_size = -1 # default value
    176 +
172 177   device = self.runner.device
173 178
174 179   block_table = self.runner.input_batch.block_table[0].get_device_tensor(

vllm_ascend/worker/model_runner_v1.py

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -85,8 +85,6 @@
85 85   from vllm_ascend.platform import NPUPlatform
86 86   from vllm_ascend.sample.rejection_sampler import AscendRejectionSampler
87 87   from vllm_ascend.torchair.torchair_attention import AscendTorchairMetadata
88    - from vllm_ascend.torchair.utils import (check_torchair_cache_exist,
89    - write_kv_cache_bytes_to_file)
90 88   from vllm_ascend.utils import (ACL_FORMAT_FRACTAL_ND, ACL_FORMAT_FRACTAL_NZ,
91 89   ProfileExecuteDuration, is_310p,
92 90   maybe_converting_weight_acl_format,

0 commit comments

Comments
 (0)