Skip to content

Commit 8c5407d

Browse files
remove cum_offsets from ForwardMeta (#2925)
1 parent 25698d5 commit 8c5407d

File tree

3 files changed

+2
-5
lines changed

3 files changed

+2
-5
lines changed

fastdeploy/model_executor/forward_meta.py

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -85,8 +85,6 @@ class ForwardMeta:
8585
# The sequence length processed in the current step
8686
seq_lens_this_time: Optional[paddle.Tensor] = None
8787

88-
# Accumulated offset
89-
cum_offsets: Optional[paddle.Tensor] = None
9088
# batch_id_per_token tensor, indicating which batch each token belongs to after padding has been removed from the original input_ids
9189
batch_id_per_token: Optional[paddle.Tensor] = None
9290
# Accumulated sequence length of query
@@ -112,7 +110,8 @@ class XPUForwardMeta(ForwardMeta):
112110
"""
113111
XPUForwardMeta stores the global meta information of the forward pass, plus some XPU-specific meta info.
114112
"""
115-
113+
# Accumulated offset
114+
cum_offsets: Optional[paddle.Tensor] = None
116115
# TODO(wanghaitao): Supplementary notes
117116
#
118117
encoder_batch_map: Optional[paddle.Tensor] = None

fastdeploy/spec_decode/mtp.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -397,7 +397,6 @@ def _initialize_forward_meta(self):
397397
seq_lens_encoder=self.model_inputs["seq_lens_encoder"],
398398
seq_lens_decoder=self.model_inputs["seq_lens_decoder"],
399399
seq_lens_this_time=self.model_inputs["seq_lens_this_time"],
400-
cum_offsets=self.model_inputs["cum_offsets"],
401400
batch_id_per_token=self.model_inputs["batch_id_per_token"],
402401
cu_seqlens_q=self.model_inputs["cu_seqlens_q"],
403402
cu_seqlens_k=self.model_inputs["cu_seqlens_k"],

fastdeploy/worker/gpu_model_runner.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -680,7 +680,6 @@ def initialize_forward_meta(self):
680680
seq_lens_encoder=self.share_inputs["seq_lens_encoder"],
681681
seq_lens_decoder=self.share_inputs["seq_lens_decoder"],
682682
seq_lens_this_time=self.share_inputs["seq_lens_this_time"],
683-
cum_offsets=self.share_inputs["cum_offsets"],
684683
batch_id_per_token=self.share_inputs["batch_id_per_token"],
685684
cu_seqlens_q=self.share_inputs["cu_seqlens_q"],
686685
cu_seqlens_k=self.share_inputs["cu_seqlens_k"],

0 commit comments

Comments
 (0)