Skip to content

Commit a635648

Browse files
author
Sigrid Jin (Sionic AI)
committed
refactor: accept review
Signed-off-by: Sigrid Jin (Sionic AI) <sigrid@sionic.ai>
1 parent 27b28f7 commit a635648

File tree

3 files changed

+3
-5
lines changed

3 files changed

+3
-5
lines changed

benchmarks/jina_embeddings_v4_validation.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -155,9 +155,9 @@ def compute_vllm_embeddings(
155 | 155 |
156 | 156 |      for output in outputs:
157 | 157 |          # Extract based on token type
158 |     | -        if 151652 in output.prompt_token_ids: # VISION_START_TOKEN_ID
159 |     | -            img_start = output.prompt_token_ids.index(151652)
160 |     | -            img_end = output.prompt_token_ids.index(151653)
    | 158 | +        if VISION_START_TOKEN_ID in output.prompt_token_ids:
    | 159 | +            img_start = output.prompt_token_ids.index(VISION_START_TOKEN_ID)
    | 160 | +            img_end = output.prompt_token_ids.index(VISION_END_TOKEN_ID)
161 | 161 |              embedding_data = output.outputs.data[img_start : img_end + 1]
162 | 162 |          else:
163 | 163 |              embedding_data = output.outputs.data

vllm/model_executor/models/jina_embeddings_v4.py

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -35,8 +35,6 @@
35 | 35 |
36 | 36 |  PoolingMetadata = Union[V0PoolingMetadata, V1PoolingMetadata]
37 | 37 |
38 |    | -# Triton kernel for optimized vision token extraction
39 |    | -
40 | 38 |
41 | 39 |  @MULTIMODAL_REGISTRY.register_processor(Qwen2VLMultiModalProcessor,
42 | 40 |                                          info=Qwen2VLProcessingInfo,

0 commit comments

Comments
 (0)