mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-25 02:35:01 +08:00
38 lines
1.1 KiB
Python
38 lines
1.1 KiB
Python
# SPDX-License-Identifier: Apache-2.0
|
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
|
import pytest
|
|
|
|
from tests.models.utils import (
|
|
RerankModelInfo,
|
|
)
|
|
|
|
from .mteb_score_utils import mteb_test_rerank_models
|
|
|
|
# Models fed to the parametrized MTEB rerank test in this module.
# Each entry carries the model id plus the metadata passed through
# RerankModelInfo: architecture name, pooling/attention type, the
# `mteb_score` value, and the prefix-caching / chunked-prefill flags.
# NOTE(review): `mteb_score` is presumably the reference score the helper
# compares against -- confirm in mteb_score_utils.
RERANK_MODELS = [
    # BERT-style cross-encoder entry (encoder-only attention, CLS pooling).
    RerankModelInfo(
        "cross-encoder/ms-marco-TinyBERT-L-2-v2",
        architecture="BertForSequenceClassification",
        mteb_score=0.32898,
        pooling_type="CLS",
        attn_type="encoder_only",
        is_prefix_caching_supported=False,
        is_chunked_prefill_supported=False,
    ),
    # Qwen3 sequence-classification entry (decoder attention, LAST pooling).
    RerankModelInfo(
        "tomaarsen/Qwen3-Reranker-0.6B-seq-cls",
        architecture="Qwen3ForSequenceClassification",
        mteb_score=0.25736,
        pooling_type="LAST",
        attn_type="decoder",
        is_prefix_caching_supported=True,
        is_chunked_prefill_supported=True,
    ),
]
|
|
|
|
|
|
@pytest.mark.parametrize("model_info", RERANK_MODELS)
def test_rerank_models_mteb(
    hf_runner,
    vllm_runner,
    model_info: RerankModelInfo,
) -> None:
    """Run the shared MTEB rerank check once per entry in RERANK_MODELS.

    The test body only delegates: it forwards the ``hf_runner`` and
    ``vllm_runner`` arguments supplied by pytest, together with the
    parametrized ``model_info``, to ``mteb_test_rerank_models``. Any
    assertions are made inside that helper.
    """
    mteb_test_rerank_models(hf_runner, vllm_runner, model_info)
|