mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-13 13:25:30 +08:00
[CI] Split mteb test from Language Models Test (#24634)
Signed-off-by: wang.yuqi <noooop@126.com>
This commit is contained in:
parent
d11ec124a0
commit
fd1ce98cdd
@ -642,6 +642,16 @@ steps:
|
|||||||
commands:
|
commands:
|
||||||
- pytest -v -s models/language/pooling -m 'not core_model'
|
- pytest -v -s models/language/pooling -m 'not core_model'
|
||||||
|
|
||||||
|
- label: Language Models Test (MTEB)
|
||||||
|
timeout_in_minutes: 110
|
||||||
|
mirror_hardwares: [amdexperimental]
|
||||||
|
optional: true
|
||||||
|
source_file_dependencies:
|
||||||
|
- vllm/
|
||||||
|
- tests/models/language/pooling_mteb_test
|
||||||
|
commands:
|
||||||
|
- pytest -v -s models/language/pooling_mteb_test
|
||||||
|
|
||||||
- label: Multi-Modal Processor Test # 44min
|
- label: Multi-Modal Processor Test # 44min
|
||||||
timeout_in_minutes: 60
|
timeout_in_minutes: 60
|
||||||
source_file_dependencies:
|
source_file_dependencies:
|
||||||
|
|||||||
@ -4,10 +4,9 @@ import os
|
|||||||
|
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
from tests.models.language.pooling.mteb_utils import (MTEB_EMBED_TASKS,
|
from tests.models.language.pooling_mteb_test.mteb_utils import (
|
||||||
MTEB_EMBED_TOL,
|
MTEB_EMBED_TASKS, MTEB_EMBED_TOL, OpenAIClientMtebEncoder,
|
||||||
OpenAIClientMtebEncoder,
|
run_mteb_embed_task)
|
||||||
run_mteb_embed_task)
|
|
||||||
from tests.utils import RemoteOpenAIServer
|
from tests.utils import RemoteOpenAIServer
|
||||||
|
|
||||||
os.environ["VLLM_LOGGING_LEVEL"] = "WARNING"
|
os.environ["VLLM_LOGGING_LEVEL"] = "WARNING"
|
||||||
|
|||||||
@ -4,15 +4,9 @@ import os
|
|||||||
|
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
# yapf conflicts with isort for this block
|
from tests.models.language.pooling_mteb_test.mteb_utils import (
|
||||||
# yapf: disable
|
MTEB_RERANK_LANGS, MTEB_RERANK_TASKS, MTEB_RERANK_TOL,
|
||||||
from tests.models.language.pooling.mteb_utils import (MTEB_RERANK_LANGS,
|
RerankClientMtebEncoder, ScoreClientMtebEncoder, run_mteb_rerank)
|
||||||
MTEB_RERANK_TASKS,
|
|
||||||
MTEB_RERANK_TOL,
|
|
||||||
RerankClientMtebEncoder,
|
|
||||||
ScoreClientMtebEncoder,
|
|
||||||
run_mteb_rerank)
|
|
||||||
# yapf: enable
|
|
||||||
from tests.utils import RemoteOpenAIServer
|
from tests.utils import RemoteOpenAIServer
|
||||||
|
|
||||||
os.environ["VLLM_LOGGING_LEVEL"] = "WARNING"
|
os.environ["VLLM_LOGGING_LEVEL"] = "WARNING"
|
||||||
|
|||||||
0
tests/models/language/pooling_mteb_test/__init__.py
Normal file
0
tests/models/language/pooling_mteb_test/__init__.py
Normal file
@ -2,10 +2,12 @@
|
|||||||
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
from ...utils import (CLSPoolingEmbedModelInfo, CLSPoolingRerankModelInfo,
|
from tests.models.language.pooling.embed_utils import (
|
||||||
EmbedModelInfo, LASTPoolingEmbedModelInfo,
|
correctness_test_embed_models)
|
||||||
RerankModelInfo)
|
from tests.models.utils import (CLSPoolingEmbedModelInfo,
|
||||||
from .embed_utils import correctness_test_embed_models
|
CLSPoolingRerankModelInfo, EmbedModelInfo,
|
||||||
|
LASTPoolingEmbedModelInfo, RerankModelInfo)
|
||||||
|
|
||||||
from .mteb_utils import mteb_test_embed_models, mteb_test_rerank_models
|
from .mteb_utils import mteb_test_embed_models, mteb_test_rerank_models
|
||||||
|
|
||||||
MODELS = [
|
MODELS = [
|
||||||
@ -7,9 +7,9 @@ import pytest
|
|||||||
import torch
|
import torch
|
||||||
|
|
||||||
from tests.conftest import HfRunner
|
from tests.conftest import HfRunner
|
||||||
|
from tests.models.language.pooling_mteb_test.mteb_utils import (
|
||||||
from ...utils import LASTPoolingRerankModelInfo, RerankModelInfo
|
VllmMtebEncoder, mteb_test_rerank_models)
|
||||||
from .mteb_utils import VllmMtebEncoder, mteb_test_rerank_models
|
from tests.models.utils import LASTPoolingRerankModelInfo, RerankModelInfo
|
||||||
|
|
||||||
RERANK_MODELS = [
|
RERANK_MODELS = [
|
||||||
LASTPoolingRerankModelInfo("BAAI/bge-reranker-v2-gemma",
|
LASTPoolingRerankModelInfo("BAAI/bge-reranker-v2-gemma",
|
||||||
@ -2,8 +2,9 @@
|
|||||||
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
from ...utils import (CLSPoolingRerankModelInfo, LASTPoolingRerankModelInfo,
|
from tests.models.utils import (CLSPoolingRerankModelInfo,
|
||||||
RerankModelInfo)
|
LASTPoolingRerankModelInfo, RerankModelInfo)
|
||||||
|
|
||||||
from .mteb_utils import mteb_test_rerank_models
|
from .mteb_utils import mteb_test_rerank_models
|
||||||
|
|
||||||
RERANK_MODELS = [
|
RERANK_MODELS = [
|
||||||
@ -3,10 +3,12 @@
|
|||||||
|
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
from ...utils import (CLSPoolingEmbedModelInfo, CLSPoolingRerankModelInfo,
|
from tests.models.language.pooling.embed_utils import (
|
||||||
EmbedModelInfo, LASTPoolingEmbedModelInfo,
|
correctness_test_embed_models)
|
||||||
RerankModelInfo)
|
from tests.models.utils import (CLSPoolingEmbedModelInfo,
|
||||||
from .embed_utils import correctness_test_embed_models
|
CLSPoolingRerankModelInfo, EmbedModelInfo,
|
||||||
|
LASTPoolingEmbedModelInfo, RerankModelInfo)
|
||||||
|
|
||||||
from .mteb_utils import mteb_test_embed_models, mteb_test_rerank_models
|
from .mteb_utils import mteb_test_embed_models, mteb_test_rerank_models
|
||||||
|
|
||||||
MODELS = [
|
MODELS = [
|
||||||
@ -2,8 +2,10 @@
|
|||||||
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
from ...utils import CLSPoolingEmbedModelInfo, EmbedModelInfo
|
from tests.models.language.pooling.embed_utils import (
|
||||||
from .embed_utils import correctness_test_embed_models
|
correctness_test_embed_models)
|
||||||
|
from tests.models.utils import CLSPoolingEmbedModelInfo, EmbedModelInfo
|
||||||
|
|
||||||
from .mteb_utils import mteb_test_embed_models
|
from .mteb_utils import mteb_test_embed_models
|
||||||
|
|
||||||
MODELS = [
|
MODELS = [
|
||||||
@ -4,12 +4,13 @@ from functools import partial
|
|||||||
|
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
|
from tests.models.language.pooling.embed_utils import (
|
||||||
|
check_embeddings_close, correctness_test_embed_models, matryoshka_fy)
|
||||||
|
from tests.models.utils import (CLSPoolingEmbedModelInfo,
|
||||||
|
CLSPoolingRerankModelInfo, EmbedModelInfo,
|
||||||
|
RerankModelInfo)
|
||||||
from vllm import PoolingParams
|
from vllm import PoolingParams
|
||||||
|
|
||||||
from ...utils import (CLSPoolingEmbedModelInfo, CLSPoolingRerankModelInfo,
|
|
||||||
EmbedModelInfo, RerankModelInfo)
|
|
||||||
from .embed_utils import (check_embeddings_close,
|
|
||||||
correctness_test_embed_models, matryoshka_fy)
|
|
||||||
from .mteb_utils import mteb_test_embed_models, mteb_test_rerank_models
|
from .mteb_utils import mteb_test_embed_models, mteb_test_rerank_models
|
||||||
|
|
||||||
EMBEDDING_MODELS = [
|
EMBEDDING_MODELS = [
|
||||||
@ -6,8 +6,8 @@ import pytest
|
|||||||
import torch
|
import torch
|
||||||
|
|
||||||
from tests.conftest import HfRunner
|
from tests.conftest import HfRunner
|
||||||
|
from tests.models.utils import LASTPoolingRerankModelInfo, RerankModelInfo
|
||||||
|
|
||||||
from ...utils import LASTPoolingRerankModelInfo, RerankModelInfo
|
|
||||||
from .mteb_utils import mteb_test_rerank_models
|
from .mteb_utils import mteb_test_rerank_models
|
||||||
|
|
||||||
mxbai_rerank_hf_overrides = {
|
mxbai_rerank_hf_overrides = {
|
||||||
@ -3,8 +3,10 @@
|
|||||||
|
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
from ...utils import CLSPoolingEmbedModelInfo, EmbedModelInfo
|
from tests.models.language.pooling.embed_utils import (
|
||||||
from .embed_utils import correctness_test_embed_models
|
correctness_test_embed_models)
|
||||||
|
from tests.models.utils import CLSPoolingEmbedModelInfo, EmbedModelInfo
|
||||||
|
|
||||||
from .mteb_utils import mteb_test_embed_models
|
from .mteb_utils import mteb_test_embed_models
|
||||||
|
|
||||||
MODELS = [
|
MODELS = [
|
||||||
@ -6,9 +6,9 @@ import pytest
|
|||||||
import torch
|
import torch
|
||||||
|
|
||||||
from tests.conftest import HfRunner
|
from tests.conftest import HfRunner
|
||||||
|
from tests.models.utils import LASTPoolingRerankModelInfo, RerankModelInfo
|
||||||
from tests.utils import multi_gpu_test
|
from tests.utils import multi_gpu_test
|
||||||
|
|
||||||
from ...utils import LASTPoolingRerankModelInfo, RerankModelInfo
|
|
||||||
from .mteb_utils import mteb_test_rerank_models
|
from .mteb_utils import mteb_test_rerank_models
|
||||||
|
|
||||||
qwen3_reranker_hf_overrides = {
|
qwen3_reranker_hf_overrides = {
|
||||||
@ -3,8 +3,10 @@
|
|||||||
|
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
from ...utils import CLSPoolingEmbedModelInfo, EmbedModelInfo
|
from tests.models.language.pooling.embed_utils import (
|
||||||
from .embed_utils import correctness_test_embed_models
|
correctness_test_embed_models)
|
||||||
|
from tests.models.utils import CLSPoolingEmbedModelInfo, EmbedModelInfo
|
||||||
|
|
||||||
from .mteb_utils import mteb_test_embed_models
|
from .mteb_utils import mteb_test_embed_models
|
||||||
|
|
||||||
MODELS = [
|
MODELS = [
|
||||||
@ -2,8 +2,9 @@
|
|||||||
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
||||||
import pytest
|
import pytest
|
||||||
|
|
||||||
from ...utils import (CLSPoolingEmbedModelInfo, EmbedModelInfo,
|
from tests.models.utils import (CLSPoolingEmbedModelInfo, EmbedModelInfo,
|
||||||
LASTPoolingEmbedModelInfo)
|
LASTPoolingEmbedModelInfo)
|
||||||
|
|
||||||
from .mteb_utils import mteb_test_embed_models
|
from .mteb_utils import mteb_test_embed_models
|
||||||
|
|
||||||
# ST models with projector (Dense) layers
|
# ST models with projector (Dense) layers
|
||||||
Loading…
x
Reference in New Issue
Block a user