mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 01:05:01 +08:00
[CI] Enable encoder model compilation test (#24442)
Signed-off-by: zjy0516 <riverclouds.zhu@qq.com>
This commit is contained in:
parent
8d7f39b48c
commit
7be141b2c5
@ -62,8 +62,12 @@ class TestSetting:
|
|||||||
TestSetting(
|
TestSetting(
|
||||||
model="BAAI/bge-multilingual-gemma2",
|
model="BAAI/bge-multilingual-gemma2",
|
||||||
model_args=[
|
model_args=[
|
||||||
"--runner", "pooling", "--dtype", "bfloat16",
|
"--runner",
|
||||||
"--max-model-len", "2048"
|
"pooling",
|
||||||
|
"--dtype",
|
||||||
|
"bfloat16",
|
||||||
|
"--max-model-len",
|
||||||
|
"2048",
|
||||||
],
|
],
|
||||||
pp_size=1,
|
pp_size=1,
|
||||||
tp_size=1,
|
tp_size=1,
|
||||||
@ -71,17 +75,15 @@ class TestSetting:
|
|||||||
method="encode",
|
method="encode",
|
||||||
fullgraph=True,
|
fullgraph=True,
|
||||||
),
|
),
|
||||||
# TODO: bert models are not supported in V1 yet
|
TestSetting(
|
||||||
# # encoder-based embedding model (BERT)
|
model="BAAI/bge-base-en-v1.5",
|
||||||
# TestSetting(
|
model_args=["--runner", "pooling"],
|
||||||
# model="BAAI/bge-base-en-v1.5",
|
pp_size=1,
|
||||||
# model_args=["--runner", "pooling"],
|
tp_size=1,
|
||||||
# pp_size=1,
|
attn_backend="FLASH_ATTN",
|
||||||
# tp_size=1,
|
method="encode",
|
||||||
# attn_backend="XFORMERS",
|
fullgraph=True,
|
||||||
# method="encode",
|
),
|
||||||
# fullgraph=True,
|
|
||||||
# ),
|
|
||||||
# vision language model
|
# vision language model
|
||||||
TestSetting(
|
TestSetting(
|
||||||
model="microsoft/Phi-3.5-vision-instruct",
|
model="microsoft/Phi-3.5-vision-instruct",
|
||||||
@ -92,7 +94,8 @@ class TestSetting:
|
|||||||
method="generate_with_image",
|
method="generate_with_image",
|
||||||
fullgraph=False,
|
fullgraph=False,
|
||||||
),
|
),
|
||||||
])
|
],
|
||||||
|
)
|
||||||
def test_compile_correctness(
|
def test_compile_correctness(
|
||||||
monkeypatch: pytest.MonkeyPatch,
|
monkeypatch: pytest.MonkeyPatch,
|
||||||
test_setting: TestSetting,
|
test_setting: TestSetting,
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user