Mirror of https://git.datalinker.icu/vllm-project/vllm.git (synced 2026-06-14 00:07:22 +08:00)
[CI/Build][AMD] Use float16 in test_reset_prefix_cache_e2e to avoid accuracy issues (#29997)
Signed-off-by: Randall Smith <ransmith@amd.com>
Co-authored-by: Randall Smith <ransmith@amd.com>
This commit is contained in:
parent 6038b1b04b
commit feecba09af
@@ -21,6 +21,7 @@ def test_reset_prefix_cache_e2e(monkeypatch):
         max_num_batched_tokens=32,
         max_model_len=2048,
         compilation_config={"mode": 0},
+        dtype="float16",
     )
     engine = LLMEngine.from_engine_args(engine_args)
     sampling_params = SamplingParams(
Loading…
x
Reference in New Issue
Block a user