mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-09 12:22:19 +08:00
[CI/Build] Temporary fix to LM Eval Small Models (#28324)
Signed-off-by: zhewenli <zhewenli@meta.com>
This commit is contained in:
parent
4a8d6bd168
commit
a65a934ebe
@ -3,3 +3,6 @@ accuracy_threshold: 0.45
|
|||||||
num_questions: 1319
|
num_questions: 1319
|
||||||
num_fewshot: 5
|
num_fewshot: 5
|
||||||
max_model_len: 4096
|
max_model_len: 4096
|
||||||
|
# Dual stream is incompatible with this model: https://github.com/vllm-project/vllm/issues/28220
|
||||||
|
env:
|
||||||
|
VLLM_DISABLE_SHARED_EXPERTS_STREAM: "1"
|
||||||
|
|||||||
@ -62,9 +62,11 @@ def test_gsm8k_correctness_param(config_filename, tp_size):
|
|||||||
str(tp_size),
|
str(tp_size),
|
||||||
]
|
]
|
||||||
|
|
||||||
|
env_dict = eval_config.get("env", None)
|
||||||
|
|
||||||
# Launch server and run evaluation
|
# Launch server and run evaluation
|
||||||
with RemoteOpenAIServer(
|
with RemoteOpenAIServer(
|
||||||
eval_config["model_name"], server_args, max_wait_seconds=480
|
eval_config["model_name"], server_args, env_dict=env_dict, max_wait_seconds=480
|
||||||
) as remote_server:
|
) as remote_server:
|
||||||
server_url = remote_server.url_for("v1")
|
server_url = remote_server.url_for("v1")
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user