diff --git a/requirements/rocm.txt b/requirements/rocm.txt index 6f1cca90e5e2b..abbd33d6e1240 100644 --- a/requirements/rocm.txt +++ b/requirements/rocm.txt @@ -15,3 +15,4 @@ setuptools-scm>=8 runai-model-streamer[s3,gcs]==0.15.0 conch-triton-kernels==1.2.1 timm>=1.0.17 +fastsafetensors @ git+https://github.com/foundation-model-stack/fastsafetensors.git@d6f998a03432b2452f8de2bb5cefb5af9795d459 diff --git a/tests/model_executor/model_loader/fastsafetensors_loader/test_fastsafetensors_loader.py b/tests/model_executor/model_loader/fastsafetensors_loader/test_fastsafetensors_loader.py index f154df6dfc232..c5b3c731ffc64 100644 --- a/tests/model_executor/model_loader/fastsafetensors_loader/test_fastsafetensors_loader.py +++ b/tests/model_executor/model_loader/fastsafetensors_loader/test_fastsafetensors_loader.py @@ -19,7 +19,8 @@ sampling_params = SamplingParams(temperature=0.8, top_p=0.95, seed=0) @pytest.mark.skipif( - not current_platform.is_cuda(), reason="fastsafetensors requires CUDA/NVIDIA GPUs" + not current_platform.is_cuda_alike(), + reason="fastsafetensors requires NVIDIA/AMD GPUs", ) def test_model_loader_download_files(vllm_runner): with vllm_runner(test_model, load_format="fastsafetensors") as llm: diff --git a/tests/model_executor/model_loader/fastsafetensors_loader/test_weight_utils.py b/tests/model_executor/model_loader/fastsafetensors_loader/test_weight_utils.py index bd216f0e41a47..1975eb61b25da 100644 --- a/tests/model_executor/model_loader/fastsafetensors_loader/test_weight_utils.py +++ b/tests/model_executor/model_loader/fastsafetensors_loader/test_weight_utils.py @@ -17,7 +17,8 @@ from vllm.platforms import current_platform @pytest.mark.skipif( - not current_platform.is_cuda(), reason="fastsafetensors requires CUDA/NVIDIA GPUs" + not current_platform.is_cuda_alike(), + reason="fastsafetensors requires NVIDIA/AMD GPUs", ) def test_fastsafetensors_model_loader(): with tempfile.TemporaryDirectory() as tmpdir: