From 4046466534b5a470009dc2db33f14a4d61773ae9 Mon Sep 17 00:00:00 2001 From: wassname <1103714+wassname@users.noreply.github.com> Date: Fri, 7 Mar 2025 08:18:58 +0800 Subject: [PATCH] env var to disable pinned memory --- vllm/platforms/interface.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/vllm/platforms/interface.py b/vllm/platforms/interface.py index e7e55e11..28f9165e 100644 --- a/vllm/platforms/interface.py +++ b/vllm/platforms/interface.py @@ -5,7 +5,7 @@ import platform import random from platform import uname from typing import TYPE_CHECKING, NamedTuple, Optional, Tuple, Union - +import os import numpy as np import torch @@ -299,6 +299,8 @@ class Platform: @classmethod def is_pin_memory_available(cls) -> bool: """Checks whether pin memory is available on the current platform.""" + if os.environ.get("VLLM_DISABLE_PIN_MEMORY", "0") == "1": + return False if in_wsl(): # Pinning memory in WSL is not supported. # https://docs.nvidia.com/cuda/wsl-user-guide/index.html#known-limitations-for-linux-cuda-applications