Add VLLM_DISABLE_PIN_MEMORY env var to disable pinned memory (set to "1")

2026-06-27 16:17:48 +08:00 · 2025-03-07 08:18:58 +08:00
parent 0578e5a462
commit 4046466534
1 changed file with 3 additions and 1 deletion
@@ -5,7 +5,7 @@ import platform
 import random
 from platform import uname
 from typing import TYPE_CHECKING, NamedTuple, Optional, Tuple, Union
-
+import os
 import numpy as np
 import torch

@@ -299,6 +299,8 @@ class Platform:
    @classmethod
    def is_pin_memory_available(cls) -> bool:
        """Checks whether pin memory is available on the current platform."""
+        if os.environ.get("VLLM_DISABLE_PIN_MEMORY", "0") == "1":
+            return False
        if in_wsl():
            # Pinning memory in WSL is not supported.
            # https://docs.nvidia.com/cuda/wsl-user-guide/index.html#known-limitations-for-linux-cuda-applications