mirror of
https://github.com/wassname/vllm.git
synced 2026-06-28 03:52:15 +08:00
c0292211ce
Signed-off-by: Wallas Santos <wallashss@ibm.com>
7 lines
175 B
Python
7 lines
175 B
Python
from ..utils import compare_two_settings
|
|
|
|
|
|
def test_cpu_offload():
    """Compare a default run against one started with ``--cpu-offload-gb 1``.

    Delegates the whole check to ``compare_two_settings``, passing the model
    name, an empty argument list for the first setting, and the CPU-offload
    flag for the second setting.
    """
    model_name = "meta-llama/Llama-3.2-1B"
    # First setting: no extra command-line arguments.
    baseline_args = []
    # Second setting: same model, with the CPU offload flag set to "1".
    offload_args = ["--cpu-offload-gb", "1"]
    compare_two_settings(model_name, baseline_args, offload_args)
|