Merged
Commits
73 commits
833e147
[WIP] use vLLM for vision language models
Datta0 Jul 6, 2025
bad1692
Streamline vision vllm settings
Datta0 Jul 7, 2025
985e81c
Merge remote-tracking branch 'origin/main' into vlm_fast_infer
Datta0 Jul 10, 2025
5883e13
WIP
Datta0 Jul 10, 2025
d23e378
WIP vLLM VLM
Datta0 Jul 10, 2025
beba3ae
Make individual dummy model for qwen 2.5vl, llama3.2,
Datta0 Jul 12, 2025
d124be6
fixup norm for vLLM
Datta0 Jul 13, 2025
7abcb47
rework vLLM for VLMs
Datta0 Jul 13, 2025
11e3ff0
Cleanup more stuff
Datta0 Jul 13, 2025
b043e73
Load up remaining modules from state dict
Datta0 Jul 14, 2025
125597e
use get_state_dict when possible
Datta0 Jul 14, 2025
500fc02
Fixup lm_head state dict fetch
Datta0 Jul 15, 2025
fab2ba0
add is_vision flag for differentiating VLMs
Datta0 Jul 15, 2025
9d0a7e2
add is_vision_model flag
Datta0 Jul 15, 2025
3a72f8f
Cleanup more stuff
Datta0 Jul 15, 2025
872127f
Cleanup vLLM extraction
Datta0 Jul 15, 2025
090df5d
Fixup device type
Datta0 Jul 15, 2025
c1b57fd
Cleanup more stuff
Datta0 Jul 15, 2025
27e8b18
revert vLLM mem usage calc changes
Datta0 Jul 15, 2025
60d3a9c
Populate config values properly for VLMs
Datta0 Jul 16, 2025
4b054b8
cleaner attribute copy and check mechanism
Datta0 Jul 17, 2025
e021682
Patch siglip empty init
Datta0 Jul 17, 2025
4e91e37
Merge remote-tracking branch 'origin/main' into vlm_fast_infer
Datta0 Jul 17, 2025
6d5f448
Make additional module loading memory efficient
Datta0 Jul 17, 2025
e720866
Let the mini models be really small
Datta0 Jul 17, 2025
544cf2e
Minor cleanup
Datta0 Jul 17, 2025
b466139
cleanup vllm_utils by moving out empty model creation
Datta0 Jul 18, 2025
b5e8d63
Gemma3 and CausalLM fixes
Datta0 Jul 18, 2025
e7e4279
Merge branch 'main' into vlm_fast_infer
Datta0 Jul 18, 2025
f4cc238
Merge remote-tracking branch 'origin/main' into vlm_fast_infer
Datta0 Jul 20, 2025
c230e6d
Merge remote-tracking branch 'origin/main' into vlm_fast_infer
Datta0 Jul 21, 2025
9838d9b
Respect vLLMs conditions of max_num_batch_tokens vs max_seq_len
Datta0 Jul 21, 2025
638bd10
Restrict mm per prompt and max batch tokens
Datta0 Jul 22, 2025
de91982
Improve config copy overs
Datta0 Jul 22, 2025
64f40f3
Falcon H1 training in fp16 is unstable with the mamba kernels. NaN's …
mmathew23 Jul 22, 2025
292f6f7
Fix torch compile issues (#213)
danielhanchen Jul 23, 2025
1064908
Small fix
danielhanchen Jul 23, 2025
8fa08ed
fixup norms for causallm
Datta0 Jul 24, 2025
1b493e8
Guard against args change
Datta0 Jul 25, 2025
8fd2e4d
dont mark as grpo hidden states as dynamic
Datta0 Jul 28, 2025
deb2e0a
Merge remote-tracking branch 'origin/main' into vlm_fast_infer
Datta0 Jul 29, 2025
34da39f
Refactor to make vision handling easier
Datta0 Aug 11, 2025
9a467f2
[WIP] fixup llama vision
Datta0 Aug 11, 2025
7d4db12
cleanup
Datta0 Aug 11, 2025
e0ebcc4
2/n mllama
Datta0 Aug 11, 2025
0de564f
fixup mllama additional layers
Datta0 Aug 12, 2025
bb6243f
Merge remote-tracking branch 'origin/main' into vlm_fast_infer
Datta0 Aug 18, 2025
fa47fdf
Fixup qwen qknorm
Datta0 Aug 18, 2025
c2da34a
Pad token check and state dict changes
Datta0 Aug 18, 2025
fa93268
Patch TF protobuf incompatability
Datta0 Aug 19, 2025
b71e4f5
Revert "Patch TF protobuf incompatability"
Datta0 Aug 19, 2025
af94f0c
Fixup patch_model_and_tokenizer for VLM
Datta0 Aug 19, 2025
e580d66
reset vllm state dict changes
Datta0 Aug 19, 2025
2c52a23
Merge remote-tracking branch 'origin/main' into vlm_fast_infer
Datta0 Aug 23, 2025
28aae16
Cleanup logs
Datta0 Aug 27, 2025
85b26f3
Fixup gemma3 local rope embedding
Datta0 Aug 29, 2025
540c3d4
Merge remote-tracking branch 'origin/main' into vlm_fast_infer
Datta0 Aug 30, 2025
c3d3ac9
Fix Qwen 2.5 VL gate_up_proj vLLM
Datta0 Aug 30, 2025
8c1034a
Wakeup before doing vLLM generate (#259)
Datta0 Sep 1, 2025
538ba0c
Merge remote-tracking branch 'origin/main' into vlm_fast_infer
Datta0 Sep 5, 2025
cca9e16
use logger instead of print. Add license header
Datta0 Sep 8, 2025
6cfb2c9
Increase gpu_emmory_utilisation if in standby
Datta0 Sep 8, 2025
e078cf0
User friendly error message for sleep model with expandable segments
Datta0 Sep 8, 2025
41c7d41
Fixup cumem init for older versions
Datta0 Sep 9, 2025
be75f93
Merge remote-tracking branch 'origin/main' into vlm_fast_infer
Datta0 Sep 9, 2025
19519f1
fixup qwen vl vision rope
Datta0 Sep 9, 2025
b0a1081
do not slice logits for grpo
Datta0 Sep 9, 2025
cfae834
undo changes to rl_replacements
Datta0 Sep 9, 2025
f55abbe
Fix: (temporary workaround) mem usage calcl for quantized VLMs
Datta0 Sep 10, 2025
f6ed07d
fixup comparison attributes
Datta0 Sep 16, 2025
2b67460
Merge remote-tracking branch 'origin' into vlm_fast_infer
Datta0 Sep 16, 2025
ae65c51
compare and copy dtype
Datta0 Sep 16, 2025
39bddeb
Copy buffers along with comparable attributes
Datta0 Sep 16, 2025
Increase gpu_emmory_utilisation if in standby
Datta0 committed Sep 8, 2025
commit 6cfb2c96b22ffd5422ce5d5c49d6cf7a6a84f794
3 changes: 3 additions & 0 deletions unsloth_zoo/vllm_utils.py
@@ -1335,6 +1335,9 @@ def load_vllm(
     assert(conservativeness >= 0.0 and conservativeness <= 1.0)
 
     unsloth_vllm_standby = unsloth_vllm_standby or (os.getenv("UNSLOTH_VLLM_STANDBY", "0") != "0")
+    if unsloth_vllm_standby and gpu_memory_utilization < 0.9:
+        gpu_memory_utilization = 0.9
+        logger.info("Unsloth: Standby mode is enabled. Increasing `gpu_memory_utilization` to 0.9.")
 
     if DEVICE_TYPE == "cuda":
         major_version, minor_version = torch.cuda.get_device_capability()
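
For context, the hunk above floors `gpu_memory_utilization` at 0.9 whenever standby mode is requested, either through the `unsloth_vllm_standby` argument or the `UNSLOTH_VLLM_STANDBY` environment variable. Below is a minimal standalone sketch of that logic; the helper name `resolve_gpu_memory_utilization` is hypothetical, and only the argument names, the environment variable, and the 0.9 floor come from the diff.

import os
import logging

logger = logging.getLogger("unsloth")

def resolve_gpu_memory_utilization(gpu_memory_utilization: float,
                                    unsloth_vllm_standby: bool = False) -> float:
    # Hypothetical helper mirroring the check added to load_vllm.
    # Standby can be requested via the argument or the env var.
    unsloth_vllm_standby = unsloth_vllm_standby or (os.getenv("UNSLOTH_VLLM_STANDBY", "0") != "0")
    if unsloth_vllm_standby and gpu_memory_utilization < 0.9:
        gpu_memory_utilization = 0.9
        logger.info("Unsloth: Standby mode is enabled. Increasing `gpu_memory_utilization` to 0.9.")
    return gpu_memory_utilization

# With UNSLOTH_VLLM_STANDBY=1 in the environment, a request for 0.6 becomes 0.9.
print(resolve_gpu_memory_utilization(0.6))

Presumably the higher floor is safe because standby (sleep) mode releases vLLM's GPU memory between generate calls (see the earlier "Wakeup before doing vLLM generate" commit), so a larger share of the device can be reserved for vLLM while it is active.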