mm: Lower Windows pin threshold

Some workflows have more extraneous use of shared GPU memory than is accounted for in the 5% pin headroom. Lower the pinned-memory limits (0.45 -> 0.40 on Windows, 0.95 -> 0.90 otherwise) for safety.
2026-06-09 15:57:24 +08:00 · 2026-03-30 00:32:21 +10:00 · 2026-03-30 00:32:21 +10:00 · d188a67cf9
commit d188a67cf9
parent a500f1edac
1 changed files with 2 additions and 2 deletions
--- a/comfy/model_management.py
+++ b/comfy/model_management.py
@@ -1326,9 +1326,9 @@ MAX_PINNED_MEMORY = -1
 if not args.disable_pinned_memory:
    if is_nvidia() or is_amd():
        if WINDOWS:
-            MAX_PINNED_MEMORY = get_total_memory(torch.device("cpu")) * 0.45  # Windows limit is apparently 50%
+            MAX_PINNED_MEMORY = get_total_memory(torch.device("cpu")) * 0.40  # Windows limit is apparently 50%
        else:
-            MAX_PINNED_MEMORY = get_total_memory(torch.device("cpu")) * 0.95
+            MAX_PINNED_MEMORY = get_total_memory(torch.device("cpu")) * 0.90
        logging.info("Enabled pinned memory {}".format(MAX_PINNED_MEMORY // (1024 * 1024)))

 PINNING_ALLOWED_TYPES = set(["Tensor", "Parameter", "QuantizedTensor"])