feat: block swap for inference and initial impl for HunyuanImage LoRA (not working)

2026-04-17 17:24:21 +00:00 · 2025-09-11 22:15:22 +09:00
parent 5149be5a87
commit 7f983c558d
16 changed files with 1363 additions and 1303 deletions
--- a/library/device_utils.py
+++ b/library/device_utils.py
@@ -2,6 +2,7 @@ import functools
 import gc

 import torch
+
 try:
    # intel gpu support for pytorch older than 2.5
    # ipex is not needed after pytorch 2.5
@@ -51,6 +52,15 @@ def clean_memory_on_device(device: torch.device):
        torch.mps.empty_cache()


+def synchronize_device(device: torch.device):  # wait for pending work on `device`; other device types are a no-op
+    if device.type == "cuda":
+        torch.cuda.synchronize(device)  # pass the device: the no-arg form only syncs the *current* CUDA device
+    elif device.type == "xpu":
+        torch.xpu.synchronize(device)  # same as CUDA: target the given XPU, not the current one
+    elif device.type == "mps":
+        torch.mps.synchronize()  # the MPS API takes no device argument
+
+
@functools.lru_cache(maxsize=None)
 def get_preferred_device() -> torch.device:
    r"""