Fix gradient accumulation not working

This commit is contained in:
Kohya S
2023-07-12 21:35:57 +09:00
parent 814996b14f
commit 3c67e595b8

View File

@@ -362,8 +362,7 @@ def train(args):
     loss_total = 0
     for step, batch in enumerate(train_dataloader):
         current_step.value = global_step
-        # with accelerator.accumulate(training_models[0]):  # 複数モデルに対応していない模様だがとりあえずこうしておく
-        if True:
+        with accelerator.accumulate(training_models[0]):  # 複数モデルに対応していない模様だがとりあえずこうしておく
             if "latents" in batch and batch["latents"] is not None:
                 latents = batch["latents"].to(accelerator.device).to(dtype=weight_dtype)
             else: