Merge pull request #1452 from fireicewolf/sd3-devel

Fix AttributeError: 'T5EncoderModel' object has no attribute 'text_model' when loading the T5 model on the GPU.
2026-04-08 22:35:09 +00:00 · 2024-08-15 21:12:19 +09:00
parent 7db4222119 9760d097b0
commit e2d822cad7
1 changed files with 6 additions and 2 deletions
--- a/train_network.py
+++ b/train_network.py
@@ -543,9 +543,13 @@ class NetworkTrainer:
            # in case of cpu, dtype is already set to fp32 because cpu does not support fp8/fp16/bf16
            if t_enc.device.type != "cpu":
                t_enc.to(dtype=te_weight_dtype)
-                if hasattr(t_enc.text_model, "embeddings"):
+                if hasattr(t_enc, "text_model") and hasattr(t_enc.text_model, "embeddings"):
                    # nn.Embedding not support FP8
-                    t_enc.text_model.embeddings.to(dtype=(weight_dtype if te_weight_dtype != weight_dtype else te_weight_dtype))
+                    t_enc.text_model.embeddings.to(
+                        dtype=(weight_dtype if te_weight_dtype != weight_dtype else te_weight_dtype))
+                elif hasattr(t_enc, "encoder") and hasattr(t_enc.encoder, "embeddings"):
+                    t_enc.encoder.embeddings.to(
+                        dtype=(weight_dtype if te_weight_dtype != weight_dtype else te_weight_dtype))
        # acceleratorがなんかよろしくやってくれるらしい / accelerator will do something good
        if args.deepspeed: