Merge branch 'dev' into dev_device_support

2026-04-08 22:35:09 +00:00 · 2024-02-12 13:01:54 +09:00
parent e579648ce9 35c6053de3
commit 358ca205a3
62 changed files with 1387 additions and 993 deletions
--- a/sdxl_minimal_inference.py
+++ b/sdxl_minimal_inference.py
@@ -22,6 +22,10 @@ from safetensors.torch import load_file

 from library import model_util, sdxl_model_util
 import networks.lora as lora
+from library.utils import setup_logging
+setup_logging()
+import logging
+logger = logging.getLogger(__name__)

 # scheduler: このあたりの設定はSD1/2と同じでいいらしい
 # scheduler: The settings around here seem to be the same as SD1/2
@@ -139,7 +143,7 @@ if __name__ == "__main__":

    vae_dtype = DTYPE
    if DTYPE == torch.float16:
-        print("use float32 for vae")
+        logger.info("use float32 for vae")
        vae_dtype = torch.float32
    vae.to(DEVICE, dtype=vae_dtype)
    vae.eval()
@@ -186,7 +190,7 @@ if __name__ == "__main__":
            emb1 = get_timestep_embedding(torch.FloatTensor([original_height, original_width]).unsqueeze(0), 256)
            emb2 = get_timestep_embedding(torch.FloatTensor([crop_top, crop_left]).unsqueeze(0), 256)
            emb3 = get_timestep_embedding(torch.FloatTensor([target_height, target_width]).unsqueeze(0), 256)
-            # print("emb1", emb1.shape)
+            # logger.info("emb1 %s", emb1.shape)
            c_vector = torch.cat([emb1, emb2, emb3], dim=1).to(DEVICE, dtype=DTYPE)
            uc_vector = c_vector.clone().to(DEVICE, dtype=DTYPE)  # ちょっとここ正しいかどうかわからない I'm not sure if this is right

@@ -216,7 +220,7 @@ if __name__ == "__main__":

                enc_out = text_model2(tokens, output_hidden_states=True, return_dict=True)
                text_embedding2_penu = enc_out["hidden_states"][-2]
-                # print("hidden_states2", text_embedding2_penu.shape)
+                # logger.info("hidden_states2 %s", text_embedding2_penu.shape)
                text_embedding2_pool = enc_out["text_embeds"]   # do not support Textual Inversion

            # 連結して終了 concat and finish
@@ -225,7 +229,7 @@ if __name__ == "__main__":

        # cond
        c_ctx, c_ctx_pool = call_text_encoder(prompt, prompt2)
-        # print(c_ctx.shape, c_ctx_p.shape, c_vector.shape)
+        # logger.info("%s %s %s", c_ctx.shape, c_ctx_pool.shape, c_vector.shape)
        c_vector = torch.cat([c_ctx_pool, c_vector], dim=1)

        # uncond
@@ -322,4 +326,4 @@ if __name__ == "__main__":
                seed = int(seed)
            generate_image(prompt, prompt2, negative_prompt, seed)

-    print("Done!")
+    logger.info("Done!")