Added support for caching text embeddings. This is just initial support and will probably fail for some models. Still needs to be optimized

This commit is contained in:
Jaret Burkett
2025-08-07 10:27:55 -06:00
parent 4c4a10d439
commit bb6db3d635
16 changed files with 485 additions and 195 deletions

View File

@@ -168,7 +168,9 @@ class QwenImageModel(BaseModel):
text_encoder = [pipe.text_encoder]
tokenizer = [pipe.tokenizer]
pipe.transformer = pipe.transformer.to(self.device_torch)
# leave it on cpu for now
if not self.low_vram:
pipe.transformer = pipe.transformer.to(self.device_torch)
flush()
# just to make sure everything is on the right device and dtype
@@ -210,6 +212,7 @@ class QwenImageModel(BaseModel):
generator: torch.Generator,
extra: dict,
):
self.model.to(self.device_torch, dtype=self.torch_dtype)
control_img = None
if gen_config.ctrl_img is not None:
raise NotImplementedError(