fix:flux

2026-03-24 10:18:12 +00:00 · 2025-11-18 20:37:14 +08:00
parent 7b756a518e
commit 3f9e9cad9d
1 changed files with 10 additions and 90 deletions
--- a/diffsynth/pipelines/flux_image.py
+++ b/diffsynth/pipelines/flux_image.py
@@ -106,41 +106,7 @@ class FluxImagePipeline(BasePipeline):
    def enable_lora_magic(self):
        pass
-    # def load_lora(self, model, lora_config, alpha=1, hotload=False):
+    def load_lora(self, model, lora_config, alpha=1, hotload=False):
    #     if isinstance(lora_config, str):
    #         path = lora_config
    #     else:
    #         lora_config.download_if_necessary()
    #         path = lora_config.path
    #     state_dict = load_state_dict(path, torch_dtype=self.torch_dtype, device="cpu")
    #     loader = self.lora_loader(torch_dtype=self.torch_dtype, device=self.device)
    #     state_dict = loader.convert_state_dict(state_dict)
    #     loaded_count = 0
    #     for key in tqdm(state_dict, desc="Applying LoRA"):
    #         if ".lora_A." in key:
    #             layer_name = key.split(".lora_A.")[0]
    #             module = model
    #             try:
    #                 parts = layer_name.split(".")
    #                 for part in parts:
    #                     if part.isdigit():
    #                         module = module[int(part)]
    #                     else:
    #                         module = getattr(module, part)
    #             except AttributeError:
    #                 continue
    #             w_a = state_dict[key].to(device=module.weight.device, dtype=module.weight.dtype)
    #             w_b_key = key.replace("lora_A", "lora_B")
    #             if w_b_key not in state_dict: continue
    #             w_b = state_dict[w_b_key].to(device=module.weight.device, dtype=module.weight.dtype)
    #             delta_w = torch.mm(w_b, w_a)
    #             module.weight.data += delta_w * alpha
    #             loaded_count += 1
    def load_lora(self, model, lora_config, alpha=1.0, hotload=False):
        if isinstance(lora_config, str):
            path = lora_config
        else:
@@ -150,74 +116,28 @@ class FluxImagePipeline(BasePipeline):
        state_dict = load_state_dict(path, torch_dtype=self.torch_dtype, device="cpu")
        loader = self.lora_loader(torch_dtype=self.torch_dtype, device=self.device)
        state_dict = loader.convert_state_dict(state_dict)
        print(f"Merging LoRA weights from {path}...")
        loaded_count = 0
        # [新增] 键名映射表，处理 FW2 Loader 与 DiT 模型名称不一致的情况
        # 针对 Single Blocks 常见的命名差异进行修正
        key_mapping = {
            ".linear1.": ".to_qkv_mlp.",     # 常见差异点 1
            ".linear2.": ".proj_out.",       # 常见差异点 2
            ".modulation.lin.": ".norm.linear." # 常见差异点 3
        }
        for key in tqdm(state_dict, desc="Applying LoRA"):
            if ".lora_A." in key:
                layer_name = key.split(".lora_A.")[0]
                # [新增] 尝试应用键名修正
                target_layer_name = layer_name
                for src, dst in key_mapping.items():
                    if src in target_layer_name:
                        target_layer_name = target_layer_name.replace(src, dst)
                # 在模型中查找层
                module = model
                try:
-                    parts = target_layer_name.split(".")
+                    parts = layer_name.split(".")
                    for part in parts:
                        if part.isdigit():
                            module = module[int(part)]
                        else:
                            module = getattr(module, part)
                except AttributeError:
                    # 如果修正后还是找不到，尝试原始名称（作为保底）
                    try:
                        module = model
                        parts = layer_name.split(".")
                        for part in parts:
                            if part.isdigit():
                                module = module[int(part)]
                            else:
                                module = getattr(module, part)
                    except AttributeError:
                        # 确实找不到，跳过并打印警告(可选)
                        # print(f"Warning: Could not find layer for {layer_name}")
                        continue 
                # 获取 LoRA 参数并计算增量
                try:
                    w_a = state_dict[key].to(device=module.weight.device, dtype=module.weight.dtype)
                    w_b_key = key.replace("lora_A", "lora_B")
                    if w_b_key not in state_dict: continue
                    w_b = state_dict[w_b_key].to(device=module.weight.device, dtype=module.weight.dtype)
                    # 检查形状是否匹配 (非常重要，防止 broadcasting 错误掩盖问题)
                    # Linear weight: (out, in). B@A: (out, in)
                    delta_w = torch.mm(w_b, w_a)
                    if delta_w.shape != module.weight.shape:
                        # 形状不匹配通常意味着 QKV 融合/分离状态不一致
                        # 简单跳过或尝试转置（视具体情况，这里保守跳过）
                        continue
                    module.weight.data += delta_w * alpha
                    loaded_count += 1
                except Exception as e:
                    continue
-        print(f"Applied LoRA to {loaded_count} layers.")
+                w_a = state_dict[key].to(device=module.weight.device, dtype=module.weight.dtype)
-
+                w_b_key = key.replace("lora_A", "lora_B")
                if w_b_key not in state_dict: continue
                w_b = state_dict[w_b_key].to(device=module.weight.device, dtype=module.weight.dtype)
                delta_w = torch.mm(w_b, w_a)
                module.weight.data += delta_w * alpha
                loaded_count += 1
    @staticmethod
    def from_pretrained(
        torch_dtype: torch.dtype = torch.bfloat16,