mirror of
https://github.com/modelscope/DiffSynth-Studio.git
synced 2026-03-22 00:38:11 +00:00
Add: FLUX
This commit is contained in:
@@ -5,34 +5,21 @@ import torch
|
||||
|
||||
class SiglipVisionModelSO400M(SiglipVisionModel):
    """SigLIP vision encoder with the SO400M configuration baked in.

    Convenience subclass: instead of requiring callers to load or pass a
    config, ``__init__`` constructs the fixed SO400M vision configuration
    (1152 hidden dim, 27 layers, 16 heads, 384px images, 14px patches)
    and hands it to the parent ``SiglipVisionModel``.
    """

    def __init__(self):
        # Fix: the original built the config twice — first via a dict splat
        # (``SiglipVisionConfig(**{...})``) and then immediately rebound
        # ``config`` with an equivalent keyword-argument construction,
        # leaving the first assignment as dead code. Keep only the live one.
        config = SiglipVisionConfig(
            hidden_size=1152,
            image_size=384,
            intermediate_size=4304,
            model_type="siglip_vision_model",
            num_attention_heads=16,
            num_hidden_layers=27,
            patch_size=14,
            # Metadata fields carried over from the released checkpoint's
            # config.json; they do not affect the architecture itself.
            architectures=["SiglipModel"],
            initializer_factor=1.0,
            torch_dtype="float32",
            transformers_version="4.37.0.dev0",
        )
        super().__init__(config)
|
||||
|
||||
|
||||
class MLPProjModel(torch.nn.Module):
|
||||
def __init__(self, cross_attention_dim=768, id_embeddings_dim=512, num_tokens=4):
|
||||
super().__init__()
|
||||
|
||||
Reference in New Issue
Block a user