add examples

2026-03-24 10:18:12 +00:00 · 2026-02-05 17:17:10 +08:00
parent 1635897516
commit 27b1fe240b
3 changed files with 63 additions and 3 deletions
--- a/README.md
+++ b/README.md
@@ -766,9 +766,9 @@ DiffSynth-Studio is not just an engineered model framework, but also an incubato
 - Paper: [Spectral Evolution Search: Efficient Inference-Time Scaling for Reward-Aligned Image Generation
 ](https://arxiv.org/abs/2602.03208)
- Sample Code: []()
+- Sample Code: coming soon
-|FLUX|FLUX + SES|Qwen-Image|Qwen-Image + SES|
+|FLUX.1-dev|FLUX.1-dev + SES|Qwen-Image|Qwen-Image + SES|
 |-|-|-|-|
 |![Image](https://github.com/user-attachments/assets/5be15dc6-2805-4822-b04c-2573fc0f45f0)|![Image](https://github.com/user-attachments/assets/e71b8c20-1629-41d9-b0ff-185805c1da4e)|![Image](https://github.com/user-attachments/assets/7a73c968-133a-4545-9aa2-205533861cd4)|![Image](https://github.com/user-attachments/assets/c8390b22-14fe-48a0-a6e6-d6556d31235e)|
--- a/README_zh.md
+++ b/README_zh.md
@@ -766,7 +766,7 @@ DiffSynth-Studio 不仅仅是一个工程化的模型框架，更是创新成果
 - 论文：[Spectral Evolution Search: Efficient Inference-Time Scaling for Reward-Aligned Image Generation
 ](https://arxiv.org/abs/2602.03208)
- 代码样例：[]()
+- 代码样例：coming soon
 |FLUX.1-dev|FLUX.1-dev + SES|Qwen-Image|Qwen-Image + SES|
 |-|-|-|-|
@@ -774,6 +774,7 @@ DiffSynth-Studio 不仅仅是一个工程化的模型框架，更是创新成果
 </details>
 <details>
 <summary>VIRAL：基于DiT模型的类比视觉上下文推理</summary>
@@ -789,6 +790,7 @@ DiffSynth-Studio 不仅仅是一个工程化的模型框架，更是创新成果
 </details>
 <details>
 <summary>AttriCtrl: 图像生成模型的属性强度控制</summary>
--- a/examples/qwen_image/model_inference_low_vram/Qwen-Image-Edit-2511-ICEdit.py
+++ b/examples/qwen_image/model_inference_low_vram/Qwen-Image-Edit-2511-ICEdit.py
@@ -0,0 +1,58 @@
 from diffsynth.pipelines.qwen_image import QwenImagePipeline, ModelConfig
 from modelscope import snapshot_download
 from PIL import Image
 import torch
 # Example script: run Qwen-Image-Edit-2511 with the ICEdit LoRA using the
 # low-VRAM offload settings below. Three reference images are passed to the
 # pipeline together with a text instruction, and the result is saved to
 # "image.png".

 # Repository that hosts both the LoRA weights and the demo assets.
 LORA_REPO = "DiffSynth-Studio/Qwen-Image-Edit-2511-ICEdit-LoRA"

 # ---------------------------------------------------------------- models ----
 # Offload settings forwarded verbatim to every ModelConfig of the pipeline.
 # NOTE(review): presumably weights rest on disk, are staged on CPU in FP8 and
 # are computed on the GPU in bfloat16 -- confirm against the DiffSynth docs.
 offload_settings = dict(
     offload_dtype="disk",
     offload_device="disk",
     onload_dtype=torch.float8_e4m3fn,
     onload_device="cpu",
     preparing_dtype=torch.float8_e4m3fn,
     preparing_device="cuda",
     computation_dtype=torch.bfloat16,
     computation_device="cuda",
 )

 # (model_id, origin_file_pattern) for the transformer, text encoder and VAE,
 # in that order.
 component_sources = (
     ("Qwen/Qwen-Image-Edit-2511", "transformer/diffusion_pytorch_model*.safetensors"),
     ("Qwen/Qwen-Image", "text_encoder/model*.safetensors"),
     ("Qwen/Qwen-Image", "vae/diffusion_pytorch_model.safetensors"),
 )
 component_configs = [
     ModelConfig(model_id=repo, origin_file_pattern=pattern, **offload_settings)
     for repo, pattern in component_sources
 ]
 processor = ModelConfig(
     model_id="Qwen/Qwen-Image-Edit",
     origin_file_pattern="processor/",
 )

 pipe = QwenImagePipeline.from_pretrained(
     torch_dtype=torch.bfloat16,
     device="cuda",
     model_configs=component_configs,
     processor_config=processor,
 )

 # Attach the ICEdit LoRA to the pipeline's DiT.
 icedit_lora = ModelConfig(model_id=LORA_REPO, origin_file_pattern="model.safetensors")
 pipe.load_lora(pipe.dit, icedit_lora)

 # ---------------------------------------------------------------- inputs ----
 # Fetch only the demo assets of the LoRA repository into ./data.
 snapshot_download(LORA_REPO, local_dir="./data", allow_file_pattern="assets/*")

 # The list order matters: the prompt refers to the images as 1, 2 and 3.
 reference_paths = (
     "data/assets/image1_original.png",
     "data/assets/image1_edit_1.png",
     "data/assets/image2_original.png",
 )
 reference_images = [Image.open(path) for path in reference_paths]

 instruction = "Edit image 3 based on the transformation from image 1 to image 2."
 avoid = "泛黄，AI感，不真实，丑陋，油腻的皮肤，异常的肢体，不协调的肢体"

 # -------------------------------------------------------------- generate ----
 generation_args = dict(
     prompt=instruction,
     negative_prompt=avoid,
     edit_image=reference_images,
     seed=1,
     num_inference_steps=50,
     height=1280,
     width=720,
     zero_cond_t=True,
 )
 edited = pipe(**generation_args)
 edited.save("image.png")