mirror of
https://github.com/modelscope/DiffSynth-Studio.git
synced 2026-03-21 16:18:13 +00:00
refine code
This commit is contained in:
@@ -1,58 +1,45 @@
|
||||
import torch
|
||||
from diffsynth import ModelManager, FluxImagePipeline, download_customized_models, FluxImageLoraPipeline
|
||||
from diffsynth import ModelManager, FluxImagePipeline, download_customized_models
|
||||
from modelscope import dataset_snapshot_download
|
||||
from examples.EntityControl.utils import visualize_masks
|
||||
import os
|
||||
import json
|
||||
from PIL import Image
|
||||
import requests
|
||||
from io import BytesIO
|
||||
import torch
|
||||
|
||||
# download and load model
|
||||
lora_path = download_customized_models(
|
||||
model_id="DiffSynth-Studio/Eligen",
|
||||
origin_file_path="model_bf16.safetensors",
|
||||
local_dir="models/lora/entity_control"
|
||||
)[0]
|
||||
model_manager = ModelManager(torch_dtype=torch.bfloat16, device="cuda", model_id_list=["FLUX.1-dev"])
|
||||
model_manager.load_lora(lora_path, lora_alpha=1.)
|
||||
model_manager.load_lora(
|
||||
download_customized_models(
|
||||
model_id="DiffSynth-Studio/Eligen",
|
||||
origin_file_path="model_bf16.safetensors",
|
||||
local_dir="models/lora/entity_control"
|
||||
),
|
||||
lora_alpha=1
|
||||
)
|
||||
pipe = FluxImagePipeline.from_model_manager(model_manager)
|
||||
|
||||
# prepare inputs
|
||||
image_shape = 1024
|
||||
seed = 0
|
||||
# set True to apply regional attention in negative prompt prediction for better results with more time
|
||||
use_seperated_negtive_prompt = False
|
||||
mask_urls = [
|
||||
'https://github.com/user-attachments/assets/0cf78663-5314-4280-a065-31ded7a24a46',
|
||||
'https://github.com/user-attachments/assets/bd3938b8-72a8-4d56-814f-f6445971b91d'
|
||||
]
|
||||
# prepare entity masks, entity prompts, global prompt and negative prompt
|
||||
masks = []
|
||||
for url in mask_urls:
|
||||
response = requests.get(url)
|
||||
mask = Image.open(BytesIO(response.content)).resize((image_shape, image_shape), resample=Image.NEAREST)
|
||||
masks.append(mask)
|
||||
# download and load mask images
|
||||
dataset_snapshot_download(dataset_id="DiffSynth-Studio/examples_in_diffsynth", local_dir="./", allow_file_pattern="data/examples/eligen/inpaint*")
|
||||
masks = [Image.open(f"./data/examples/eligen/inpaint_mask_{i}.png") for i in range(1, 3)]
|
||||
input_image = Image.open("./data/examples/eligen/inpaint_image.jpg")
|
||||
|
||||
entity_prompts = ["A person wear red shirt", "Airplane"]
|
||||
global_prompt = "A person walking on the path in front of a house; An airplane in the sky"
|
||||
negative_prompt = "worst quality, low quality, monochrome, zombie, interlocked fingers, Aissist, cleavage, nsfw, blur"
|
||||
|
||||
response = requests.get('https://github.com/user-attachments/assets/fa4d6ba5-08fd-4fc7-adbb-19898d839364')
|
||||
inpaint_input = Image.open(BytesIO(response.content)).convert('RGB').resize((image_shape, image_shape))
|
||||
|
||||
# generate image
|
||||
torch.manual_seed(seed)
|
||||
image = pipe(
|
||||
prompt=global_prompt,
|
||||
input_image=input_image,
|
||||
cfg_scale=3.0,
|
||||
negative_prompt=negative_prompt,
|
||||
num_inference_steps=50,
|
||||
embedded_guidance=3.5,
|
||||
height=image_shape,
|
||||
width=image_shape,
|
||||
entity_prompts=entity_prompts,
|
||||
entity_masks=masks,
|
||||
inpaint_input=inpaint_input,
|
||||
use_seperated_negtive_prompt=use_seperated_negtive_prompt,
|
||||
seed=0,
|
||||
height=1024,
|
||||
width=1024,
|
||||
eligen_entity_prompts=entity_prompts,
|
||||
eligen_entity_masks=masks,
|
||||
enable_eligen_on_negative=False,
|
||||
enable_eligen_inpaint=True,
|
||||
)
|
||||
image.save(f"entity_inpaint.png")
|
||||
visualize_masks(image, masks, entity_prompts, f"entity_inpaint_with_mask.png")
|
||||
visualize_masks(image, masks, entity_prompts, f"entity_inpaint_with_mask.png")
|
||||
|
||||
Reference in New Issue
Block a user