From cc85388d79036dd2b68559a0f1c07a223e1bddbb Mon Sep 17 00:00:00 2001 From: Artiprocher Date: Wed, 19 Nov 2025 14:37:05 +0800 Subject: [PATCH] bugfix --- examples/test/run.py | 6 +++--- examples/wanvideo/model_training/full/Wan2.2-S2V-14B.sh | 1 - examples/wanvideo/model_training/lora/Wan2.2-S2V-14B.sh | 1 - 3 files changed, 3 insertions(+), 5 deletions(-) diff --git a/examples/test/run.py b/examples/test/run.py index f140d6e..6e5934b 100644 --- a/examples/test/run.py +++ b/examples/test/run.py @@ -37,14 +37,14 @@ def run_tasks_on_single_GPU(script_path, gpu_id, num_gpu): def run_train_multi_GPU(script_path): output_path = os.path.join("data", script_path) - for script in os.listdir(script_path): + for script in os.listdir(script_path)[::-1]: if not script.endswith(".sh"): continue source_path = os.path.join(script_path, script) target_path = os.path.join(output_path, script) os.makedirs(target_path, exist_ok=True) cmd = f"bash {source_path} > {target_path}/log.txt 2>&1" - print(cmd) + print(cmd, flush=True) os.system(cmd) time.sleep(3*60) @@ -79,5 +79,5 @@ if __name__ == "__main__": # run_train_single_GPU("examples/wanvideo/model_training/validate_lora") # move_files("video_", "data/output/validate_lora") # run_train_multi_GPU("examples/wanvideo/model_training/full") - run_train_multi_GPU("examples/wanvideo/model_training/validate_full") + run_train_single_GPU("examples/wanvideo/model_training/validate_full") move_files("video_", "data/output/validate_full") diff --git a/examples/wanvideo/model_training/full/Wan2.2-S2V-14B.sh b/examples/wanvideo/model_training/full/Wan2.2-S2V-14B.sh index 3a9a871..fb4d18c 100644 --- a/examples/wanvideo/model_training/full/Wan2.2-S2V-14B.sh +++ b/examples/wanvideo/model_training/full/Wan2.2-S2V-14B.sh @@ -7,7 +7,6 @@ accelerate launch --config_file examples/wanvideo/model_training/full/accelerate --num_frames 81 \ --dataset_repeat 100 \ --model_id_with_origin_paths "Wan-AI/Wan2.2-S2V-14B:diffusion_pytorch_model*.safetensors,Wan-AI/Wan2.2-S2V-14B:wav2vec2-large-xlsr-53-english/model.safetensors,Wan-AI/Wan2.2-S2V-14B:models_t5_umt5-xxl-enc-bf16.pth,Wan-AI/Wan2.2-S2V-14B:Wan2.1_VAE.pth" \ - --audio_processor_config "Wan-AI/Wan2.2-S2V-14B:wav2vec2-large-xlsr-53-english/" \ --learning_rate 1e-5 \ --num_epochs 1 \ --trainable_models "dit" \ diff --git a/examples/wanvideo/model_training/lora/Wan2.2-S2V-14B.sh b/examples/wanvideo/model_training/lora/Wan2.2-S2V-14B.sh index 84723ec..3865965 100644 --- a/examples/wanvideo/model_training/lora/Wan2.2-S2V-14B.sh +++ b/examples/wanvideo/model_training/lora/Wan2.2-S2V-14B.sh @@ -7,7 +7,6 @@ accelerate launch --config_file examples/wanvideo/model_training/full/accelerate --num_frames 81 \ --dataset_repeat 100 \ --model_id_with_origin_paths "Wan-AI/Wan2.2-S2V-14B:diffusion_pytorch_model*.safetensors,Wan-AI/Wan2.2-S2V-14B:wav2vec2-large-xlsr-53-english/model.safetensors,Wan-AI/Wan2.2-S2V-14B:models_t5_umt5-xxl-enc-bf16.pth,Wan-AI/Wan2.2-S2V-14B:Wan2.1_VAE.pth" \ - --audio_processor_config "Wan-AI/Wan2.2-S2V-14B:wav2vec2-large-xlsr-53-english/" \ --learning_rate 1e-4 \ --num_epochs 5 \ --remove_prefix_in_ckpt "pipe.dit." \