This commit is contained in:
Artiprocher
2025-11-19 14:37:05 +08:00
parent 82378a2815
commit cc85388d79
3 changed files with 3 additions and 5 deletions

View File

@@ -37,14 +37,14 @@ def run_tasks_on_single_GPU(script_path, gpu_id, num_gpu):
def run_train_multi_GPU(script_path):
output_path = os.path.join("data", script_path)
for script in os.listdir(script_path):
for script in os.listdir(script_path)[::-1]:
if not script.endswith(".sh"):
continue
source_path = os.path.join(script_path, script)
target_path = os.path.join(output_path, script)
os.makedirs(target_path, exist_ok=True)
cmd = f"bash {source_path} > {target_path}/log.txt 2>&1"
print(cmd)
print(cmd, flush=True)
os.system(cmd)
time.sleep(3*60)
@@ -79,5 +79,5 @@ if __name__ == "__main__":
# run_train_single_GPU("examples/wanvideo/model_training/validate_lora")
# move_files("video_", "data/output/validate_lora")
# run_train_multi_GPU("examples/wanvideo/model_training/full")
run_train_multi_GPU("examples/wanvideo/model_training/validate_full")
run_train_single_GPU("examples/wanvideo/model_training/validate_full")
move_files("video_", "data/output/validate_full")

View File

@@ -7,7 +7,6 @@ accelerate launch --config_file examples/wanvideo/model_training/full/accelerate
--num_frames 81 \
--dataset_repeat 100 \
--model_id_with_origin_paths "Wan-AI/Wan2.2-S2V-14B:diffusion_pytorch_model*.safetensors,Wan-AI/Wan2.2-S2V-14B:wav2vec2-large-xlsr-53-english/model.safetensors,Wan-AI/Wan2.2-S2V-14B:models_t5_umt5-xxl-enc-bf16.pth,Wan-AI/Wan2.2-S2V-14B:Wan2.1_VAE.pth" \
--audio_processor_config "Wan-AI/Wan2.2-S2V-14B:wav2vec2-large-xlsr-53-english/" \
--learning_rate 1e-5 \
--num_epochs 1 \
--trainable_models "dit" \

View File

@@ -7,7 +7,6 @@ accelerate launch --config_file examples/wanvideo/model_training/full/accelerate
--num_frames 81 \
--dataset_repeat 100 \
--model_id_with_origin_paths "Wan-AI/Wan2.2-S2V-14B:diffusion_pytorch_model*.safetensors,Wan-AI/Wan2.2-S2V-14B:wav2vec2-large-xlsr-53-english/model.safetensors,Wan-AI/Wan2.2-S2V-14B:models_t5_umt5-xxl-enc-bf16.pth,Wan-AI/Wan2.2-S2V-14B:Wan2.1_VAE.pth" \
--audio_processor_config "Wan-AI/Wan2.2-S2V-14B:wav2vec2-large-xlsr-53-english/" \
--learning_rate 1e-4 \
--num_epochs 5 \
--remove_prefix_in_ckpt "pipe.dit." \