style

2026-04-24 06:46:13 +00:00 · 2026-04-23 17:31:34 +08:00
parent 394db06d86
commit a80fb84220
14 changed files with 99 additions and 243 deletions
--- a/diffsynth/utils/state_dict_converters/ace_step_dit.py
+++ b/diffsynth/utils/state_dict_converters/ace_step_dit.py
@@ -1,37 +1,4 @@
-"""
-State dict converter for ACE-Step DiT model.
-
-The original checkpoint stores all model weights in a single file
-(nested in AceStepConditionGenerationModel). The DiT weights are
-prefixed with 'decoder.'.
-
-This converter extracts only keys starting with 'decoder.' and strips
-the prefix to match the standalone AceStepDiTModel in DiffSynth.
-"""
-
-
-def ace_step_dit_converter(state_dict):
-    """
-    Convert ACE-Step DiT checkpoint keys to DiffSynth format.
-
-    参数 state_dict 是 DiskMap 类型。
-    遍历时，key 是 key 名，state_dict[key] 获取实际值。
-
-    Original checkpoint contains all model weights under prefixes:
-    - decoder.* (DiT)
-    - encoder.* (Conditioner)
-    - tokenizer.* (Audio Tokenizer)
-    - detokenizer.* (Audio Detokenizer)
-    - null_condition_emb (CFG null embedding)
-
-    This extracts only 'decoder.' keys and strips the prefix.
-
-    Example mapping:
-        decoder.layers.0.self_attn.q_proj.weight -> layers.0.self_attn.q_proj.weight
-        decoder.proj_in.0.linear_1.weight -> proj_in.0.linear_1.weight
-        decoder.time_embed.linear_1.weight -> time_embed.linear_1.weight
-        decoder.rotary_emb.inv_freq -> rotary_emb.inv_freq
-    """
+def AceStepDiTModelStateDictConverter(state_dict):
    new_state_dict = {}
    prefix = "decoder."