style

2026-04-24 15:06:17 +00:00 · 2026-04-23 17:31:34 +08:00
parent 394db06d86
commit a80fb84220
14 changed files with 99 additions and 243 deletions
--- a/diffsynth/utils/state_dict_converters/ace_step_conditioner.py
+++ b/diffsynth/utils/state_dict_converters/ace_step_conditioner.py
@@ -1,38 +1,4 @@
-"""
-State dict converter for ACE-Step Conditioner model.
-
-The original checkpoint stores all model weights in a single file
-(nested in AceStepConditionGenerationModel). The Conditioner weights are
-prefixed with 'encoder.'.
-
-This converter extracts only keys starting with 'encoder.' and strips
-the prefix to match the standalone AceStepConditionEncoder in DiffSynth.
-"""
-
-
-def ace_step_conditioner_converter(state_dict):
-    """
-    Convert ACE-Step Conditioner checkpoint keys to DiffSynth format.
-
-    参数 state_dict 是 DiskMap 类型。
-    遍历时，key 是 key 名，state_dict[key] 获取实际值。
-
-    Original checkpoint contains all model weights under prefixes:
-    - decoder.* (DiT)
-    - encoder.* (Conditioner)
-    - tokenizer.* (Audio Tokenizer)
-    - detokenizer.* (Audio Detokenizer)
-    - null_condition_emb (CFG null embedding)
-
-    This extracts only 'encoder.' keys and strips the prefix.
-
-    Example mapping:
-        encoder.lyric_encoder.layers.0.self_attn.q_proj.weight -> lyric_encoder.layers.0.self_attn.q_proj.weight
-        encoder.attention_pooler.layers.0.self_attn.q_proj.weight -> attention_pooler.layers.0.self_attn.q_proj.weight
-        encoder.timbre_encoder.layers.0.self_attn.q_proj.weight -> timbre_encoder.layers.0.self_attn.q_proj.weight
-        encoder.audio_tokenizer.audio_acoustic_proj.weight -> audio_tokenizer.audio_acoustic_proj.weight
-        encoder.detokenizer.layers.0.self_attn.q_proj.weight -> detokenizer.layers.0.self_attn.q_proj.weight
-    """
+def AceStepConditionEncoderStateDictConverter(state_dict):
    new_state_dict = {}
    prefix = "encoder."

@@ -41,7 +7,6 @@ def ace_step_conditioner_converter(state_dict):
            new_key = key[len(prefix):]
            new_state_dict[new_key] = state_dict[key]

-    # Extract null_condition_emb from top level (used for CFG negative condition)
    if "null_condition_emb" in state_dict:
        new_state_dict["null_condition_emb"] = state_dict["null_condition_emb"]