Merge pull request #293 from modelscope/dev

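HunyuanVideo quantization: note in the example scripts that torch_dtype=torch.float8_e4m3fn can be used to enable quantization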
2026-04-08 17:18:21 +00:00 · 2024-12-19 16:20:35 +08:00
parent aa23356420 0692e8b1e1
commit c06ea2271a
3 changed files with 3 additions and 3 deletions
--- a/examples/HunyuanVideo/hunyuanvideo_24G.py
+++ b/examples/HunyuanVideo/hunyuanvideo_24G.py
@@ -11,7 +11,7 @@ model_manager.load_models(
    [
        "models/HunyuanVideo/transformers/mp_rank_00_model_states.pt"
    ],
-    torch_dtype=torch.bfloat16,
+    torch_dtype=torch.bfloat16, # you can use torch_dtype=torch.float8_e4m3fn to enable quantization.
    device="cpu"
 )

--- a/examples/HunyuanVideo/hunyuanvideo_6G.py
+++ b/examples/HunyuanVideo/hunyuanvideo_6G.py
@@ -11,7 +11,7 @@ model_manager.load_models(
    [
        "models/HunyuanVideo/transformers/mp_rank_00_model_states.pt"
    ],
-    torch_dtype=torch.bfloat16,
+    torch_dtype=torch.bfloat16, # you can use torch_dtype=torch.float8_e4m3fn to enable quantization.
    device="cpu"
 )

--- a/examples/HunyuanVideo/hunyuanvideo_80G.py
+++ b/examples/HunyuanVideo/hunyuanvideo_80G.py
@@ -11,7 +11,7 @@ model_manager.load_models(
    [
        "models/HunyuanVideo/transformers/mp_rank_00_model_states.pt"
    ],
-    torch_dtype=torch.bfloat16,
+    torch_dtype=torch.bfloat16, # you can use torch_dtype=torch.float8_e4m3fn to enable quantization.
    device="cuda"
 )