[model][NPU]: Add NPU fusion operator patch to the Zimage model to improve performance

This commit is contained in:
feng0w0
2026-02-09 09:51:06 +08:00
parent 051b957adb
commit 3f8468893a

View File

@@ -27,4 +27,4 @@ def rotary_emb_Zimage_npu(self, x_in: torch.Tensor, freqs_cis: torch.Tensor):
cos, sin = torch.chunk(torch.view_as_real(freqs_cis), 2, dim=-1)
cos = cos.expand(-1, -1, -1, -1, 2).flatten(-2)
sin = sin.expand(-1, -1, -1, -1, 2).flatten(-2)
-return torch_npu.npu_rotary_mul(x_in, cos, sin).to(x_in)
+return torch_npu.npu_rotary_mul(x_in, cos, sin, rotary_mode="interleave").to(x_in)