Fix TeaCache bug with USP support integration and optimize memory usage by clearing the attention cache
This commit is contained in:
@@ -124,4 +124,6 @@ def usp_attn_forward(self, x, freqs):
|
||||
)
|
||||
x = x.flatten(2)
|
||||
|
||||
del q, k, v
|
||||
torch.cuda.empty_cache()
|
||||
return self.o(x)
|
||||
Reference in New Issue
Block a user