mirror of
https://github.com/Stability-AI/stablediffusion.git
synced 2025-12-05 14:30:01 +01:00
* Use Cutlass ops when possible to gain +15% speed
This commit is contained in:
@@ -201,7 +201,7 @@ class MemoryEfficientCrossAttention(nn.Module):
|
||||
self.to_v = nn.Linear(context_dim, inner_dim, bias=False)
|
||||
|
||||
self.to_out = nn.Sequential(nn.Linear(inner_dim, query_dim), nn.Dropout(dropout))
|
||||
- self.attention_op: Optional[Any] = None
|
||||
+ self.attention_op: Optional[Any] = xformers.ops.MemoryEfficientAttentionCutlassOp if hasattr(xformers.ops, "MemoryEfficientAttentionCutlassOp") else None
|
||||
|
||||
def forward(self, x, context=None, mask=None):
|
||||
q = self.to_q(x)
|
||||
|
||||
@@ -234,7 +234,7 @@ class MemoryEfficientAttnBlock(nn.Module):
|
||||
kernel_size=1,
|
||||
stride=1,
|
||||
padding=0)
|
||||
- self.attention_op: Optional[Any] = None
|
||||
+ self.attention_op: Optional[Any] = xformers.ops.MemoryEfficientAttentionCutlassOp if hasattr(xformers.ops, "MemoryEfficientAttentionCutlassOp") else None
|
||||
|
||||
def forward(self, x):
|
||||
h_ = x
|
||||
|
||||
Reference in New Issue
Block a user