src/diffusers/models/attention.py (4 changes: 3 additions & 1 deletion)
Expand Up @@ -249,13 +249,15 @@ def reshape_batch_dim_to_heads(self, tensor):
return tensor

def forward(self, hidden_states, context=None, mask=None):
batch_size, sequence_length, dim = hidden_states.shape
batch_size, sequence_length, _ = hidden_states.shape

query = self.to_q(hidden_states)
context = context if context is not None else hidden_states
key = self.to_k(context)
value = self.to_v(context)

dim = query.shape[-1]
Contributor Author (commenting on the added line `dim = query.shape[-1]`):

The dim should be computed from the projected q, k, v (i.e. `inner_dim`), not from `hidden_states`.

Contributor Author:

The current CI passes, but only because the test happens to use inner_dim == hidden_states.shape[-1] (both are 64). When the two differ, we get an error.
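
To make the failure mode concrete, here is a minimal sketch of the mismatch the comment describes (hypothetical sizes and a bare nn.Linear standing in for `to_q`; this is not the diffusers test suite). The sliced-attention path allocates its output buffer as `(..., dim // heads)`, so taking `dim` from `hidden_states` instead of from the projected query leaves the buffer too narrow whenever `inner_dim != hidden_states.shape[-1]`:

```python
import torch
import torch.nn as nn

batch, seq_len, heads = 2, 8, 4
query_dim, inner_dim = 32, 64  # deliberately different, unlike the CI test (64 == 64)

hidden_states = torch.randn(batch, seq_len, query_dim)
to_q = nn.Linear(query_dim, inner_dim, bias=False)  # stand-in for self.to_q
query = to_q(hidden_states)

wrong_dim = hidden_states.shape[-1]  # 32: the input width (pre-fix behavior)
right_dim = query.shape[-1]          # 64: inner_dim (post-fix behavior)

# With the wrong dim, the per-head output buffer is (..., 32 // 4) = (..., 8),
# but each attention slice produced from the projected value is (..., 16).
out = torch.zeros(batch * heads, seq_len, wrong_dim // heads)
attn_slice = torch.randn(batch * heads, seq_len, right_dim // heads)
try:
    out[:] = attn_slice  # fails: cannot write a (..., 16) slice into a (..., 8) buffer
except RuntimeError as err:
    print("shape mismatch:", err)
```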


```diff
         query = self.reshape_heads_to_batch_dim(query)
         key = self.reshape_heads_to_batch_dim(key)
         value = self.reshape_heads_to_batch_dim(value)
```