Crystalcareai commited on
Commit
2fbb6c8
·
verified ·
1 Parent(s): 99b259e

Update modeling_gemmoe.py

Browse files
Files changed (1) hide show
  1. modeling_gemmoe.py +1 -3
modeling_gemmoe.py CHANGED
@@ -629,9 +629,7 @@ class GemmoeSdpaAttention(GemmoeAttention):
629
  key_states = key_states.contiguous()
630
  value_states = value_states.contiguous()
631
 
632
-
633
- causal_mask = causal_mask.to(query_states.dtype)
634
-
635
  attn_output = torch.nn.functional.scaled_dot_product_attention(
636
  query_states,
637
  key_states,
 
629
  key_states = key_states.contiguous()
630
  value_states = value_states.contiguous()
631
 
632
+
 
 
633
  attn_output = torch.nn.functional.scaled_dot_product_attention(
634
  query_states,
635
  key_states,