ybelkada
/

llama-xformers

ybelkada committed on Nov 15, 2023

Commit

24a2b9b

•

1 Parent(s): d37c4cf

Update llama_xformers_attention.py

Files changed (1) hide show

llama_xformers_attention.py CHANGED Viewed

@@ -70,10 +70,6 @@ class LlamaXFormersAttention(LlamaAttention):
  attn_weights = None
  attn_output = attn_output.reshape(bsz, q_len, self.hidden_size)
  attn_output = self.o_proj(attn_output)
- if not output_attentions:
- attn_weights = None
  return attn_output, attn_weights, past_key_value

  attn_weights = None
  attn_output = attn_output.reshape(bsz, q_len, self.hidden_size)
  attn_output = self.o_proj(attn_output)
  return attn_output, attn_weights, past_key_value