Update modeling_baichuan.py
modeling_baichuan.py CHANGED (+2 -2)
@@ -114,8 +114,8 @@ class RotaryEmbedding(torch.nn.Module):
         t = torch.arange(self.max_seq_len_cached, device=self.inv_freq.device, dtype=torch.float32)
         freqs = torch.outer(t, self.inv_freq)
         emb = torch.cat((freqs, freqs), dim=-1)
-        self.register_buffer("cos_cached", emb.cos().to(
-        self.register_buffer("sin_cached", emb.sin().to(
+        self.register_buffer("cos_cached", emb.cos().to(self.inv_freq.device)[None, None, :, :], persistent=False)
+        self.register_buffer("sin_cached", emb.sin().to(self.inv_freq.device)[None, None, :, :], persistent=False)

     def forward(self, x, seq_len):
         # x: [bs, num_attention_heads, seq_len, head_size]