Raghavan
/

indictrans2-indic-en-dist-200M

text2text-generation

Model card Files Files and versions Community

Raghavan committed on Jan 20

Commit

d03c1e2

•

1 Parent(s): dd5aa99

Upload 7 files

Files changed (1) hide show

modeling_indictrans.py +9 -6

modeling_indictrans.py CHANGED Viewed

@@ -61,20 +61,23 @@ def shift_tokens_right(input_ids: torch.Tensor, pad_token_id: int, decoder_start
 def prepare_decoder_input_ids_label(decoder_input_ids, decoder_attention_mask):
-    labels = torch.full(decoder_input_ids.size(),-100)
-    labels[:, :-1] = decoder_input_ids[:, 1:]
     labels_mask = labels == 1
     labels[labels_mask] = -100
-    mask = (decoder_input_ids == eos_token_id)
-    decoder_input_ids[mask] = 1
-    decoder_attention_mask[mask] = 0
     return decoder_input_ids, decoder_attention_mask, labels
 # Copied from transformers.models.bart.modeling_bart._make_causal_mask
 def _make_causal_mask(
         input_ids_shape: torch.Size, dtype: torch.dtype, device: torch.device, past_key_values_length: int = 0

 def prepare_decoder_input_ids_label(decoder_input_ids, decoder_attention_mask):
+    new_decoder_input_ids = decoder_input_ids.clone().detach()
+    new_decoder_attention_mask = decoder_attention_mask.clone().detach()
+    labels = torch.full(new_decoder_input_ids.size(),-100)
+    labels[:, :-1] = new_decoder_input_ids[:, 1:]
     labels_mask = labels == 1
     labels[labels_mask] = -100
+    mask = (new_decoder_input_ids == eos_token_id)
+    new_decoder_input_ids[mask] = 1
+    new_decoder_attention_mask[mask] = 0
     return decoder_input_ids, decoder_attention_mask, labels
 # Copied from transformers.models.bart.modeling_bart._make_causal_mask
 def _make_causal_mask(
         input_ids_shape: torch.Size, dtype: torch.dtype, device: torch.device, past_key_values_length: int = 0