Raghavan
/

indictrans2-en-indic-dist-200M

text2text-generation

Model card · Files and versions · Community

Raghavan committed on Jan 21

Commit

1c5c454

•

1 Parent(s): b1e9935

Upload 7 files

Files changed (1) hide show

modeling_indictrans.py +2 -4

modeling_indictrans.py CHANGED Viewed

@@ -64,7 +64,7 @@ def prepare_decoder_input_ids_label(decoder_input_ids, decoder_attention_mask):
     new_decoder_input_ids = decoder_input_ids.clone().detach()
     new_decoder_attention_mask = decoder_attention_mask.clone().detach()
-    labels = torch.full(new_decoder_input_ids.size(),-100)
     labels[:, :-1] = new_decoder_input_ids[:, 1:]
     labels_mask = labels == 1
@@ -74,9 +74,7 @@ def prepare_decoder_input_ids_label(decoder_input_ids, decoder_attention_mask):
     new_decoder_input_ids[mask] = 1
     new_decoder_attention_mask[mask] = 0
-    return new_decoder_input_ids, new_decoder_attention_mask, labels
 # Copied from transformers.models.bart.modeling_bart._make_causal_mask

     new_decoder_input_ids = decoder_input_ids.clone().detach()
     new_decoder_attention_mask = decoder_attention_mask.clone().detach()
+    labels = torch.full(new_decoder_input_ids.size(), -100)
     labels[:, :-1] = new_decoder_input_ids[:, 1:]
     labels_mask = labels == 1
     new_decoder_input_ids[mask] = 1
     new_decoder_attention_mask[mask] = 0
+    return new_decoder_input_ids[:, :-1], new_decoder_attention_mask[:, :-1], labels[:, :-1]
 # Copied from transformers.models.bart.modeling_bart._make_causal_mask