Avoid erasing the attention mask when double padding (#8915)
This commit is contained in:
@@ -3047,8 +3047,7 @@ class PreTrainedTokenizerBase(SpecialTokensMixin):
                 encoded_inputs["input_ids"] = [self.pad_token_id] * difference + encoded_inputs["input_ids"]
             else:
                 raise ValueError("Invalid padding strategy:" + str(self.padding_side))
-        else:
-            if return_attention_mask:
-                encoded_inputs["attention_mask"] = [1] * len(encoded_inputs["input_ids"])
+        elif return_attention_mask and "attention_mask" not in encoded_inputs:
+            encoded_inputs["attention_mask"] = [1] * len(encoded_inputs["input_ids"])
 
         return encoded_inputs
Reference in New Issue
Block a user