From a638e986f45b338c86482e1c13e045c06cfeccad Mon Sep 17 00:00:00 2001 From: Patrick von Platen Date: Wed, 6 May 2020 00:42:34 +0200 Subject: [PATCH] fix hard wired pad token id (#4138) --- src/transformers/modeling_roberta.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/transformers/modeling_roberta.py b/src/transformers/modeling_roberta.py index 37e2877243..71bea22155 100644 --- a/src/transformers/modeling_roberta.py +++ b/src/transformers/modeling_roberta.py @@ -47,7 +47,7 @@ class RobertaEmbeddings(BertEmbeddings): def __init__(self, config): super().__init__(config) - self.padding_idx = 1 + self.padding_idx = config.pad_token_id self.word_embeddings = nn.Embedding(config.vocab_size, config.hidden_size, padding_idx=self.padding_idx) self.position_embeddings = nn.Embedding( config.max_position_embeddings, config.hidden_size, padding_idx=self.padding_idx