From 0511369a8b6464ca3e51618ac816df1b34590144 Mon Sep 17 00:00:00 2001 From: Arthur <48595927+ArthurZucker@users.noreply.github.com> Date: Fri, 21 Jul 2023 14:32:34 +0200 Subject: [PATCH] [`LlamaConfig`] Nit: pad token should be None by default (#24958) * pad token should be None by default * fix tests * nits --- src/transformers/models/llama/configuration_llama.py | 2 +- tests/models/llama/test_modeling_llama.py | 3 +++ 2 files changed, 4 insertions(+), 1 deletion(-) diff --git a/src/transformers/models/llama/configuration_llama.py b/src/transformers/models/llama/configuration_llama.py index ea257b3a7b..4587772137 100644 --- a/src/transformers/models/llama/configuration_llama.py +++ b/src/transformers/models/llama/configuration_llama.py @@ -116,7 +116,7 @@ class LlamaConfig(PretrainedConfig): initializer_range=0.02, rms_norm_eps=1e-6, use_cache=True, - pad_token_id=0, + pad_token_id=None, bos_token_id=1, eos_token_id=2, pretraining_tp=1, diff --git a/tests/models/llama/test_modeling_llama.py b/tests/models/llama/test_modeling_llama.py index 80820a5013..c2efc3f5a3 100644 --- a/tests/models/llama/test_modeling_llama.py +++ b/tests/models/llama/test_modeling_llama.py @@ -58,6 +58,7 @@ class LlamaModelTester: initializer_range=0.02, num_labels=3, num_choices=4, + pad_token_id=0, scope=None, ): self.parent = parent @@ -81,6 +82,7 @@ class LlamaModelTester: self.initializer_range = initializer_range self.num_labels = num_labels self.num_choices = num_choices + self.pad_token_id = pad_token_id self.scope = scope def prepare_config_and_inputs(self): @@ -120,6 +122,7 @@ class LlamaModelTester: type_vocab_size=self.type_vocab_size, is_decoder=False, initializer_range=self.initializer_range, + pad_token_id=self.pad_token_id, ) def create_and_check_model(