From 9830858671f403b398bc81f979232727b7f3b71a Mon Sep 17 00:00:00 2001 From: Lysandre Debut Date: Mon, 19 Feb 2024 13:23:25 +0100 Subject: [PATCH] Fix the `bert-base-cased` tokenizer configuration test (#29105) Fix test --- tests/models/auto/test_tokenization_auto.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/models/auto/test_tokenization_auto.py b/tests/models/auto/test_tokenization_auto.py index 2de5d1a917..7d4a302e4f 100644 --- a/tests/models/auto/test_tokenization_auto.py +++ b/tests/models/auto/test_tokenization_auto.py @@ -223,7 +223,7 @@ class AutoTokenizerTest(unittest.TestCase): config = get_tokenizer_config("google-bert/bert-base-cased") _ = config.pop("_commit_hash", None) # If we ever update google-bert/bert-base-cased tokenizer config, this dict here will need to be updated. - self.assertEqual(config, {"do_lower_case": False}) + self.assertEqual(config, {"do_lower_case": False, "model_max_length": 512}) # This model does not have a tokenizer_config so we get back an empty dict. config = get_tokenizer_config(SMALL_MODEL_IDENTIFIER)