[CodeLlamaTokenizer] Nit, update __init__ to make sure the AddedTokens are not normalized because they are special (#27359)
* make sure tokens are properly initialized for codellama slow
* add more pretrained models
* style
* test more tokenizers checkpoints
This commit is contained in:
@@ -150,6 +150,8 @@ class CodeLlamaTokenizationTest(TokenizerTesterMixin, unittest.TestCase):
|
||||
self.tokenizers_list = [
|
||||
(self.rust_tokenizer_class, "hf-internal-testing/llama-code-tokenizer", {}),
|
||||
(self.tokenizer_class, "hf-internal-testing/llama-code-tokenizer", {}),
|
||||
(self.tokenizer_class, "codellama/CodeLlama-34b-Instruct-hf", {}),
|
||||
(self.rust_tokenizer_class, "codellama/CodeLlama-34b-Instruct-hf", {}),
|
||||
]
|
||||
for tokenizer, pretrained_name, kwargs in self.tokenizers_list:
|
||||
with self.subTest(f"{tokenizer.__class__.__name__} ({pretrained_name})"):
|
||||
|
||||
Reference in New Issue
Block a user