Correctly list the chat template file in the Tokenizer saved files list (#34974)
* Correctly list the chat template file in the saved files list * Update src/transformers/tokenization_utils_base.py Co-authored-by: Arthur <48595927+ArthurZucker@users.noreply.github.com> * Add save file checking to test * make fixup * better filename handling * make fixup --------- Co-authored-by: Arthur <48595927+ArthurZucker@users.noreply.github.com>
This commit is contained in:
@@ -1107,7 +1107,9 @@ class TokenizerTesterMixin:
|
||||
tokenizer.apply_chat_template(dummy_conversation, tokenize=True, return_dict=False)
|
||||
|
||||
with tempfile.TemporaryDirectory() as tmp_dir_name:
|
||||
tokenizer.save_pretrained(tmp_dir_name)
|
||||
save_files = tokenizer.save_pretrained(tmp_dir_name)
|
||||
# Check we aren't saving a chat_template.jinja file
|
||||
self.assertFalse(any(file.endswith("chat_template.jinja") for file in save_files))
|
||||
new_tokenizer = tokenizer.from_pretrained(tmp_dir_name)
|
||||
|
||||
self.assertEqual(new_tokenizer.chat_template, dummy_template) # Test template has persisted
|
||||
@@ -1117,7 +1119,9 @@ class TokenizerTesterMixin:
|
||||
new_tokenizer.apply_chat_template(dummy_conversation, tokenize=True, return_dict=False)
|
||||
|
||||
with tempfile.TemporaryDirectory() as tmp_dir_name:
|
||||
tokenizer.save_pretrained(tmp_dir_name, save_raw_chat_template=True)
|
||||
save_files = tokenizer.save_pretrained(tmp_dir_name, save_raw_chat_template=True)
|
||||
# Check we are saving a chat_template.jinja file
|
||||
self.assertTrue(any(file.endswith("chat_template.jinja") for file in save_files))
|
||||
chat_template_file = Path(tmp_dir_name) / "chat_template.jinja"
|
||||
self.assertTrue(chat_template_file.is_file())
|
||||
self.assertEqual(chat_template_file.read_text(), dummy_template)
|
||||
|
||||
Reference in New Issue
Block a user