@@ -55,6 +55,22 @@ class CommonTestCases:
|
||||
def get_input_output_texts(self):
    """Placeholder hook that always raises ``NotImplementedError`` here.

    NOTE(review): presumably concrete tokenizer test classes override this
    to supply sample input/output texts -- confirm against the subclasses.

    Raises:
        NotImplementedError: always, in this base implementation.
    """
    raise NotImplementedError
|
||||
|
||||
def test_tokenizers_common_properties(self):
|
||||
tokenizer = self.get_tokenizer()
|
||||
attributes_list = ["bos_token", "eos_token", "unk_token", "sep_token",
|
||||
"pad_token", "cls_token", "mask_token"]
|
||||
for attr in attributes_list:
|
||||
self.assertTrue(hasattr(tokenizer, attr))
|
||||
self.assertTrue(hasattr(tokenizer, attr + "_id"))
|
||||
|
||||
self.assertTrue(hasattr(tokenizer, "additional_special_tokens"))
|
||||
self.assertTrue(hasattr(tokenizer, 'additional_special_tokens_ids'))
|
||||
|
||||
attributes_list = ["max_len", "init_inputs", "init_kwargs", "added_tokens_encoder",
|
||||
"added_tokens_decoder"]
|
||||
for attr in attributes_list:
|
||||
self.assertTrue(hasattr(tokenizer, attr))
|
||||
|
||||
def test_save_and_load_tokenizer(self):
|
||||
# safety check on max_len default value so we are sure the test works
|
||||
tokenizer = self.get_tokenizer()
|
||||
|
||||
Reference in New Issue
Block a user