fix: Updated test_embeded_special_tokens for luke and mluke models (#32413)
Fixed tokenizer tests for luke, mluke models.
This commit is contained in:
@@ -146,11 +146,9 @@ class LukeTokenizerTest(TokenizerTesterMixin, unittest.TestCase):
|
|||||||
# token_type_ids should put 0 everywhere
|
# token_type_ids should put 0 everywhere
|
||||||
self.assertEqual(sum(tokens_r["token_type_ids"]), sum(tokens_p["token_type_ids"]))
|
self.assertEqual(sum(tokens_r["token_type_ids"]), sum(tokens_p["token_type_ids"]))
|
||||||
|
|
||||||
# token_type_ids should put 0 everywhere
|
|
||||||
self.assertEqual(sum(tokens_r["token_type_ids"]), sum(tokens_p["token_type_ids"]))
|
|
||||||
|
|
||||||
# attention_mask should put 1 everywhere, so sum over length should be 1
|
# attention_mask should put 1 everywhere, so sum over length should be 1
|
||||||
self.assertEqual(
|
self.assertEqual(
|
||||||
|
sum(tokens_r["attention_mask"]) / len(tokens_r["attention_mask"]),
|
||||||
sum(tokens_p["attention_mask"]) / len(tokens_p["attention_mask"]),
|
sum(tokens_p["attention_mask"]) / len(tokens_p["attention_mask"]),
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|||||||
@@ -109,11 +109,9 @@ class MLukeTokenizerTest(TokenizerTesterMixin, unittest.TestCase):
|
|||||||
# token_type_ids should put 0 everywhere
|
# token_type_ids should put 0 everywhere
|
||||||
self.assertEqual(sum(tokens_r["token_type_ids"]), sum(tokens_p["token_type_ids"]))
|
self.assertEqual(sum(tokens_r["token_type_ids"]), sum(tokens_p["token_type_ids"]))
|
||||||
|
|
||||||
# token_type_ids should put 0 everywhere
|
|
||||||
self.assertEqual(sum(tokens_r["token_type_ids"]), sum(tokens_p["token_type_ids"]))
|
|
||||||
|
|
||||||
# attention_mask should put 1 everywhere, so sum over length should be 1
|
# attention_mask should put 1 everywhere, so sum over length should be 1
|
||||||
self.assertEqual(
|
self.assertEqual(
|
||||||
|
sum(tokens_r["attention_mask"]) / len(tokens_r["attention_mask"]),
|
||||||
sum(tokens_p["attention_mask"]) / len(tokens_p["attention_mask"]),
|
sum(tokens_p["attention_mask"]) / len(tokens_p["attention_mask"]),
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user