ByT5 model (#11971)
* allow tf to use uneven num of layers * add tokenizer * finish docs * finish docs * Apply suggestions from code review * include in index * finish * Update docs/source/model_doc/byt5.rst Co-authored-by: NielsRogge <48327001+NielsRogge@users.noreply.github.com> * apply sylvais suggestions * make style Co-authored-by: NielsRogge <48327001+NielsRogge@users.noreply.github.com>
This commit is contained in:
committed by
GitHub
parent
1eb58b4560
commit
47a98fc4cb
@@ -30,7 +30,7 @@ from .test_modeling_common import ModelTesterMixin, ids_tensor
|
||||
if is_torch_available():
|
||||
import torch
|
||||
|
||||
from transformers import T5Config, T5EncoderModel, T5ForConditionalGeneration, T5Model, T5Tokenizer
|
||||
from transformers import ByT5Tokenizer, T5Config, T5EncoderModel, T5ForConditionalGeneration, T5Model, T5Tokenizer
|
||||
from transformers.models.t5.modeling_t5 import T5_PRETRAINED_MODEL_ARCHIVE_LIST
|
||||
|
||||
|
||||
@@ -846,6 +846,30 @@ class T5ModelIntegrationTests(unittest.TestCase):
|
||||
EXPECTED_SCORE = -59.0293
|
||||
self.assertTrue(abs(mtf_score - EXPECTED_SCORE) < 1e-4)
|
||||
|
||||
@slow
|
||||
def test_small_byt5_integration_test(self):
|
||||
"""
|
||||
For comparision run:
|
||||
>>> import t5 # pip install t5==0.9.1
|
||||
|
||||
>>> path_to_byt5_small_checkpoint = '<fill_in>'
|
||||
>>> t5_model = t5.models.MtfModel(model_dir=path_to_tf_checkpoint, batch_size=1, tpu=None)
|
||||
>>> vocab = t5.data.ByteVocabulary()
|
||||
>>> score = t5_model.score(inputs=["Hello there"], targets=["Hi I am"], vocabulary=vocab)
|
||||
"""
|
||||
|
||||
model = T5ForConditionalGeneration.from_pretrained("google/byt5-small").to(torch_device)
|
||||
tokenizer = ByT5Tokenizer.from_pretrained("google/byt5-small")
|
||||
|
||||
input_ids = tokenizer("Hello there", return_tensors="pt").input_ids
|
||||
labels = tokenizer("Hi I am", return_tensors="pt").input_ids
|
||||
|
||||
loss = model(input_ids.to(torch_device), labels=labels.to(torch_device)).loss
|
||||
mtf_score = -(labels.shape[-1] * loss.item())
|
||||
|
||||
EXPECTED_SCORE = -60.7397
|
||||
self.assertTrue(abs(mtf_score - EXPECTED_SCORE) < 1e-4)
|
||||
|
||||
@slow
|
||||
def test_summarization(self):
|
||||
model = self.model
|
||||
|
||||
Reference in New Issue
Block a user