fix train_new_from_iterator in the case of byte-level tokenizers (#17549)

This commit is contained in:
SaulLu
2022-06-08 15:30:41 +02:00
committed by GitHub
parent 264128cb9d
commit ae7bae8fe7
13 changed files with 56 additions and 0 deletions

View File

@@ -166,6 +166,11 @@ class GPT2ModelTester:
reorder_and_upcast_attn=reorder_and_upcast_attn,
)
def get_pipeline_config(self):
    """Return the tester's config with ``vocab_size`` overridden to 300.

    The config is obtained from ``self.get_config()``; its ``vocab_size``
    attribute is then set on that same object, which is returned.
    """
    config = self.get_config()
    # NOTE(review): 300 is presumably chosen to suit the tokenizer used by the
    # pipeline tests (this commit concerns byte-level tokenizers) — confirm.
    config.vocab_size = 300
    return config
def prepare_config_and_inputs_for_decoder(self):
(
config,