From d3c3e722d69627d6334d7ef8faaced7df3103174 Mon Sep 17 00:00:00 2001 From: Stefan Schweter Date: Tue, 27 Jul 2021 16:18:04 +0200 Subject: [PATCH] [FLAX] Minor fixes in CLM example (#12914) * readme: fix retrieval of vocab size for flax clm example * examples: fix flax clm example when using training/evaluation files --- examples/flax/language-modeling/README.md | 2 +- examples/flax/language-modeling/run_clm_flax.py | 6 +++--- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/examples/flax/language-modeling/README.md b/examples/flax/language-modeling/README.md index 0024beb848..b3efa047a6 100644 --- a/examples/flax/language-modeling/README.md +++ b/examples/flax/language-modeling/README.md @@ -211,7 +211,7 @@ from transformers import GPT2Config model_dir = "./norwegian-gpt2" # ${MODEL_DIR} -config = GPT2Config.from_pretrained("gpt2", resid_pdrop=0.0, embd_pdrop=0.0, attn_pdrop=0.0, vocab_size=tokenizer.vocab_size) +config = GPT2Config.from_pretrained("gpt2", resid_pdrop=0.0, embd_pdrop=0.0, attn_pdrop=0.0, vocab_size=tokenizer.get_vocab_size()) config.save_pretrained(model_dir) ``` diff --git a/examples/flax/language-modeling/run_clm_flax.py b/examples/flax/language-modeling/run_clm_flax.py index 23e550f51d..e763a63d63 100755 --- a/examples/flax/language-modeling/run_clm_flax.py +++ b/examples/flax/language-modeling/run_clm_flax.py @@ -308,14 +308,14 @@ def main(): extension = "text" dataset = load_dataset(extension, data_files=data_files, cache_dir=model_args.cache_dir) - if "validation" not in datasets.keys(): - datasets["validation"] = load_dataset( + if "validation" not in dataset.keys(): + dataset["validation"] = load_dataset( extension, data_files=data_files, split=f"train[:{data_args.validation_split_percentage}%]", cache_dir=model_args.cache_dir, ) - datasets["train"] = load_dataset( + dataset["train"] = load_dataset( extension, data_files=data_files, split=f"train[{data_args.validation_split_percentage}%:]",