From 1fbaa3c117e197be7b842198da633dac62053925 Mon Sep 17 00:00:00 2001 From: Anthony MOI Date: Tue, 9 Feb 2021 21:48:22 -0500 Subject: [PATCH] Fix tokenizers training in notebook (#10110) --- notebooks/01-training-tokenizers.ipynb | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/notebooks/01-training-tokenizers.ipynb b/notebooks/01-training-tokenizers.ipynb index 96c25c7998..218970647b 100644 --- a/notebooks/01-training-tokenizers.ipynb +++ b/notebooks/01-training-tokenizers.ipynb @@ -229,7 +229,7 @@ "\n", "# We initialize our trainer, giving him the details about the vocabulary we want to generate\n", "trainer = BpeTrainer(vocab_size=25000, show_progress=True, initial_alphabet=ByteLevel.alphabet())\n", - "tokenizer.train(trainer, [\"big.txt\"])\n", + "tokenizer.train(files=[\"big.txt\"], trainer=trainer)\n", "\n", "print(\"Trained vocab size: {}\".format(tokenizer.get_vocab_size()))" ]