Fix tokenizers training in notebook (#10110)

2025-07-03 12:50:06 +06:00 · 2021-02-09 21:48:22 -05:00 · 2021-02-09 21:48:22 -05:00 · 1fbaa3c117
commit 1fbaa3c117
parent 85395e4901
1 changed files with 1 additions and 1 deletions
--- a/notebooks/01-training-tokenizers.ipynb
+++ b/notebooks/01-training-tokenizers.ipynb
@@ -229,7 +229,7 @@
    "\n",
    "# We initialize our trainer, giving him the details about the vocabulary we want to generate\n",
    "trainer = BpeTrainer(vocab_size=25000, show_progress=True, initial_alphabet=ByteLevel.alphabet())\n",
-    "tokenizer.train(trainer, [\"big.txt\"])\n",
+    "tokenizer.train(files=[\"big.txt\"], trainer=trainer)\n",
    "\n",
    "print(\"Trained vocab size: {}\".format(tokenizer.get_vocab_size()))"
   ]