update readme to mention add_special_tokens more clearly in example

2025-08-03 03:31:05 +06:00 · 2019-08-30 11:30:51 +02:00 · 2019-08-30 11:30:51 +02:00 · 306af132d7
commit 306af132d7
parent 50e6daf83a
1 changed file with 1 addition and 1 deletion
--- a/README.md
+++ b/README.md
@@ -93,7 +93,7 @@ for model_class, tokenizer_class, pretrained_weights in MODELS:
    model = model_class.from_pretrained(pretrained_weights)

    # Encode text
-    input_ids = torch.tensor([tokenizer.encode("Here is some text to encode")])
+    input_ids = torch.tensor([tokenizer.encode("Here is some text to encode", add_special_tokens=True)])  # Add special tokens takes care of adding [CLS], [SEP], <s>... tokens in the right way for each model.
    with torch.no_grad():
        last_hidden_states = model(input_ids)[0]  # Models outputs are now tuples