mirror of
https://github.com/huggingface/transformers.git
synced 2025-07-31 02:02:21 +06:00
Correct segment ID for XLNet single sequence
This commit is contained in:
parent
073219b43f
commit
088fa7b759
@@ -240,7 +240,7 @@ class XLNetTokenizer(PreTrainedTokenizer):
|
||||
cls_segment_id = [2]
|
||||
|
||||
if token_ids_1 is None:
|
||||
- return len(token_ids_0 + sep + cls) * [0]
|
||||
+ return len(token_ids_0 + sep) * [0] + cls_segment_id
|
||||
return len(token_ids_0 + sep) * [0] + len(token_ids_1 + sep) * [1] + cls_segment_id
|
||||
|
||||
def save_vocabulary(self, save_directory):
|
||||
|
Loading…
Reference in New Issue
Block a user