From fd0ef8b66d957ac0fc94d715262dca1a6005a5ed Mon Sep 17 00:00:00 2001
From: Nicolas Patry
Date: Thu, 26 Jan 2023 14:50:09 +0100
Subject: [PATCH] Small QoL for qa. (#21316)

---
 src/transformers/pipelines/question_answering.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/src/transformers/pipelines/question_answering.py b/src/transformers/pipelines/question_answering.py
index 94b332aabd1..d4bb7f21029 100644
--- a/src/transformers/pipelines/question_answering.py
+++ b/src/transformers/pipelines/question_answering.py
@@ -404,6 +404,9 @@ class QuestionAnsweringPipeline(ChunkPipeline):
         if doc_stride is None:
             doc_stride = min(max_seq_len // 2, 128)
 
+        if doc_stride > max_seq_len:
+            raise ValueError(f"`doc_stride` ({doc_stride}) is larger than `max_seq_len` ({max_seq_len})")
+
         if not self.tokenizer.is_fast:
             features = squad_convert_examples_to_features(
                 examples=[example],