diff --git a/tests/big_bird/test_modeling_big_bird.py b/tests/big_bird/test_modeling_big_bird.py index 711708ac2c9..df2ca8a157b 100644 --- a/tests/big_bird/test_modeling_big_bird.py +++ b/tests/big_bird/test_modeling_big_bird.py @@ -70,7 +70,7 @@ class BigBirdModelTester: attention_type="block_sparse", use_bias=True, rescale_embeddings=False, - block_size=16, + block_size=8, num_rand_blocks=3, position_embedding_type="absolute", scope=None, @@ -581,7 +581,7 @@ class BigBirdModelTest(ModelTesterMixin, unittest.TestCase): self.assertTrue( torch.allclose( hidden_states[0, 0, :5], - torch.tensor([1.4943, 0.0928, 0.8254, -0.2816, -0.9788], device=torch_device), + torch.tensor([1.4825, 0.0774, 0.8226, -0.2962, -0.9593], device=torch_device), atol=1e-3, ) )