Remove @slow for test_eager_matches_sdpa_inference (#34558)

* update

* update

* update

* update

* update

* update

* update

* update

* update

* update

* update

---------

Co-authored-by: ydshieh <ydshieh@users.noreply.github.com>
This commit is contained in:
Yih-Dar
2024-11-05 16:10:42 +01:00
committed by GitHub
parent 082e57e0d4
commit f2d5dfbab2
21 changed files with 271 additions and 626 deletions

View File

@@ -19,7 +19,6 @@ import tempfile
import unittest
import pytest
from parameterized import parameterized
from transformers import NemotronConfig, is_torch_available
from transformers.testing_utils import (
@@ -99,15 +98,6 @@ class NemotronModelTest(GemmaModelTest):
self.model_tester = NemotronModelTester(self)
self.config_tester = ConfigTester(self, config_class=NemotronConfig, hidden_size=37)
# Placeholder for test_eager_matches_sdpa_inference: the body is a bare `pass`
# and the test is unconditionally skipped via unittest.skip (reason below).
# `parameterized.expand` supplies three dtype names ("float16", "bfloat16",
# "float32") as `torch_dtype`; the argument is never used by the body.
# NOTE(review): presumably this shadows a test inherited from GemmaModelTest
# in order to disable it for this model — confirm against the parent class.
@require_torch_sdpa
@slow
@unittest.skip(
reason="Due to custom causal mask, there is a slightly too big difference between eager and sdpa in bfloat16."
)
@parameterized.expand([("float16",), ("bfloat16",), ("float32",)])
def test_eager_matches_sdpa_inference(self, torch_dtype: str):
pass
# Placeholder for test_model_outputs_equivalence: unconditionally skipped via
# unittest.skip (reason string below). The body is a bare `pass`, and any
# keyword arguments are accepted and ignored.
@unittest.skip("Eager and SDPA do not produce the same outputs, thus this test fails")
def test_model_outputs_equivalence(self, **kwargs):
pass