Fix the check of models supporting FA/SDPA not being run (#28202)

* add check_support_list.py
* fix
* fix

---------

Co-authored-by: ydshieh <ydshieh@users.noreply.github.com>
2023-12-22 12:56:11 +01:00
parent e37ab52dff
commit bb3bd44739
4 changed files with 97 additions and 58 deletions
--- a/tests/utils/test_doc_samples.py
+++ b/tests/utils/test_doc_samples.py
@@ -16,7 +16,6 @@ import doctest
 import logging
 import os
 import unittest
-from glob import glob
 from pathlib import Path
 from typing import List, Union

@@ -27,63 +26,6 @@ from transformers.testing_utils import require_tf, require_torch, slow
 logger = logging.getLogger()


-@require_torch
-class TestDocLists(unittest.TestCase):
-    def test_flash_support_list(self):
-        with open("./docs/source/en/perf_infer_gpu_one.md", "r") as f:
-            doctext = f.read()
-
-            doctext = doctext.split("FlashAttention-2 is currently supported for the following architectures:")[1]
-            doctext = doctext.split("You can request to add FlashAttention-2 support")[0]
-
-        patterns = glob("./src/transformers/models/**/modeling_*.py")
-        patterns_tf = glob("./src/transformers/models/**/modeling_tf_*.py")
-        patterns_flax = glob("./src/transformers/models/**/modeling_flax_*.py")
-        patterns = list(set(patterns) - set(patterns_tf) - set(patterns_flax))
-        archs_supporting_fa2 = []
-        for filename in patterns:
-            with open(filename, "r") as f:
-                text = f.read()
-
-                if "_supports_flash_attn_2 = True" in text:
-                    model_name = os.path.basename(filename).replace(".py", "").replace("modeling_", "")
-                    archs_supporting_fa2.append(model_name)
-
-        for arch in archs_supporting_fa2:
-            if arch not in doctext:
-                raise ValueError(
-                    f"{arch} should be in listed in the flash attention documentation but is not. Please update the documentation."
-                )
-
-    def test_sdpa_support_list(self):
-        with open("./docs/source/en/perf_infer_gpu_one.md", "r") as f:
-            doctext = f.read()
-
-            doctext = doctext.split(
-                "For now, Transformers supports SDPA inference and training for the following architectures:"
-            )[1]
-            doctext = doctext.split("Note that FlashAttention can only be used for models using the")[0]
-
-        patterns = glob("./src/transformers/models/**/modeling_*.py")
-        patterns_tf = glob("./src/transformers/models/**/modeling_tf_*.py")
-        patterns_flax = glob("./src/transformers/models/**/modeling_flax_*.py")
-        patterns = list(set(patterns) - set(patterns_tf) - set(patterns_flax))
-        archs_supporting_sdpa = []
-        for filename in patterns:
-            with open(filename, "r") as f:
-                text = f.read()
-
-                if "_supports_sdpa = True" in text:
-                    model_name = os.path.basename(filename).replace(".py", "").replace("modeling_", "")
-                    archs_supporting_sdpa.append(model_name)
-
-        for arch in archs_supporting_sdpa:
-            if arch not in doctext:
-                raise ValueError(
-                    f"{arch} should be in listed in the SDPA documentation but is not. Please update the documentation."
-                )
-
-
@unittest.skip("Temporarily disable the doc tests.")
@require_torch
@require_tf