diff --git a/tests/models/deepseek_v3/test_modeling_deepseek_v3.py b/tests/models/deepseek_v3/test_modeling_deepseek_v3.py index e6a02626d8..6c0c3a19d0 100644 --- a/tests/models/deepseek_v3/test_modeling_deepseek_v3.py +++ b/tests/models/deepseek_v3/test_modeling_deepseek_v3.py @@ -318,6 +318,10 @@ class DeepseekV3ModelTest(ModelTesterMixin, GenerationTesterMixin, PipelineTeste def test_greedy_generate_dict_outputs_use_cache(self): pass + @unittest.skip(reason="SDPA can't dispatch on flash due to unsupported head dims") + def test_sdpa_can_dispatch_on_flash(self): + pass + def test_config(self): self.config_tester.run_common_tests()