[generate] return Cache object even if passed in a legacy format (#35673)

* generate returns a Cache object by default

* fix tests

* fix test for encoder-decoder models
This commit is contained in:
Joao Gante
2025-01-16 17:06:24 +00:00
committed by GitHub
parent 2818307e93
commit 94af1c0aa2
9 changed files with 36 additions and 156 deletions

View File

@@ -268,18 +268,6 @@ class AriaForConditionalGenerationModelTest(ModelTesterMixin, GenerationTesterMi
def test_sdpa_can_dispatch_on_flash(self):
pass
# Unconditionally skipped no-op test; the skip reason string is left empty.
# NOTE(review): no rationale is recorded here for why this case is skipped.
@unittest.skip(reason="")
def test_new_cache_format_0(self):
pass
# Unconditionally skipped no-op test; the skip reason string is left empty.
# NOTE(review): no rationale is recorded here for why this case is skipped.
@unittest.skip(reason="")
def test_new_cache_format_1(self):
pass
# Unconditionally skipped no-op test; the skip reason string is left empty.
# NOTE(review): no rationale is recorded here for why this case is skipped.
@unittest.skip(reason="")
def test_new_cache_format_2(self):
pass
# Unconditionally skipped no-op test: the decorator records that feed-forward
# chunking is not yet supported.
# NOTE(review): presumably overrides a test inherited from one of the tester
# mixins named on the class — confirm against the mixin definitions.
@unittest.skip(reason="Feedforward chunking is not yet supported")
def test_feed_forward_chunking(self):
pass