[generate] return Cache object even if passed in a legacy format (#35673)
* generate returns a Cache object by default
* fix tests
* fix test for encoder-decoder models
This commit is contained in:
@@ -268,18 +268,6 @@ class AriaForConditionalGenerationModelTest(ModelTesterMixin, GenerationTesterMi
|
||||
def test_sdpa_can_dispatch_on_flash(self):
|
||||
pass
|
||||
|
||||
@unittest.skip(reason="")
|
||||
def test_new_cache_format_0(self):
|
||||
pass
|
||||
|
||||
@unittest.skip(reason="")
|
||||
def test_new_cache_format_1(self):
|
||||
pass
|
||||
|
||||
@unittest.skip(reason="")
|
||||
def test_new_cache_format_2(self):
|
||||
pass
|
||||
|
||||
@unittest.skip(reason="Feedforward chunking is not yet supported")
|
||||
def test_feed_forward_chunking(self):
|
||||
pass
|
||||
|
||||
Reference in New Issue
Block a user