🚨 Don't use cache in non-generative models (#38751)

* deprecate for 1 version

* style

* fix some tests

* fix esm

* skip for now: gradient checkpointing (GC) requires positional args, but we pass keyword args

* remove transpose for scores in modified models only

* skip fx trace tests
This commit is contained in:
Raushan Turganbay
2025-07-01 11:08:21 +02:00
committed by GitHub
parent dbc98328da
commit e435574721
37 changed files with 969 additions and 2328 deletions

View File

@@ -276,6 +276,9 @@ SPECIAL_CASES_TO_ALLOW = {
"attention_chunk_size",
],
"Llama4VisionConfig": ["multi_modal_projector_bias", "norm_eps"],
# `position_embedding_type` is unused and deprecated; these allow-list entries should be deleted in v4.55
"LayoutLMConfig": ["position_embedding_type"],
"MarkupLMConfig": ["position_embedding_type"],
"SmolLM3Config": ["no_rope_layer_interval"],
"Gemma3nVisionConfig": ["architecture", "do_pooling", "model_args"], # this is for use in `timm`
}