🚨 Don't use cache in non-generative models (#38751)
* deprecate for 1 version
* style
* fix some tests
* fix esm
* skip for now, GC requires positional args but we have keyword args
* remove transpose for scores in modified models only
* skip fx trace tests
This commit is contained in:
committed by
GitHub
parent
dbc98328da
commit
e435574721
@@ -276,6 +276,9 @@ SPECIAL_CASES_TO_ALLOW = {
|
||||
"attention_chunk_size",
|
||||
],
|
||||
"Llama4VisionConfig": ["multi_modal_projector_bias", "norm_eps"],
|
||||
# position_embedding_type not used and deprecated. Should be deleted in v4.55
|
||||
"LayoutLMConfig": ["position_embedding_type"],
|
||||
"MarkupLMConfig": ["position_embedding_type"],
|
||||
"SmolLM3Config": ["no_rope_layer_interval"],
|
||||
"Gemma3nVisionConfig": ["architecture", "do_pooling", "model_args"], # this is for use in `timm`
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user