Add ModernBERT Decoder Models - ModernBERT, but trained with CLM! (#38967)
* working locally; need to style and test * added docs and initial tests; need to debug and flesh out * fixed tests * working long context; batches * working fa2 and eager * update tests * add missing configs * remove default autoset * fix spacing * fix most tests * fixed tests * fix to init * refactor to match new transformers updates * remove static cache option * fa2 fix * fix docs * in progress * working on tests * fixed issue with attn outputs * remove debug * fix local config attr * update doc string * fix docstring * add docs to toc * correct typo in toc * add new updates from main w.r.t. ModernBERT RoPE * fix local param --------- Co-authored-by: oweller2 <oweller2@dsailogin.mgmt.ai.cluster> Co-authored-by: oweller2 <oweller2@l07.mgmt.ai.cluster> Co-authored-by: oweller2 <oweller2@n02.mgmt.ai.cluster> Co-authored-by: oweller2 <oweller2@l08.mgmt.ai.cluster> Co-authored-by: oweller2 <oweller2@l01.mgmt.ai.cluster> Co-authored-by: oweller2 <oweller2@l02.mgmt.ai.cluster>
This commit is contained in:
@@ -277,6 +277,19 @@ SPECIAL_CASES_TO_ALLOW = {
|
||||
"attention_chunk_size",
|
||||
],
|
||||
"Llama4VisionConfig": ["multi_modal_projector_bias", "norm_eps"],
|
||||
"ModernBertDecoderConfig": [
|
||||
"embedding_dropout",
|
||||
"hidden_activation",
|
||||
"initializer_cutoff_factor",
|
||||
"intermediate_size",
|
||||
"max_position_embeddings",
|
||||
"mlp_bias",
|
||||
"mlp_dropout",
|
||||
"classifier_activation",
|
||||
"global_attn_every_n_layers",
|
||||
"local_attention",
|
||||
"local_rope_theta",
|
||||
],
|
||||
# position_embedding_type not used and deprecated. Should be deleted in v4.55
|
||||
"LayoutLMConfig": ["position_embedding_type"],
|
||||
"MarkupLMConfig": ["position_embedding_type"],
|
||||
|
||||
Reference in New Issue
Block a user