From 380b2a031761e444a169f4d3379b30b718c16df6 Mon Sep 17 00:00:00 2001
From: Cyril Vallez <cyril.vallez@huggingface.co>
Date: Mon, 4 Aug 2025 14:41:09 +0200
Subject: [PATCH] Rework add-new-model-like with modular and make test
 filenames coherent (#39612)

* remove tf/flax

* fix

* style

* Update add_new_model_like.py

* work in progress

* continue

* more cleanup

* simplify and first final version

* fixes -> it works

* add linter checks

* Update add_new_model_like.py

* fix

* add modular conversion at the end

* Update add_new_model_like.py

* add video processor

* Update add_new_model_like.py

* Update add_new_model_like.py

* Update add_new_model_like.py

* fix

* Update image_processing_auto.py

* Update image_processing_auto.py

* fix post rebase

* start test filenames replacement

* rename all test_processor -> test_processing

* fix copied from

* add docstrings

* Update add_new_model_like.py

* fix regex

* improve wording

* Update add_new_model_like.py

* Update add_new_model_like.py

* Update add_new_model_like.py

* start adding test

* fix

* fix

* proper first test

* tests

* fix

* fix

* fix

* fix

* modular can be used from anywhere

* protect import

* fix

* Update add_new_model_like.py

* fix
---
 conftest.py                                   |    1 -
 .../commands/add_new_model_like.py            | 2182 +++++------------
 .../models/auto/image_processing_auto.py      |   78 +-
 src/transformers/utils/__init__.py            |    1 +
 src/transformers/utils/import_utils.py        |    5 +
 ...ssor_align.py => test_processing_align.py} |    0
 ..._altclip.py => test_processing_altclip.py} |    0
 ...cessor_aria.py => test_processing_aria.py} |    2 +-
 ...ision.py => test_processing_aya_vision.py} |    2 +-
 ...cessor_bark.py => test_processing_bark.py} |    0
 ...cessor_blip.py => test_processing_blip.py} |    0
 ...or_blip_2.py => test_processing_blip_2.py} |    0
 ...ower.py => test_processing_bridgetower.py} |    0
 ...meleon.py => test_processing_chameleon.py} |    2 +-
 ...lip.py => test_processing_chinese_clip.py} |    0
 ...cessor_clap.py => test_processing_clap.py} |    0
 ...cessor_clip.py => test_processing_clip.py} |    0
 ..._clipseg.py => test_processing_clipseg.py} |    0
 ...cessor_clvp.py => test_processing_clvp.py} |   12 +-
 .../models/colpali/test_processing_colpali.py |    2 +-
 .../colqwen2/test_processing_colqwen2.py      |    2 +-
 ...rocessor_csm.py => test_processing_csm.py} |    0
 ...k_vl.py => test_processing_deepseek_vl.py} |    0
 ... => test_processing_deepseek_vl_hybrid.py} |    0
 ...rocessor_dia.py => test_processing_dia.py} |    0
 ...ssor_donut.py => test_processing_donut.py} |    0
 ...cessor_emu3.py => test_processing_emu3.py} |    2 +-
 ...or_evolla.py => test_processing_evolla.py} |    0
 ...ssor_flava.py => test_processing_flava.py} |    0
 ...cessor_fuyu.py => test_processing_fuyu.py} |    2 +-
 tests/models/gemma3/test_processing_gemma3.py |    2 +-
 ...rocessor_git.py => test_processing_git.py} |    0
 ...ot_ocr2.py => test_processing_got_ocr2.py} |    0
 ...h.py => test_processing_granite_speech.py} |    0
 ...o.py => test_processing_grounding_dino.py} |   18 +-
 ..._idefics.py => test_processing_idefics.py} |    0
 ...defics2.py => test_processing_idefics2.py} |    0
 ...defics3.py => test_processing_idefics3.py} |    4 +-
 ...lip.py => test_processing_instructblip.py} |    0
 ...y => test_processing_instructblipvideo.py} |    0
 ...nternvl.py => test_processing_internvl.py} |    2 +-
 ...l.py => test_video_processing_internvl.py} |    0
 ...ssor_janus.py => test_processing_janus.py} |    0
 ..._kosmos2.py => test_processing_kosmos2.py} |    0
 ...tlmv2.py => test_processing_layoutlmv2.py} |    0
 ...tlmv3.py => test_processing_layoutlmv3.py} |    0
 ...outxlm.py => test_processing_layoutxlm.py} |    0
 ...or_llama4.py => test_processing_llama4.py} |    0
 ...ssor_llava.py => test_processing_llava.py} |    0
 ..._next.py => test_processing_llava_next.py} |    4 +-
 ...py => test_processing_llava_next_video.py} |    4 +-
 ....py => test_processing_llava_onevision.py} |    4 +-
 ...arkuplm.py => test_processing_markuplm.py} |    0
 ..._mgp_str.py => test_processing_mgp_str.py} |    0
 ...istral3.py => test_processing_mistral3.py} |    0
 ...or_mllama.py => test_processing_mllama.py} |    0
 ...usicgen.py => test_processing_musicgen.py} |    0
 ....py => test_processing_musicgen_melody.py} |    2 +-
 ...urbo.py => test_processing_omdet_turbo.py} |    0
 ...former.py => test_processing_oneformer.py} |    0
 ...ssor_owlv2.py => test_processing_owlv2.py} |    0
 ...or_owlvit.py => test_processing_owlvit.py} |    0
 ...igemma.py => test_processing_paligemma.py} |    2 +-
 ...lm.py => test_processing_perception_lm.py} |    0
 ...est_feature_extraction_phi4_multimodal.py} |    0
 ...truct.py => test_processing_pix2struct.py} |    0
 ..._pixtral.py => test_processing_pixtral.py} |    0
 ...2piano.py => test_processing_pop2piano.py} |    0
 ...mni.py => test_processing_qwen2_5_omni.py} |    0
 ..._5_vl.py => test_processing_qwen2_5_vl.py} |    2 +-
 ...udio.py => test_processing_qwen2_audio.py} |    0
 ...wen2_vl.py => test_processing_qwen2_vl.py} |    2 +-
 ...rocessor_sam.py => test_processing_sam.py} |    0
 ...ssor_samhq.py => test_processing_samhq.py} |    0
 ...m4t.py => test_processing_seamless_m4t.py} |    6 +-
 ..._smolvlm.py => test_processing_smolvlm.py} |    2 +-
 ...t.py => test_processing_speech_to_text.py} |    0
 ...peecht5.py => test_processing_speecht5.py} |    0
 ...ssor_trocr.py => test_processing_trocr.py} |    0
 ...cessor_udop.py => test_processing_udop.py} |    0
 ...st_processing_vision_text_dual_encoder.py} |    0
 ...av2vec2.py => test_processing_wav2vec2.py} |    0
 ...rt.py => test_processing_wav2vec2_bert.py} |    0
 ...py => test_processing_wav2vec2_with_lm.py} |    0
 ..._whisper.py => test_processing_whisper.py} |    0
 tests/utils/test_add_new_model_like.py        | 1948 ++++++---------
 utils/modular_model_converter.py              |   12 +-
 87 files changed, 1438 insertions(+), 2869 deletions(-)
 rename tests/models/align/{test_processor_align.py => test_processing_align.py} (100%)
 rename tests/models/altclip/{test_processor_altclip.py => test_processing_altclip.py} (100%)
 rename tests/models/aria/{test_processor_aria.py => test_processing_aria.py} (99%)
 rename tests/models/aya_vision/{test_processor_aya_vision.py => test_processing_aya_vision.py} (98%)
 rename tests/models/bark/{test_processor_bark.py => test_processing_bark.py} (100%)
 rename tests/models/blip/{test_processor_blip.py => test_processing_blip.py} (100%)
 rename tests/models/blip_2/{test_processor_blip_2.py => test_processing_blip_2.py} (100%)
 rename tests/models/bridgetower/{test_processor_bridgetower.py => test_processing_bridgetower.py} (100%)
 rename tests/models/chameleon/{test_processor_chameleon.py => test_processing_chameleon.py} (96%)
 rename tests/models/chinese_clip/{test_processor_chinese_clip.py => test_processing_chinese_clip.py} (100%)
 rename tests/models/clap/{test_processor_clap.py => test_processing_clap.py} (100%)
 rename tests/models/clip/{test_processor_clip.py => test_processing_clip.py} (100%)
 rename tests/models/clipseg/{test_processor_clipseg.py => test_processing_clipseg.py} (100%)
 rename tests/models/clvp/{test_processor_clvp.py => test_processing_clvp.py} (91%)
 rename tests/models/csm/{test_processor_csm.py => test_processing_csm.py} (100%)
 rename tests/models/deepseek_vl/{test_processor_deepseek_vl.py => test_processing_deepseek_vl.py} (100%)
 rename tests/models/deepseek_vl_hybrid/{test_processor_deepseek_vl_hybrid.py => test_processing_deepseek_vl_hybrid.py} (100%)
 rename tests/models/dia/{test_processor_dia.py => test_processing_dia.py} (100%)
 rename tests/models/donut/{test_processor_donut.py => test_processing_donut.py} (100%)
 rename tests/models/emu3/{test_processor_emu3.py => test_processing_emu3.py} (97%)
 rename tests/models/evolla/{test_processor_evolla.py => test_processing_evolla.py} (100%)
 rename tests/models/flava/{test_processor_flava.py => test_processing_flava.py} (100%)
 rename tests/models/fuyu/{test_processor_fuyu.py => test_processing_fuyu.py} (99%)
 rename tests/models/git/{test_processor_git.py => test_processing_git.py} (100%)
 rename tests/models/got_ocr2/{test_processor_got_ocr2.py => test_processing_got_ocr2.py} (100%)
 rename tests/models/granite_speech/{test_processor_granite_speech.py => test_processing_granite_speech.py} (100%)
 rename tests/models/grounding_dino/{test_processor_grounding_dino.py => test_processing_grounding_dino.py} (91%)
 rename tests/models/idefics/{test_processor_idefics.py => test_processing_idefics.py} (100%)
 rename tests/models/idefics2/{test_processor_idefics2.py => test_processing_idefics2.py} (100%)
 rename tests/models/idefics3/{test_processor_idefics3.py => test_processing_idefics3.py} (98%)
 rename tests/models/instructblip/{test_processor_instructblip.py => test_processing_instructblip.py} (100%)
 rename tests/models/instructblipvideo/{test_processor_instructblipvideo.py => test_processing_instructblipvideo.py} (100%)
 rename tests/models/internvl/{test_processor_internvl.py => test_processing_internvl.py} (99%)
 rename tests/models/internvl/{test_video_processor_internvl.py => test_video_processing_internvl.py} (100%)
 rename tests/models/janus/{test_processor_janus.py => test_processing_janus.py} (100%)
 rename tests/models/kosmos2/{test_processor_kosmos2.py => test_processing_kosmos2.py} (100%)
 rename tests/models/layoutlmv2/{test_processor_layoutlmv2.py => test_processing_layoutlmv2.py} (100%)
 rename tests/models/layoutlmv3/{test_processor_layoutlmv3.py => test_processing_layoutlmv3.py} (100%)
 rename tests/models/layoutxlm/{test_processor_layoutxlm.py => test_processing_layoutxlm.py} (100%)
 rename tests/models/llama4/{test_processor_llama4.py => test_processing_llama4.py} (100%)
 rename tests/models/llava/{test_processor_llava.py => test_processing_llava.py} (100%)
 rename tests/models/llava_next/{test_processor_llava_next.py => test_processing_llava_next.py} (96%)
 rename tests/models/llava_next_video/{test_processor_llava_next_video.py => test_processing_llava_next_video.py} (96%)
 rename tests/models/llava_onevision/{test_processor_llava_onevision.py => test_processing_llava_onevision.py} (96%)
 rename tests/models/markuplm/{test_processor_markuplm.py => test_processing_markuplm.py} (100%)
 rename tests/models/mgp_str/{test_processor_mgp_str.py => test_processing_mgp_str.py} (100%)
 rename tests/models/mistral3/{test_processor_mistral3.py => test_processing_mistral3.py} (100%)
 rename tests/models/mllama/{test_processor_mllama.py => test_processing_mllama.py} (100%)
 rename tests/models/musicgen/{test_processor_musicgen.py => test_processing_musicgen.py} (100%)
 rename tests/models/musicgen_melody/{test_processor_musicgen_melody.py => test_processing_musicgen_melody.py} (97%)
 rename tests/models/omdet_turbo/{test_processor_omdet_turbo.py => test_processing_omdet_turbo.py} (100%)
 rename tests/models/oneformer/{test_processor_oneformer.py => test_processing_oneformer.py} (100%)
 rename tests/models/owlv2/{test_processor_owlv2.py => test_processing_owlv2.py} (100%)
 rename tests/models/owlvit/{test_processor_owlvit.py => test_processing_owlvit.py} (100%)
 rename tests/models/paligemma/{test_processor_paligemma.py => test_processing_paligemma.py} (98%)
 rename tests/models/perception_lm/{test_processor_perception_lm.py => test_processing_perception_lm.py} (100%)
 rename tests/models/phi4_multimodal/{test_feature_extractor_phi4_multimodal.py => test_feature_extraction_phi4_multimodal.py} (100%)
 rename tests/models/pix2struct/{test_processor_pix2struct.py => test_processing_pix2struct.py} (100%)
 rename tests/models/pixtral/{test_processor_pixtral.py => test_processing_pixtral.py} (100%)
 rename tests/models/pop2piano/{test_processor_pop2piano.py => test_processing_pop2piano.py} (100%)
 rename tests/models/qwen2_5_omni/{test_processor_qwen2_5_omni.py => test_processing_qwen2_5_omni.py} (100%)
 rename tests/models/qwen2_5_vl/{test_processor_qwen2_5_vl.py => test_processing_qwen2_5_vl.py} (99%)
 rename tests/models/qwen2_audio/{test_processor_qwen2_audio.py => test_processing_qwen2_audio.py} (100%)
 rename tests/models/qwen2_vl/{test_processor_qwen2_vl.py => test_processing_qwen2_vl.py} (99%)
 rename tests/models/sam/{test_processor_sam.py => test_processing_sam.py} (100%)
 rename tests/models/sam_hq/{test_processor_samhq.py => test_processing_samhq.py} (100%)
 rename tests/models/seamless_m4t/{test_processor_seamless_m4t.py => test_processing_seamless_m4t.py} (92%)
 rename tests/models/smolvlm/{test_processor_smolvlm.py => test_processing_smolvlm.py} (99%)
 rename tests/models/speech_to_text/{test_processor_speech_to_text.py => test_processing_speech_to_text.py} (100%)
 rename tests/models/speecht5/{test_processor_speecht5.py => test_processing_speecht5.py} (100%)
 rename tests/models/trocr/{test_processor_trocr.py => test_processing_trocr.py} (100%)
 rename tests/models/udop/{test_processor_udop.py => test_processing_udop.py} (100%)
 rename tests/models/vision_text_dual_encoder/{test_processor_vision_text_dual_encoder.py => test_processing_vision_text_dual_encoder.py} (100%)
 rename tests/models/wav2vec2/{test_processor_wav2vec2.py => test_processing_wav2vec2.py} (100%)
 rename tests/models/wav2vec2_bert/{test_processor_wav2vec2_bert.py => test_processing_wav2vec2_bert.py} (100%)
 rename tests/models/wav2vec2_with_lm/{test_processor_wav2vec2_with_lm.py => test_processing_wav2vec2_with_lm.py} (100%)
 rename tests/models/whisper/{test_processor_whisper.py => test_processing_whisper.py} (100%)

diff --git a/conftest.py b/conftest.py
index 67e6eddfb8..e07103e4c3 100644
--- a/conftest.py
+++ b/conftest.py
@@ -29,7 +29,6 @@ from transformers.testing_utils import HfDoctestModule, HfDocTestParser
 NOT_DEVICE_TESTS = {
     "test_tokenization",
     "test_tokenization_mistral_common",
-    "test_processor",
     "test_processing",
     "test_beam_constraints",
     "test_configuration_utils",
diff --git a/src/transformers/commands/add_new_model_like.py b/src/transformers/commands/add_new_model_like.py
index cbb751ad75..74330b8d3c 100644
--- a/src/transformers/commands/add_new_model_like.py
+++ b/src/transformers/commands/add_new_model_like.py
@@ -11,1562 +11,569 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-
-# 1. Standard library
 import difflib
-import json
 import os
 import re
+import subprocess
+import textwrap
 from argparse import ArgumentParser, Namespace
-from dataclasses import dataclass
 from datetime import date
-from itertools import chain
 from pathlib import Path
-from re import Pattern
 from typing import Any, Callable, Optional, Union
 
-import yaml
-
-from ..models import auto as auto_module
-from ..models.auto.configuration_auto import model_type_to_module_name
-from ..utils import (
-    is_flax_available,
-    is_tf_available,
-    is_torch_available,
-    logging,
-)
+from ..models.auto.configuration_auto import CONFIG_MAPPING_NAMES, MODEL_NAMES_MAPPING
+from ..models.auto.feature_extraction_auto import FEATURE_EXTRACTOR_MAPPING_NAMES
+from ..models.auto.image_processing_auto import IMAGE_PROCESSOR_MAPPING_NAMES
+from ..models.auto.processing_auto import PROCESSOR_MAPPING_NAMES
+from ..models.auto.tokenization_auto import TOKENIZER_MAPPING_NAMES
+from ..models.auto.video_processing_auto import VIDEO_PROCESSOR_MAPPING_NAMES
+from ..utils import is_libcst_available
 from . import BaseTransformersCLICommand
 from .add_fast_image_processor import add_fast_image_processor
 
 
-logger = logging.get_logger(__name__)  # pylint: disable=invalid-name
+# We protect this import to avoid requiring it for all `transformers` CLI commands - however it is actually
+# strictly required for this one (we need it both for modular and for the following Visitor)
+if is_libcst_available():
+    import libcst as cst
+    from libcst import CSTVisitor
+    from libcst import matchers as m
+
+    class ClassFinder(CSTVisitor):
+        """
+        A libcst visitor recording every class name it visits and the entries of an `__all__` assignment.
+        """
+
+        def __init__(self):
+            self.classes: list = []  # name of every `ClassDef` node visited, in visit order
+            self.public_classes: list = []  # filled from the elements of the `__all__` assignment, if one is found
+            self.is_in_class = False  # True from `visit_ClassDef` until the next `leave_ClassDef`
+
+        def visit_ClassDef(self, node: cst.ClassDef) -> None:
+            """Record class names. We assume classes always only appear at top-level (i.e. no class definition in function or similar)"""
+            self.classes.append(node.name.value)
+            self.is_in_class = True
+
+        def leave_ClassDef(self, node: cst.ClassDef):
+            self.is_in_class = False  # NOTE(review): also reset when leaving a nested class; relies on the top-level assumption
+
+        def visit_SimpleStatementLine(self, node: cst.SimpleStatementLine):
+            """Record all public classes inside the `__all__` assignment."""
+            simple_top_level_assign_structure = m.SimpleStatementLine(
+                body=[m.Assign(targets=[m.AssignTarget(target=m.Name())])]
+            )
+            if not self.is_in_class and m.matches(node, simple_top_level_assign_structure):  # ignore class-body assignments
+                assigned_variable = node.body[0].targets[0].target.value
+                if assigned_variable == "__all__":
+                    elements = node.body[0].value.elements  # assumes the assigned value exposes `.elements` (list/tuple literal)
+                    self.public_classes = [element.value.value for element in elements]
 
 
 CURRENT_YEAR = date.today().year
 TRANSFORMERS_PATH = Path(__file__).parent.parent
 REPO_PATH = TRANSFORMERS_PATH.parent.parent
 
+COPYRIGHT = f"""
+# coding=utf-8
+# Copyright {CURRENT_YEAR} the HuggingFace Team. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+""".lstrip()
 
-@dataclass
-class ModelPatterns:
+
+class ModelInfos(object):
     """
-    Holds the basic information about a new model for the add-new-model-like command.
-
-    Args:
-        model_name (`str`): The model name.
-        checkpoint (`str`): The checkpoint to use for doc examples.
-        model_type (`str`, *optional*):
-            The model type, the identifier used internally in the library like `bert` or `xlm-roberta`. Will default to
-            `model_name` lowercased with spaces replaced with minuses (-).
-        model_lower_cased (`str`, *optional*):
-            The lowercased version of the model name, to use for the module name or function names. Will default to
-            `model_name` lowercased with spaces and minuses replaced with underscores.
-        model_camel_cased (`str`, *optional*):
-            The camel-cased version of the model name, to use for the class names. Will default to `model_name`
-            camel-cased (with spaces and minuses both considered as word separators.
-        model_upper_cased (`str`, *optional*):
-            The uppercased version of the model name, to use for the constant names. Will default to `model_name`
-            uppercased with spaces and minuses replaced with underscores.
-        config_class (`str`, *optional*):
-            The tokenizer class associated with this model. Will default to `"{model_camel_cased}Config"`.
-        tokenizer_class (`str`, *optional*):
-            The tokenizer class associated with this model (leave to `None` for models that don't use a tokenizer).
-        image_processor_class (`str`, *optional*):
-            The image processor class associated with this model (leave to `None` for models that don't use an image
-            processor).
-        image_processor_fast_class (`str`, *optional*):
-            The fast image processor class associated with this model (leave to `None` for models that don't use a fast
-            image processor).
-        feature_extractor_class (`str`, *optional*):
-            The feature extractor class associated with this model (leave to `None` for models that don't use a feature
-            extractor).
-        processor_class (`str`, *optional*):
-            The processor class associated with this model (leave to `None` for models that don't use a processor).
+    Retrieve basic information about the classes of an existing model.
     """
 
-    model_name: str
-    checkpoint: str
-    model_type: Optional[str] = None
-    model_lower_cased: Optional[str] = None
-    model_camel_cased: Optional[str] = None
-    model_upper_cased: Optional[str] = None
-    config_class: Optional[str] = None
-    tokenizer_class: Optional[str] = None
-    image_processor_class: Optional[str] = None
-    image_processor_fast_class: Optional[str] = None
-    feature_extractor_class: Optional[str] = None
-    processor_class: Optional[str] = None
+    def __init__(self, lowercase_name: str):
+        # Normalize to the underscore spelling first (lowercased; spaces and hyphens become underscores)
+        self.lowercase_name = lowercase_name.lower().replace(" ", "_").replace("-", "_")
+        if self.lowercase_name not in CONFIG_MAPPING_NAMES:
+            self.lowercase_name = self.lowercase_name.replace("_", "-")  # retry with the hyphenated spelling
+        if self.lowercase_name not in CONFIG_MAPPING_NAMES:
+            raise ValueError(f"{lowercase_name} is not a valid model name")
 
-    def __post_init__(self):
-        if self.model_type is None:
-            self.model_type = self.model_name.lower().replace(" ", "-")
-        if self.model_lower_cased is None:
-            self.model_lower_cased = self.model_name.lower().replace(" ", "_").replace("-", "_")
-        if self.model_camel_cased is None:
-            # Split the model name on - and space
-            words = self.model_name.split(" ")
-            words = list(chain(*[w.split("-") for w in words]))
-            # Make sure each word is capitalized
-            words = [w[0].upper() + w[1:] for w in words]
-            self.model_camel_cased = "".join(words)
-        if self.model_upper_cased is None:
-            self.model_upper_cased = self.model_name.upper().replace(" ", "_").replace("-", "_")
-        if self.config_class is None:
-            self.config_class = f"{self.model_camel_cased}Config"
+        self.paper_name = MODEL_NAMES_MAPPING[self.lowercase_name]
+        self.config_class = CONFIG_MAPPING_NAMES[self.lowercase_name]
+        self.camelcase_name = self.config_class.replace("Config", "")
 
-
-ATTRIBUTE_TO_PLACEHOLDER = {
-    "config_class": "[CONFIG_CLASS]",
-    "tokenizer_class": "[TOKENIZER_CLASS]",
-    "image_processor_class": "[IMAGE_PROCESSOR_CLASS]",
-    "image_processor_fast_class": "[IMAGE_PROCESSOR_FAST_CLASS]",
-    "feature_extractor_class": "[FEATURE_EXTRACTOR_CLASS]",
-    "processor_class": "[PROCESSOR_CLASS]",
-    "checkpoint": "[CHECKPOINT]",
-    "model_type": "[MODEL_TYPE]",
-    "model_upper_cased": "[MODEL_UPPER_CASED]",
-    "model_camel_cased": "[MODEL_CAMELCASED]",
-    "model_lower_cased": "[MODEL_LOWER_CASED]",
-    "model_name": "[MODEL_NAME]",
-}
-
-
-def is_empty_line(line: str) -> bool:
-    """
-    Determines whether a line is empty or not.
-    """
-    return len(line) == 0 or line.isspace()
-
-
-def find_indent(line: str) -> int:
-    """
-    Returns the number of spaces that start a line indent.
-    """
-    search = re.search(r"^(\s*)(?:\S|$)", line)
-    if search is None:
-        return 0
-    return len(search.groups()[0])
-
-
-def parse_module_content(content: str) -> list[str]:
-    """
-    Parse the content of a module in the list of objects it defines.
-
-    Args:
-        content (`str`): The content to parse
-
-    Returns:
-        `list[str]`: The list of objects defined in the module.
-    """
-    objects = []
-    current_object = []
-    lines = content.split("\n")
-    # Doc-styler takes everything between two triple quotes in docstrings, so we need a fake """ here to go with this.
-    end_markers = [")", "]", "}", '"""']
-
-    for line in lines:
-        # End of an object
-        is_valid_object = len(current_object) > 0
-        if is_valid_object and len(current_object) == 1:
-            is_valid_object = not current_object[0].startswith("# Copied from")
-        if not is_empty_line(line) and find_indent(line) == 0 and is_valid_object:
-            # Closing parts should be included in current object
-            if line in end_markers:
-                current_object.append(line)
-                objects.append("\n".join(current_object))
-                current_object = []
-            else:
-                objects.append("\n".join(current_object))
-                current_object = [line]
-        else:
-            current_object.append(line)
-
-    # Add last object
-    if len(current_object) > 0:
-        objects.append("\n".join(current_object))
-
-    return objects
-
-
-def extract_block(content: str, indent_level: int = 0) -> str:
-    """Return the first block in `content` with the indent level `indent_level`.
-
-    The first line in `content` should be indented at `indent_level` level, otherwise an error will be thrown.
-
-    This method will immediately stop the search when a (non-empty) line with indent level less than `indent_level` is
-    encountered.
-
-    Args:
-        content (`str`): The content to parse
-        indent_level (`int`, *optional*, default to 0): The indent level of the blocks to search for
-
-    Returns:
-        `str`: The first block in `content` with the indent level `indent_level`.
-    """
-    current_object = []
-    lines = content.split("\n")
-    # Doc-styler takes everything between two triple quotes in docstrings, so we need a fake """ here to go with this.
-    end_markers = [")", "]", "}", '"""']
-
-    for idx, line in enumerate(lines):
-        if idx == 0 and indent_level > 0 and not is_empty_line(line) and find_indent(line) != indent_level:
-            raise ValueError(
-                f"When `indent_level > 0`, the first line in `content` should have indent level {indent_level}. Got "
-                f"{find_indent(line)} instead."
+        # Get tokenizer class
+        if self.lowercase_name in TOKENIZER_MAPPING_NAMES:
+            self.tokenizer_class, self.fast_tokenizer_class = TOKENIZER_MAPPING_NAMES[self.lowercase_name]
+            self.fast_tokenizer_class = (
+                None if self.fast_tokenizer_class == "PreTrainedTokenizerFast" else self.fast_tokenizer_class
             )
-
-        if find_indent(line) < indent_level and not is_empty_line(line):
-            break
-
-        # End of an object
-        is_valid_object = len(current_object) > 0
-        if (
-            not is_empty_line(line)
-            and not line.endswith(":")
-            and find_indent(line) == indent_level
-            and is_valid_object
-        ):
-            # Closing parts should be included in current object
-            if line.lstrip() in end_markers:
-                current_object.append(line)
-            return "\n".join(current_object)
         else:
-            current_object.append(line)
+            self.tokenizer_class, self.fast_tokenizer_class = None, None
 
-    # Add last object
-    if len(current_object) > 0:
-        return "\n".join(current_object)
+        self.image_processor_class, self.fast_image_processor_class = IMAGE_PROCESSOR_MAPPING_NAMES.get(
+            self.lowercase_name, (None, None)
+        )
+        self.video_processor_class = VIDEO_PROCESSOR_MAPPING_NAMES.get(self.lowercase_name, None)
+        self.feature_extractor_class = FEATURE_EXTRACTOR_MAPPING_NAMES.get(self.lowercase_name, None)
+        self.processor_class = PROCESSOR_MAPPING_NAMES.get(self.lowercase_name, None)
 
 
-def add_content_to_text(
-    text: str,
-    content: str,
-    add_after: Optional[Union[str, Pattern]] = None,
-    add_before: Optional[Union[str, Pattern]] = None,
-    exact_match: bool = False,
-) -> str:
-    """
-    A utility to add some content inside a given text.
-
-    Args:
-       text (`str`): The text in which we want to insert some content.
-       content (`str`): The content to add.
-       add_after (`str` or `Pattern`):
-           The pattern to test on a line of `text`, the new content is added after the first instance matching it.
-       add_before (`str` or `Pattern`):
-           The pattern to test on a line of `text`, the new content is added before the first instance matching it.
-       exact_match (`bool`, *optional*, defaults to `False`):
-           A line is considered a match with `add_after` or `add_before` if it matches exactly when `exact_match=True`,
-           otherwise, if `add_after`/`add_before` is present in the line.
-
-    <Tip warning={true}>
-
-    The arguments `add_after` and `add_before` are mutually exclusive, and one exactly needs to be provided.
-
-    </Tip>
-
-    Returns:
-        `str`: The text with the new content added if a match was found.
-    """
-    if add_after is None and add_before is None:
-        raise ValueError("You need to pass either `add_after` or `add_before`")
-    if add_after is not None and add_before is not None:
-        raise ValueError("You can't pass both `add_after` or `add_before`")
-    pattern = add_after if add_before is None else add_before
-
-    def this_is_the_line(line):
-        if isinstance(pattern, Pattern):
-            return pattern.search(line) is not None
-        elif exact_match:
-            return pattern == line
-        else:
-            return pattern in line
-
-    new_lines = []
-    for line in text.split("\n"):
-        if this_is_the_line(line):
-            if add_before is not None:
-                new_lines.append(content)
-            new_lines.append(line)
-            if add_after is not None:
-                new_lines.append(content)
-        else:
-            new_lines.append(line)
-
-    return "\n".join(new_lines)
-
-
-def add_content_to_file(
-    file_name: Union[str, os.PathLike],
-    content: str,
-    add_after: Optional[Union[str, Pattern]] = None,
-    add_before: Optional[Union[str, Pattern]] = None,
-    exact_match: bool = False,
-):
+def add_content_to_file(file_name: Union[str, os.PathLike], new_content: str, add_after: str):
     """
     A utility to add some content inside a given file.
 
     Args:
-       file_name (`str` or `os.PathLike`): The name of the file in which we want to insert some content.
-       content (`str`): The content to add.
-       add_after (`str` or `Pattern`):
-           The pattern to test on a line of `text`, the new content is added after the first instance matching it.
-       add_before (`str` or `Pattern`):
-           The pattern to test on a line of `text`, the new content is added before the first instance matching it.
-       exact_match (`bool`, *optional*, defaults to `False`):
-           A line is considered a match with `add_after` or `add_before` if it matches exactly when `exact_match=True`,
-           otherwise, if `add_after`/`add_before` is present in the line.
-
-    <Tip warning={true}>
-
-    The arguments `add_after` and `add_before` are mutually exclusive, and one exactly needs to be provided.
-
-    </Tip>
+        file_name (`str` or `os.PathLike`):
+            The name of the file in which we want to insert some content.
+        new_content (`str`):
+            The content to add.
+        add_after (`str`):
+            Exact substring of the file; the new content is inserted right after its first occurrence.
     """
     with open(file_name, "r", encoding="utf-8") as f:
         old_content = f.read()
 
-    new_content = add_content_to_text(
-        old_content, content, add_after=add_after, add_before=add_before, exact_match=exact_match
-    )
+    before, after = old_content.split(add_after, 1)  # unpacking raises `ValueError` when `add_after` is absent
+    new_content = before + add_after + new_content + after
 
     with open(file_name, "w", encoding="utf-8") as f:
         f.write(new_content)
 
 
-def replace_model_patterns(
-    text: str, old_model_patterns: ModelPatterns, new_model_patterns: ModelPatterns
-) -> tuple[str, str]:
-    """
-    Replace all patterns present in a given text.
-
-    Args:
-        text (`str`): The text to treat.
-        old_model_patterns (`ModelPatterns`): The patterns for the old model.
-        new_model_patterns (`ModelPatterns`): The patterns for the new model.
-
-    Returns:
-        `Tuple(str, str)`: A tuple of with the treated text and the replacement actually done in it.
-    """
-    # The order is crucially important as we will check and replace in that order. For instance the config probably
-    # contains the camel-cased named, but will be treated before.
-    attributes_to_check = ["config_class"]
-    # Add relevant preprocessing classes
-    for attr in [
-        "tokenizer_class",
-        "image_processor_class",
-        "image_processor_fast_class",
-        "feature_extractor_class",
-        "processor_class",
-    ]:
-        if getattr(old_model_patterns, attr) is not None and getattr(new_model_patterns, attr) is not None:
-            attributes_to_check.append(attr)
-
-    # Special cases for checkpoint and model_type
-    if old_model_patterns.checkpoint not in [old_model_patterns.model_type, old_model_patterns.model_lower_cased]:
-        attributes_to_check.append("checkpoint")
-    if old_model_patterns.model_type != old_model_patterns.model_lower_cased:
-        attributes_to_check.append("model_type")
-    else:
-        text = re.sub(
-            rf'(\s*)model_type = "{old_model_patterns.model_type}"',
-            r'\1model_type = "[MODEL_TYPE]"',
-            text,
-        )
-
-    # Special case when the model camel cased and upper cased names are the same for the old model (like for GPT2) but
-    # not the new one. We can't just do a replace in all the text and will need a special regex
-    if old_model_patterns.model_upper_cased == old_model_patterns.model_camel_cased:
-        old_model_value = old_model_patterns.model_upper_cased
-        if re.search(rf"{old_model_value}_[A-Z_]*[^A-Z_]", text) is not None:
-            text = re.sub(rf"{old_model_value}([A-Z_]*)([^a-zA-Z_])", r"[MODEL_UPPER_CASED]\1\2", text)
-    else:
-        attributes_to_check.append("model_upper_cased")
-
-    attributes_to_check.extend(["model_camel_cased", "model_lower_cased", "model_name"])
-
-    # Now let's replace every other attribute by their placeholder
-    for attr in attributes_to_check:
-        text = text.replace(getattr(old_model_patterns, attr), ATTRIBUTE_TO_PLACEHOLDER[attr])
-
-    # Finally we can replace the placeholder byt the new values.
-    replacements = []
-    for attr, placeholder in ATTRIBUTE_TO_PLACEHOLDER.items():
-        if placeholder in text:
-            replacements.append((getattr(old_model_patterns, attr), getattr(new_model_patterns, attr)))
-            text = text.replace(placeholder, getattr(new_model_patterns, attr))
-
-    # If we have two inconsistent replacements, we don't return anything (ex: GPT2->GPT_NEW and GPT2->GPTNew)
-    old_replacement_values = [old for old, new in replacements]
-    if len(set(old_replacement_values)) != len(old_replacement_values):
-        return text, ""
-
-    replacements = simplify_replacements(replacements)
-    replacements = [f"{old}->{new}" for old, new in replacements]
-    return text, ",".join(replacements)
-
-
-def simplify_replacements(replacements):
-    """
-    Simplify a list of replacement patterns to make sure there are no needless ones.
-
-    For instance in the sequence "Bert->BertNew, BertConfig->BertNewConfig, bert->bert_new", the replacement
-    "BertConfig->BertNewConfig" is implied by "Bert->BertNew" so not needed.
-
-    Args:
-        replacements (`list[tuple[str, str]]`): List of patterns (old, new)
-
-    Returns:
-        `list[tuple[str, str]]`: The list of patterns simplified.
-    """
-    if len(replacements) <= 1:
-        # Nothing to simplify
-        return replacements
-
-    # Next let's sort replacements by length as a replacement can only "imply" another replacement if it's shorter.
-    replacements.sort(key=lambda x: len(x[0]))
-
-    idx = 0
-    while idx < len(replacements):
-        old, new = replacements[idx]
-        # Loop through all replacements after
-        j = idx + 1
-        while j < len(replacements):
-            old_2, new_2 = replacements[j]
-            # If the replacement is implied by the current one, we can drop it.
-            if old_2.replace(old, new) == new_2:
-                replacements.pop(j)
-            else:
-                j += 1
-        idx += 1
-
-    return replacements
-
-
-def get_module_from_file(module_file: Union[str, os.PathLike]) -> str:
-    """
-    Returns the module name corresponding to a module file.
-    """
-    full_module_path = Path(module_file).absolute()
-    module_parts = full_module_path.with_suffix("").parts
-
-    # Find the first part named transformers, starting from the end.
-    idx = len(module_parts) - 1
-    while idx >= 0 and module_parts[idx] != "transformers":
-        idx -= 1
-    if idx < 0:
-        raise ValueError(f"{module_file} is not a transformers module.")
-
-    return ".".join(module_parts[idx:])
-
-
-SPECIAL_PATTERNS = {
-    "_CHECKPOINT_FOR_DOC =": "checkpoint",
-    "_CONFIG_FOR_DOC =": "config_class",
-    "_TOKENIZER_FOR_DOC =": "tokenizer_class",
-    "_IMAGE_PROCESSOR_FOR_DOC =": "image_processor_class",
-    "_FEAT_EXTRACTOR_FOR_DOC =": "feature_extractor_class",
-    "_PROCESSOR_FOR_DOC =": "processor_class",
-}
-
-
-_re_class_func = re.compile(r"^(?:class|def)\s+([^\s:\(]+)\s*(?:\(|\:)", flags=re.MULTILINE)
-
-
-def remove_attributes(obj, target_attr):
-    """Remove `target_attr` in `obj`."""
-    lines = obj.split(os.linesep)
-
-    target_idx = None
-    for idx, line in enumerate(lines):
-        # search for assignment
-        if line.lstrip().startswith(f"{target_attr} = "):
-            target_idx = idx
-            break
-        # search for function/method definition
-        elif line.lstrip().startswith(f"def {target_attr}("):
-            target_idx = idx
-            break
-
-    # target not found
-    if target_idx is None:
-        return obj
-
-    line = lines[target_idx]
-    indent_level = find_indent(line)
-    # forward pass to find the ending of the block (including empty lines)
-    parsed = extract_block("\n".join(lines[target_idx:]), indent_level)
-    num_lines = len(parsed.split("\n"))
-    for idx in range(num_lines):
-        lines[target_idx + idx] = None
-
-    # backward pass to find comments or decorator
-    for idx in range(target_idx - 1, -1, -1):
-        line = lines[idx]
-        if (line.lstrip().startswith("#") or line.lstrip().startswith("@")) and find_indent(line) == indent_level:
-            lines[idx] = None
-        else:
-            break
-
-    new_obj = os.linesep.join([x for x in lines if x is not None])
-
-    return new_obj
-
-
-def duplicate_module(
-    module_file: Union[str, os.PathLike],
-    old_model_patterns: ModelPatterns,
-    new_model_patterns: ModelPatterns,
-    dest_file: Optional[str] = None,
-    add_copied_from: bool = True,
-    attrs_to_remove: Optional[list[str]] = None,
+def add_model_to_auto_mappings(
+    old_model_infos: ModelInfos,
+    new_lowercase_name: str,
+    new_model_paper_name: str,
+    filenames_to_add: list[tuple[str, bool]],
 ):
     """
-    Create a new module from an existing one and adapting all function and classes names from old patterns to new ones.
+    Add a model to all the relevant mappings in the auto module.
 
     Args:
-        module_file (`str` or `os.PathLike`): Path to the module to duplicate.
-        old_model_patterns (`ModelPatterns`): The patterns for the old model.
-        new_model_patterns (`ModelPatterns`): The patterns for the new model.
-        dest_file (`str` or `os.PathLike`, *optional*): Path to the new module.
-        add_copied_from (`bool`, *optional*, defaults to `True`):
-            Whether or not to add `# Copied from` statements in the duplicated module.
+        old_model_infos (`ModelInfos`):
+            The structure containing the class information of the old model.
+        new_lowercase_name (`str`):
+            The new lowercase model name.
+        new_model_paper_name (`str`):
+            The fully cased name (as in the official paper name) of the new model.
+        filenames_to_add (`list[tuple[str, bool]]`):
+            A list of tuples of all potential filenames to add for a new model, along with a boolean flag describing if we
+            should add this file or not. For example, [(`modeling_xxx.py`, True), (`configuration_xxx.py`, True), (`tokenization_xxx.py`, False),...]
     """
-    if dest_file is None:
-        dest_file = str(module_file).replace(
-            old_model_patterns.model_lower_cased, new_model_patterns.model_lower_cased
-        )
-
-    with open(module_file, "r", encoding="utf-8") as f:
-        content = f.read()
-
-    content = re.sub(r"# Copyright (\d+)\s", f"# Copyright {CURRENT_YEAR} ", content)
-    objects = parse_module_content(content)
-
-    # Loop and treat all objects
-    new_objects = []
-    for obj in objects:
-        special_pattern = False
-        for pattern, attr in SPECIAL_PATTERNS.items():
-            if pattern in obj:
-                obj = obj.replace(getattr(old_model_patterns, attr), getattr(new_model_patterns, attr))
-                new_objects.append(obj)
-                special_pattern = True
-                break
-
-        if special_pattern:
-            continue
-
-        # Regular classes functions
-        old_obj = obj
-        obj, replacement = replace_model_patterns(obj, old_model_patterns, new_model_patterns)
-        has_copied_from = re.search(r"^#\s+Copied from", obj, flags=re.MULTILINE) is not None
-        if add_copied_from and not has_copied_from and _re_class_func.search(obj) is not None and len(replacement) > 0:
-            # Copied from statement must be added just before the class/function definition, which may not be the
-            # first line because of decorators.
-            module_name = get_module_from_file(module_file)
-            old_object_name = _re_class_func.search(old_obj).groups()[0]
-            obj = add_content_to_text(
-                obj, f"# Copied from {module_name}.{old_object_name} with {replacement}", add_before=_re_class_func
-            )
-        # In all cases, we remove Copied from statement with indent on methods.
-        obj = re.sub("\n[ ]+# Copied from [^\n]*\n", "\n", obj)
-
-        new_objects.append(obj)
-
-    content = "\n".join(new_objects)
-    # Remove some attributes that we don't want to copy to the new file(s)
-    if attrs_to_remove is not None:
-        for attr in attrs_to_remove:
-            content = remove_attributes(content, target_attr=attr)
-
-    with open(dest_file, "w", encoding="utf-8") as f:
-        f.write(content)
-
-
-def filter_framework_files(
-    files: list[Union[str, os.PathLike]], frameworks: Optional[list[str]] = None
-) -> list[Union[str, os.PathLike]]:
-    """
-    Filter a list of files to only keep the ones corresponding to a list of frameworks.
-
-    Args:
-        files (`list[Union[str, os.PathLike]]`): The list of files to filter.
-        frameworks (`list[str]`, *optional*): The list of allowed frameworks.
-
-    Returns:
-        `list[Union[str, os.PathLike]]`: The list of filtered files.
-    """
-    if frameworks is None:
-        frameworks = get_default_frameworks()
-
-    framework_to_file = {}
-    others = []
-    for f in files:
-        parts = Path(f).name.split("_")
-        if "modeling" not in parts:
-            others.append(f)
-            continue
-        if "tf" in parts:
-            framework_to_file["tf"] = f
-        elif "flax" in parts:
-            framework_to_file["flax"] = f
-        else:
-            framework_to_file["pt"] = f
-
-    return [framework_to_file[f] for f in frameworks if f in framework_to_file] + others
-
-
-def get_model_files(model_type: str, frameworks: Optional[list[str]] = None) -> dict[str, Union[Path, list[Path]]]:
-    """
-    Retrieves all the files associated to a model.
-
-    Args:
-        model_type (`str`): A valid model type (like "bert" or "gpt2")
-        frameworks (`list[str]`, *optional*):
-            If passed, will only keep the model files corresponding to the passed frameworks.
-
-    Returns:
-        `dict[str, Union[Path, list[Path]]]`: A dictionary with the following keys:
-        - **doc_file** -- The documentation file for the model.
-        - **model_files** -- All the files in the model module.
-        - **test_files** -- The test files for the model.
-    """
-    module_name = model_type_to_module_name(model_type)
-
-    model_module = TRANSFORMERS_PATH / "models" / module_name
-    model_files = list(model_module.glob("*.py"))
-    model_files = filter_framework_files(model_files, frameworks=frameworks)
-
-    doc_file = REPO_PATH / "docs" / "source" / "en" / "model_doc" / f"{model_type}.md"
-
-    # Basic pattern for test files
-    test_files = [
-        f"test_modeling_{module_name}.py",
-        f"test_modeling_tf_{module_name}.py",
-        f"test_modeling_flax_{module_name}.py",
-        f"test_tokenization_{module_name}.py",
-        f"test_image_processing_{module_name}.py",
-        f"test_feature_extraction_{module_name}.py",
-        f"test_processor_{module_name}.py",
+    new_cased_name = "".join(x.title() for x in new_lowercase_name.replace("-", "_").split("_"))
+    old_lowercase_name = old_model_infos.lowercase_name
+    old_cased_name = old_model_infos.camelcase_name
+    filenames_to_add = [
+        (filename.replace(old_lowercase_name, "auto"), to_add) for filename, to_add in filenames_to_add[1:]
     ]
-    test_files = filter_framework_files(test_files, frameworks=frameworks)
-    # Add the test directory
-    test_files = [REPO_PATH / "tests" / "models" / module_name / f for f in test_files]
-    # Filter by existing files
-    test_files = [f for f in test_files if f.exists()]
+    # fast tokenizer/image processor have the same auto mappings as normal ones
+    corrected_filenames_to_add = []
+    for file, to_add in filenames_to_add:
+        if re.search(r"(?:tokenization)|(?:image_processing)_auto_fast.py", file):
+            previous_file, previous_to_add = corrected_filenames_to_add[-1]
+            corrected_filenames_to_add[-1] = (previous_file, previous_to_add or to_add)
+        else:
+            corrected_filenames_to_add.append((file, to_add))
 
-    return {"doc_file": doc_file, "model_files": model_files, "module_name": module_name, "test_files": test_files}
-
-
-_re_checkpoint_in_config = re.compile(r"\[(.+?)\]\((https://huggingface\.co/.+?)\)")
-
-
-def find_base_model_checkpoint(
-    model_type: str, model_files: Optional[dict[str, Union[Path, list[Path]]]] = None
-) -> str:
-    """
-    Finds the model checkpoint used in the docstrings for a given model.
-
-    Args:
-        model_type (`str`): A valid model type (like "bert" or "gpt2")
-        model_files (`dict[str, Union[Path, list[Path]]`, *optional*):
-            The files associated to `model_type`. Can be passed to speed up the function, otherwise will be computed.
-
-    Returns:
-        `str`: The checkpoint used.
-    """
-    if model_files is None:
-        model_files = get_model_files(model_type)
-    module_files = model_files["model_files"]
-    for fname in module_files:
-        # After the @auto_docstring refactor, we expect the checkpoint to be in the configuration file's docstring
-        if "configuration" not in str(fname):
-            continue
-
-        with open(fname, "r", encoding="utf-8") as f:
-            content = f.read()
-            if _re_checkpoint_in_config.search(content) is not None:
-                checkpoint = _re_checkpoint_in_config.search(content).groups()[0]
-                # Remove quotes
-                checkpoint = checkpoint.replace('"', "")
-                checkpoint = checkpoint.replace("'", "")
-                return checkpoint
-
-    # TODO: Find some kind of fallback if there is no _CHECKPOINT_FOR_DOC in any of the modeling file.
-    return ""
-
-
-def get_default_frameworks():
-    """
-    Returns the list of frameworks (PyTorch, TensorFlow, Flax) that are installed in the environment.
-    """
-    frameworks = []
-    if is_torch_available():
-        frameworks.append("pt")
-    if is_tf_available():
-        frameworks.append("tf")
-    if is_flax_available():
-        frameworks.append("flax")
-    return frameworks
-
-
-_re_model_mapping = re.compile("MODEL_([A-Z_]*)MAPPING_NAMES")
-
-
-def retrieve_model_classes(model_type: str, frameworks: Optional[list[str]] = None) -> dict[str, list[str]]:
-    """
-    Retrieve the model classes associated to a given model.
-
-    Args:
-        model_type (`str`): A valid model type (like "bert" or "gpt2")
-        frameworks (`list[str]`, *optional*):
-            The frameworks to look for. Will default to `["pt", "tf", "flax"]`, passing a smaller list will restrict
-            the classes returned.
-
-    Returns:
-        `dict[str, list[str]]`: A dictionary with one key per framework and the list of model classes associated to
-        that framework as values.
-    """
-    if frameworks is None:
-        frameworks = get_default_frameworks()
-
-    modules = {
-        "pt": auto_module.modeling_auto if is_torch_available() else None,
-        "tf": auto_module.modeling_tf_auto if is_tf_available() else None,
-        "flax": auto_module.modeling_flax_auto if is_flax_available() else None,
-    }
-
-    model_classes = {}
-    for framework in frameworks:
-        new_model_classes = []
-        if modules[framework] is None:
-            raise ValueError(f"You selected {framework} in the frameworks, but it is not installed.")
-        model_mappings = [attr for attr in dir(modules[framework]) if _re_model_mapping.search(attr) is not None]
-        for model_mapping_name in model_mappings:
-            model_mapping = getattr(modules[framework], model_mapping_name)
-            if model_type in model_mapping:
-                new_model_classes.append(model_mapping[model_type])
-
-        if len(new_model_classes) > 0:
-            # Remove duplicates
-            model_classes[framework] = list(set(new_model_classes))
-
-    return model_classes
-
-
-def retrieve_info_for_model(model_type, frameworks: Optional[list[str]] = None):
-    """
-    Retrieves all the information from a given model_type.
-
-    Args:
-        model_type (`str`): A valid model type (like "bert" or "gpt2")
-        frameworks (`list[str]`, *optional*):
-            If passed, will only keep the info corresponding to the passed frameworks.
-
-    Returns:
-        `Dict`: A dictionary with the following keys:
-        - **frameworks** (`list[str]`): The list of frameworks that back this model type.
-        - **model_classes** (`dict[str, list[str]]`): The model classes implemented for that model type.
-        - **model_files** (`dict[str, Union[Path, list[Path]]]`): The files associated with that model type.
-        - **model_patterns** (`ModelPatterns`): The various patterns for the model.
-    """
-    if model_type not in auto_module.MODEL_NAMES_MAPPING:
-        raise ValueError(f"{model_type} is not a valid model type.")
-
-    model_name = auto_module.MODEL_NAMES_MAPPING[model_type]
-    config_class = auto_module.configuration_auto.CONFIG_MAPPING_NAMES[model_type]
-    if model_type in auto_module.tokenization_auto.TOKENIZER_MAPPING_NAMES:
-        tokenizer_classes = auto_module.tokenization_auto.TOKENIZER_MAPPING_NAMES[model_type]
-        tokenizer_class = tokenizer_classes[0] if tokenizer_classes[0] is not None else tokenizer_classes[1]
-    else:
-        tokenizer_class = None
-    image_processor_classes = auto_module.image_processing_auto.IMAGE_PROCESSOR_MAPPING_NAMES.get(model_type, None)
-    if isinstance(image_processor_classes, tuple):
-        image_processor_class, image_processor_fast_class = image_processor_classes
-    else:
-        image_processor_class = image_processor_classes
-        image_processor_fast_class = None
-    feature_extractor_class = auto_module.feature_extraction_auto.FEATURE_EXTRACTOR_MAPPING_NAMES.get(model_type, None)
-    processor_class = auto_module.processing_auto.PROCESSOR_MAPPING_NAMES.get(model_type, None)
-
-    model_files = get_model_files(model_type, frameworks=frameworks)
-    model_camel_cased = config_class.replace("Config", "")
-
-    available_frameworks = []
-    for fname in model_files["model_files"]:
-        if "modeling_tf" in str(fname):
-            available_frameworks.append("tf")
-        elif "modeling_flax" in str(fname):
-            available_frameworks.append("flax")
-        elif "modeling" in str(fname):
-            available_frameworks.append("pt")
-
-    if frameworks is None:
-        frameworks = get_default_frameworks()
-
-    frameworks = [f for f in frameworks if f in available_frameworks]
-
-    model_classes = retrieve_model_classes(model_type, frameworks=frameworks)
-
-    model_upper_cased = model_camel_cased.upper()
-    model_patterns = ModelPatterns(
-        model_name,
-        checkpoint=find_base_model_checkpoint(model_type, model_files=model_files),
-        model_type=model_type,
-        model_camel_cased=model_camel_cased,
-        model_lower_cased=model_files["module_name"],
-        model_upper_cased=model_upper_cased,
-        config_class=config_class,
-        tokenizer_class=tokenizer_class,
-        image_processor_class=image_processor_class,
-        image_processor_fast_class=image_processor_fast_class,
-        feature_extractor_class=feature_extractor_class,
-        processor_class=processor_class,
+    # Add the config mappings directly as the handling for config is a bit different
+    add_content_to_file(
+        TRANSFORMERS_PATH / "models" / "auto" / "configuration_auto.py",
+        new_content=f'        ("{new_lowercase_name}", "{new_cased_name}Config"),\n',
+        add_after="CONFIG_MAPPING_NAMES = OrderedDict[str, str](\n    [\n        # Add configs here\n",
+    )
+    add_content_to_file(
+        TRANSFORMERS_PATH / "models" / "auto" / "configuration_auto.py",
+        new_content=f'        ("{new_lowercase_name}", "{new_model_paper_name}"),\n',
+        add_after="MODEL_NAMES_MAPPING = OrderedDict[str, str](\n    [\n        # Add full (and cased) model names here\n",
     )
 
-    return {
-        "frameworks": frameworks,
-        "model_classes": model_classes,
-        "model_files": model_files,
-        "model_patterns": model_patterns,
-    }
-
-
-def clean_frameworks_in_init(
-    init_file: Union[str, os.PathLike], frameworks: Optional[list[str]] = None, keep_processing: bool = True
-):
-    """
-    Removes all the import lines that don't belong to a given list of frameworks or concern tokenizers/feature
-    extractors/image processors/processors in an init.
-
-    Args:
-        init_file (`str` or `os.PathLike`): The path to the init to treat.
-        frameworks (`list[str]`, *optional*):
-           If passed, this will remove all imports that are subject to a framework not in frameworks
-        keep_processing (`bool`, *optional*, defaults to `True`):
-            Whether or not to keep the preprocessing (tokenizer, feature extractor, image processor, processor) imports
-            in the init.
-    """
-    if frameworks is None:
-        frameworks = get_default_frameworks()
-
-    names = {"pt": "torch"}
-    to_remove = [names.get(f, f) for f in ["pt", "tf", "flax"] if f not in frameworks]
-    if not keep_processing:
-        to_remove.extend(["sentencepiece", "tokenizers", "vision"])
-
-    if len(to_remove) == 0:
-        # Nothing to do
-        return
-
-    remove_pattern = "|".join(to_remove)
-    re_conditional_imports = re.compile(rf"^\s*if not is_({remove_pattern})_available\(\):\s*$")
-    re_try = re.compile(r"\s*try:")
-    re_else = re.compile(r"\s*else:")
-    re_is_xxx_available = re.compile(rf"is_({remove_pattern})_available")
-
-    with open(init_file, "r", encoding="utf-8") as f:
-        content = f.read()
-
-    lines = content.split("\n")
-    new_lines = []
-    idx = 0
-    while idx < len(lines):
-        # Conditional imports in try-except-else blocks
-        if (re_conditional_imports.search(lines[idx]) is not None) and (re_try.search(lines[idx - 1]) is not None):
-            # Remove the preceding `try:`
-            new_lines.pop()
-            idx += 1
-            # Iterate until `else:`
-            while is_empty_line(lines[idx]) or re_else.search(lines[idx]) is None:
-                idx += 1
-            idx += 1
-            indent = find_indent(lines[idx])
-            while find_indent(lines[idx]) >= indent or is_empty_line(lines[idx]):
-                idx += 1
-        # Remove the import from utils
-        elif re_is_xxx_available.search(lines[idx]) is not None:
-            line = lines[idx]
-            for framework in to_remove:
-                line = line.replace(f", is_{framework}_available", "")
-                line = line.replace(f"is_{framework}_available, ", "")
-                line = line.replace(f"is_{framework}_available,", "")
-                line = line.replace(f"is_{framework}_available", "")
-
-            if len(line.strip()) > 0:
-                new_lines.append(line)
-            idx += 1
-        # Otherwise we keep the line, except if it's a tokenizer import and we don't want to keep it.
-        elif keep_processing or (
-            re.search(r'^\s*"(tokenization|processing|feature_extraction|image_processing)', lines[idx]) is None
-            and re.search(r"^\s*from .(tokenization|processing|feature_extraction|image_processing)", lines[idx])
-            is None
-        ):
-            new_lines.append(lines[idx])
-            idx += 1
-        else:
-            idx += 1
-
-    with open(init_file, "w", encoding="utf-8") as f:
-        f.write("\n".join(new_lines))
-
-
-def add_model_to_main_init(
-    old_model_patterns: ModelPatterns,
-    new_model_patterns: ModelPatterns,
-    frameworks: Optional[list[str]] = None,
-    with_processing: bool = True,
-):
-    """
-    Add a model to the main init of Transformers.
-
-    Args:
-        old_model_patterns (`ModelPatterns`): The patterns for the old model.
-        new_model_patterns (`ModelPatterns`): The patterns for the new model.
-        frameworks (`list[str]`, *optional*):
-            If specified, only the models implemented in those frameworks will be added.
-        with_processing (`bool`, *optional*, defaults to `True`):
-            Whether the tokenizer/feature extractor/processor of the model should also be added to the init or not.
-    """
-    with open(TRANSFORMERS_PATH / "__init__.py", "r", encoding="utf-8") as f:
-        content = f.read()
-
-    lines = content.split("\n")
-    idx = 0
-    new_lines = []
-    framework = None
-    while idx < len(lines):
-        new_framework = False
-        if not is_empty_line(lines[idx]) and find_indent(lines[idx]) == 0:
-            framework = None
-        elif lines[idx].lstrip().startswith("if not is_torch_available"):
-            framework = "pt"
-            new_framework = True
-        elif lines[idx].lstrip().startswith("if not is_tf_available"):
-            framework = "tf"
-            new_framework = True
-        elif lines[idx].lstrip().startswith("if not is_flax_available"):
-            framework = "flax"
-            new_framework = True
-
-        if new_framework:
-            # For a new framework, we need to skip until the else: block to get where the imports are.
-            while lines[idx].strip() != "else:":
-                new_lines.append(lines[idx])
-                idx += 1
-
-        # Skip if we are in a framework not wanted.
-        if framework is not None and frameworks is not None and framework not in frameworks:
-            new_lines.append(lines[idx])
-            idx += 1
-        elif re.search(rf'models.{old_model_patterns.model_lower_cased}( |")', lines[idx]) is not None:
-            block = [lines[idx]]
-            indent = find_indent(lines[idx])
-            idx += 1
-            while find_indent(lines[idx]) > indent:
-                block.append(lines[idx])
-                idx += 1
-            if lines[idx].strip() in [")", "]", "],"]:
-                block.append(lines[idx])
-                idx += 1
-            block = "\n".join(block)
-            new_lines.append(block)
-
-            add_block = True
-            if not with_processing:
-                processing_classes = [
-                    old_model_patterns.tokenizer_class,
-                    old_model_patterns.image_processor_class,
-                    old_model_patterns.image_processor_fast_class,
-                    old_model_patterns.feature_extractor_class,
-                    old_model_patterns.processor_class,
-                ]
-                # Only keep the ones that are not None
-                processing_classes = [c for c in processing_classes if c is not None]
-                for processing_class in processing_classes:
-                    block = block.replace(f' "{processing_class}",', "")
-                    block = block.replace(f', "{processing_class}"', "")
-                    block = block.replace(f" {processing_class},", "")
-                    block = block.replace(f", {processing_class}", "")
-
-                    if processing_class in block:
-                        add_block = False
-            if add_block:
-                new_lines.append(replace_model_patterns(block, old_model_patterns, new_model_patterns)[0])
-        else:
-            new_lines.append(lines[idx])
-            idx += 1
-
-    with open(TRANSFORMERS_PATH / "__init__.py", "w", encoding="utf-8") as f:
-        f.write("\n".join(new_lines))
-
-
-def insert_tokenizer_in_auto_module(old_model_patterns: ModelPatterns, new_model_patterns: ModelPatterns):
-    """
-    Add a tokenizer to the relevant mappings in the auto module.
-
-    Args:
-        old_model_patterns (`ModelPatterns`): The patterns for the old model.
-        new_model_patterns (`ModelPatterns`): The patterns for the new model.
-    """
-    if old_model_patterns.tokenizer_class is None or new_model_patterns.tokenizer_class is None:
-        return
-
-    with open(TRANSFORMERS_PATH / "models" / "auto" / "tokenization_auto.py", "r", encoding="utf-8") as f:
-        content = f.read()
-
-    pattern_tokenizer = re.compile(r"^\s*TOKENIZER_MAPPING_NAMES\s*=\s*OrderedDict\b")
-    lines = content.split("\n")
-    idx = 0
-    # First we get to the TOKENIZER_MAPPING_NAMES block.
-    while not pattern_tokenizer.search(lines[idx]):
-        idx += 1
-    idx += 1
-
-    # That block will end at this prompt:
-    while not lines[idx].startswith("TOKENIZER_MAPPING = _LazyAutoMapping"):
-        # Either all the tokenizer block is defined on one line, in which case, it ends with "),"
-        if lines[idx].endswith(","):
-            block = lines[idx]
-        # Otherwise it takes several lines until we get to a "),"
-        else:
-            block = []
-            # should change to "        )," instead of "            ),"
-            while not lines[idx].startswith("        ),"):
-                block.append(lines[idx])
-                idx += 1
-            # if the lines[idx] does start with "        )," we still need it in our block
-            block.append(lines[idx])
-            block = "\n".join(block)
-        idx += 1
-
-        # If we find the model type and tokenizer class in that block, we have the old model tokenizer block
-        if f'"{old_model_patterns.model_type}"' in block and old_model_patterns.tokenizer_class in block:
-            break
-
-    new_block = block.replace(old_model_patterns.model_type, new_model_patterns.model_type)
-    new_block = new_block.replace(old_model_patterns.tokenizer_class, new_model_patterns.tokenizer_class)
-
-    new_lines = lines[:idx] + [new_block] + lines[idx:]
-    with open(TRANSFORMERS_PATH / "models" / "auto" / "tokenization_auto.py", "w", encoding="utf-8") as f:
-        f.write("\n".join(new_lines))
-
-
-AUTO_CLASSES_PATTERNS = {
-    "configuration_auto.py": [
-        '        ("{model_type}", "{model_name}"),',
-        '        ("{model_type}", "{config_class}"),',
-        '        ("{model_type}", "{pretrained_archive_map}"),',
-    ],
-    "feature_extraction_auto.py": ['        ("{model_type}", "{feature_extractor_class}"),'],
-    "image_processing_auto.py": ['        ("{model_type}", "{image_processor_classes}"),'],
-    "modeling_auto.py": ['        ("{model_type}", "{any_pt_class}"),'],
-    "modeling_tf_auto.py": ['        ("{model_type}", "{any_tf_class}"),'],
-    "modeling_flax_auto.py": ['        ("{model_type}", "{any_flax_class}"),'],
-    "processing_auto.py": ['        ("{model_type}", "{processor_class}"),'],
-}
-
-
-def add_model_to_auto_classes(
-    old_model_patterns: ModelPatterns, new_model_patterns: ModelPatterns, model_classes: dict[str, list[str]]
-):
-    """
-    Add a model to the relevant mappings in the auto module.
-
-    Args:
-        old_model_patterns (`ModelPatterns`): The patterns for the old model.
-        new_model_patterns (`ModelPatterns`): The patterns for the new model.
-        model_classes (`dict[str, list[str]]`): A dictionary framework to list of model classes implemented.
-    """
-    for filename, patterns in AUTO_CLASSES_PATTERNS.items():
-        # Extend patterns with all model classes if necessary
-        new_patterns = []
-        for pattern in patterns:
-            if re.search("any_([a-z]*)_class", pattern) is not None:
-                framework = re.search("any_([a-z]*)_class", pattern).groups()[0]
-                if framework in model_classes:
-                    new_patterns.extend(
-                        [
-                            pattern.replace("{" + f"any_{framework}_class" + "}", cls)
-                            for cls in model_classes[framework]
-                        ]
-                    )
-            elif "{config_class}" in pattern:
-                new_patterns.append(pattern.replace("{config_class}", old_model_patterns.config_class))
-            elif "{image_processor_classes}" in pattern:
-                if (
-                    old_model_patterns.image_processor_class is not None
-                    and new_model_patterns.image_processor_class is not None
-                ):
-                    if (
-                        old_model_patterns.image_processor_fast_class is not None
-                        and new_model_patterns.image_processor_fast_class is not None
-                    ):
-                        new_patterns.append(
-                            pattern.replace(
-                                '"{image_processor_classes}"',
-                                f'("{old_model_patterns.image_processor_class}", "{old_model_patterns.image_processor_fast_class}")',
-                            )
-                        )
-                    else:
-                        new_patterns.append(
-                            pattern.replace(
-                                '"{image_processor_classes}"', f'("{old_model_patterns.image_processor_class}",)'
-                            )
-                        )
-            elif "{feature_extractor_class}" in pattern:
-                if (
-                    old_model_patterns.feature_extractor_class is not None
-                    and new_model_patterns.feature_extractor_class is not None
-                ):
-                    new_patterns.append(
-                        pattern.replace("{feature_extractor_class}", old_model_patterns.feature_extractor_class)
-                    )
-            elif "{processor_class}" in pattern:
-                if old_model_patterns.processor_class is not None and new_model_patterns.processor_class is not None:
-                    new_patterns.append(pattern.replace("{processor_class}", old_model_patterns.processor_class))
-            else:
-                new_patterns.append(pattern)
-
-        # Loop through all patterns.
-        for pattern in new_patterns:
-            full_name = TRANSFORMERS_PATH / "models" / "auto" / filename
-            old_model_line = pattern
-            new_model_line = pattern
-            for attr in ["model_type", "model_name"]:
-                old_model_line = old_model_line.replace("{" + attr + "}", getattr(old_model_patterns, attr))
-                new_model_line = new_model_line.replace("{" + attr + "}", getattr(new_model_patterns, attr))
-            new_model_line = new_model_line.replace(
-                old_model_patterns.model_camel_cased, new_model_patterns.model_camel_cased
+    for filename, to_add in corrected_filenames_to_add:
+        if to_add:
+            # The auto mapping
+            filename = filename.replace("_fast.py", ".py")
+            with open(TRANSFORMERS_PATH / "models" / "auto" / filename) as f:
+                file = f.read()
+            # The regex has to be a bit complex like this as the tokenizer mapping has new lines everywhere
+            matching_lines = re.findall(
+                rf'( {{8,12}}\(\s*"{old_lowercase_name}",.*?\),\n)(?: {{4,12}}\(|\])', file, re.DOTALL
             )
-            add_content_to_file(full_name, new_model_line, add_after=old_model_line)
-
-    # Tokenizers require special handling
-    insert_tokenizer_in_auto_module(old_model_patterns, new_model_patterns)
+            for match in matching_lines:
+                add_content_to_file(
+                    TRANSFORMERS_PATH / "models" / "auto" / filename,
+                    new_content=match.replace(old_lowercase_name, new_lowercase_name).replace(
+                        old_cased_name, new_cased_name
+                    ),
+                    add_after=match,
+                )
 
 
-DOC_OVERVIEW_TEMPLATE = """## Overview
-
-The {model_name} model was proposed in [<INSERT PAPER NAME HERE>](<INSERT PAPER LINK HERE>) by <INSERT AUTHORS HERE>.
-<INSERT SHORT SUMMARY HERE>
-
-The abstract from the paper is the following:
-
-*<INSERT PAPER ABSTRACT HERE>*
-
-Tips:
-
-<INSERT TIPS ABOUT MODEL HERE>
-
-This model was contributed by [INSERT YOUR HF USERNAME HERE](https://huggingface.co/<INSERT YOUR HF USERNAME HERE>).
-The original code can be found [here](<INSERT LINK TO GITHUB REPO HERE>).
-
-"""
-
-
-def duplicate_doc_file(
-    doc_file: Union[str, os.PathLike],
-    old_model_patterns: ModelPatterns,
-    new_model_patterns: ModelPatterns,
-    dest_file: Optional[Union[str, os.PathLike]] = None,
-    frameworks: Optional[list[str]] = None,
-):
+def create_doc_file(new_paper_name: str, public_classes: list[str]):
     """
-    Duplicate a documentation file and adapts it for a new model.
+    Create a new doc file to fill for the new model.
 
     Args:
-        module_file (`str` or `os.PathLike`): Path to the doc file to duplicate.
-        old_model_patterns (`ModelPatterns`): The patterns for the old model.
-        new_model_patterns (`ModelPatterns`): The patterns for the new model.
-        dest_file (`str` or `os.PathLike`, *optional*): Path to the new doc file.
-            Will default to the a file named `{new_model_patterns.model_type}.md` in the same folder as `module_file`.
-        frameworks (`list[str]`, *optional*):
-            If passed, will only keep the model classes corresponding to this list of frameworks in the new doc file.
+        new_paper_name (`str`):
+            The fully cased name (as in the official paper name) of the new model.
+        public_classes (`list[str]`):
+            A list of all the public classes that the model will have in the library.
     """
-    with open(doc_file, "r", encoding="utf-8") as f:
-        content = f.read()
+    added_note = (
+        "\n\n⚠️ Note that this file is in Markdown but contain specific syntax for our doc-builder (similar to MDX) that "
+        "may not be rendered properly in your Markdown viewer.\n\n-->\n\n"
+    )
+    copyright_for_markdown = re.sub(r"# ?", "", COPYRIGHT).replace("coding=utf-8\n", "<!--") + added_note
 
-    content = re.sub(r"<!--\s*Copyright (\d+)\s", f"<!--Copyright {CURRENT_YEAR} ", content)
-    if frameworks is None:
-        frameworks = get_default_frameworks()
-    if dest_file is None:
-        dest_file = Path(doc_file).parent / f"{new_model_patterns.model_type}.md"
+    doc_template = textwrap.dedent(
+        f"""
+        # {new_paper_name}
 
-    # Parse the doc file in blocks. One block per section/header
-    lines = content.split("\n")
-    blocks = []
-    current_block = []
+        ## Overview
 
-    for line in lines:
-        if line.startswith("#"):
-            blocks.append("\n".join(current_block))
-            current_block = [line]
-        else:
-            current_block.append(line)
-    blocks.append("\n".join(current_block))
+        The {new_paper_name} model was proposed in [<INSERT PAPER NAME HERE>](<INSERT PAPER LINK HERE>) by <INSERT AUTHORS HERE>.
+        <INSERT SHORT SUMMARY HERE>
 
-    new_blocks = []
-    in_classes = False
-    for block in blocks:
-        # Copyright
-        if not block.startswith("#"):
-            new_blocks.append(block)
-        # Main title
-        elif re.search(r"^#\s+\S+", block) is not None:
-            new_blocks.append(f"# {new_model_patterns.model_name}\n")
-        # The config starts the part of the doc with the classes.
-        elif not in_classes and old_model_patterns.config_class in block.split("\n")[0]:
-            in_classes = True
-            new_blocks.append(DOC_OVERVIEW_TEMPLATE.format(model_name=new_model_patterns.model_name))
-            new_block, _ = replace_model_patterns(block, old_model_patterns, new_model_patterns)
-            new_blocks.append(new_block)
-        # In classes
-        elif in_classes:
-            in_classes = True
-            block_title = block.split("\n")[0]
-            block_class = re.search(r"^#+\s+(\S.*)$", block_title).groups()[0]
-            new_block, _ = replace_model_patterns(block, old_model_patterns, new_model_patterns)
+        The abstract from the paper is the following:
 
-            if "Tokenizer" in block_class:
-                # We only add the tokenizer if necessary
-                if old_model_patterns.tokenizer_class != new_model_patterns.tokenizer_class:
-                    new_blocks.append(new_block)
-            elif "ImageProcessor" in block_class:
-                # We only add the image processor if necessary
-                if old_model_patterns.image_processor_class != new_model_patterns.image_processor_class:
-                    new_blocks.append(new_block)
-            elif "ImageProcessorFast" in block_class:
-                # We only add the image processor if necessary
-                if old_model_patterns.image_processor_fast_class != new_model_patterns.image_processor_fast_class:
-                    new_blocks.append(new_block)
-            elif "FeatureExtractor" in block_class:
-                # We only add the feature extractor if necessary
-                if old_model_patterns.feature_extractor_class != new_model_patterns.feature_extractor_class:
-                    new_blocks.append(new_block)
-            elif "Processor" in block_class:
-                # We only add the processor if necessary
-                if old_model_patterns.processor_class != new_model_patterns.processor_class:
-                    new_blocks.append(new_block)
-            elif block_class.startswith("Flax"):
-                # We only add Flax models if in the selected frameworks
-                if "flax" in frameworks:
-                    new_blocks.append(new_block)
-            elif block_class.startswith("TF"):
-                # We only add TF models if in the selected frameworks
-                if "tf" in frameworks:
-                    new_blocks.append(new_block)
-            elif len(block_class.split(" ")) == 1:
-                # We only add PyTorch models if in the selected frameworks
-                if "pt" in frameworks:
-                    new_blocks.append(new_block)
-            else:
-                new_blocks.append(new_block)
+        <INSERT PAPER ABSTRACT HERE>
 
-    with open(dest_file, "w", encoding="utf-8") as f:
-        f.write("\n".join(new_blocks))
+        Tips:
+
+        <INSERT TIPS ABOUT MODEL HERE>
+
+        This model was contributed by [INSERT YOUR HF USERNAME HERE](https://huggingface.co/<INSERT YOUR HF USERNAME HERE>).
+        The original code can be found [here](<INSERT LINK TO GITHUB REPO HERE>).
+
+        ## Usage examples
+
+        <INSERT SOME NICE EXAMPLES HERE>
+
+        """
+    )
+
+    # Add public classes doc
+    doc_for_classes = []
+    for class_ in public_classes:
+        doc = f"## {class_}\n\n[[autodoc]] {class_}"
+        if "Model" in class_:
+            doc += "\n    - forward"
+        doc_for_classes.append(doc)
+
+    class_doc = "\n\n".join(doc_for_classes)
+
+    return copyright_for_markdown + doc_template + class_doc
 
 
-def insert_model_in_doc_toc(old_model_patterns, new_model_patterns):
+def insert_model_in_doc_toc(old_lowercase_name: str, new_lowercase_name: str, new_model_paper_name: str):
     """
-    Insert the new model in the doc TOC, in the same section as the old model.
+    Insert the new model in the doc `_toctree.yml`, in the same section as the old one (or print a message if missing).
 
     Args:
-        old_model_patterns (`ModelPatterns`): The patterns for the old model.
-        new_model_patterns (`ModelPatterns`): The patterns for the new model.
+        old_lowercase_name (`str`):
+            The old lowercase model name.
+        new_lowercase_name (`str`):
+            The new lowercase model name.
+        new_model_paper_name (`str`):
+            The fully cased name (as in the official paper name) of the new model.
     """
     toc_file = REPO_PATH / "docs" / "source" / "en" / "_toctree.yml"
-    with open(toc_file, "r", encoding="utf8") as f:
-        content = yaml.safe_load(f)
+    content = toc_file.read_text(encoding="utf-8")
 
-    # Get to the model API doc
-    api_idx = 0
-    while content[api_idx]["title"] != "API":
-        api_idx += 1
-    api_doc = content[api_idx]["sections"]
+    toc_match = re.search(rf"- local: model_doc/{re.escape(old_lowercase_name)}\n {{8}}title: .*?\n", content)
+    if toc_match is None:
+        print(f"Did not find {old_lowercase_name} in the doc toc, please add {new_lowercase_name} manually.")
+        return
+    new_toc = f"      - local: model_doc/{new_lowercase_name}\n        title: {new_model_paper_name}\n"
+    add_content_to_file(toc_file, new_content=new_toc, add_after=toc_match.group(0))
 
-    model_idx = 0
-    while api_doc[model_idx]["title"] != "Models":
-        model_idx += 1
-    model_doc = api_doc[model_idx]["sections"]
 
-    # Find the base model in the Toc
-    old_model_type = old_model_patterns.model_type
-    section_idx = 0
-    while section_idx < len(model_doc):
-        sections = [entry["local"] for entry in model_doc[section_idx]["sections"]]
-        if f"model_doc/{old_model_type}" in sections:
-            break
+def create_init_file(old_lowercase_name: str, new_lowercase_name: str, filenames_to_add: list[tuple[str, bool]]):
+    """
+    Create the `__init__.py` file to add in the new model folder.
 
-        section_idx += 1
+    Args:
+        old_lowercase_name (`str`):
+            The old lowercase model name.
+        new_lowercase_name (`str`):
+            The new lowercase model name.
+        filenames_to_add (`list[tuple[str, bool]]`):
+            A list of tuples of all potential filenames to add for a new model, along a boolean flag describing if we
+            should add this file or not. For example, [(`modeling_xxx.py`, True), (`configuration_xxx.py`, True), (`tokenization_xxx.py`, False),...]
+    """
+    filenames_to_add = [
+        (filename.replace(old_lowercase_name, new_lowercase_name).replace(".py", ""), to_add)
+        for filename, to_add in filenames_to_add
+    ]
+    imports = "\n            ".join(f"from .{file} import *" for file, to_add in filenames_to_add if to_add)
+    init_file = COPYRIGHT + textwrap.dedent(
+        f"""
+        from typing import TYPE_CHECKING
 
-    if section_idx == len(model_doc):
-        old_model = old_model_patterns.model_name
-        new_model = new_model_patterns.model_name
-        print(f"Did not find {old_model} in the table of content, so you will need to add {new_model} manually.")
-        return
+        from ...utils import _LazyModule
+        from ...utils.import_utils import define_import_structure
 
-    # Add the new model in the same toc
-    toc_entry = {"local": f"model_doc/{new_model_patterns.model_type}", "title": new_model_patterns.model_name}
-    model_doc[section_idx]["sections"].append(toc_entry)
-    model_doc[section_idx]["sections"] = sorted(model_doc[section_idx]["sections"], key=lambda s: s["title"].lower())
-    api_doc[model_idx]["sections"] = model_doc
-    content[api_idx]["sections"] = api_doc
 
-    with open(toc_file, "w", encoding="utf-8") as f:
-        f.write(yaml.dump(content, allow_unicode=True))
+        if TYPE_CHECKING:
+            {imports}
+        else:
+            import sys
+
+            _file = globals()["__file__"]
+            sys.modules[__name__] = _LazyModule(__name__, _file, define_import_structure(_file), module_spec=__spec__)
+        """
+    )
+    return init_file
+
+
+def find_all_classes_from_file(module_name: str) -> tuple:
+    """
+    Find the name of all classes defined in `module_name`. Returns a tuple `(classes, public_classes)`, where the
+    second item only contains the public ones (defined in `__all__`).
+
+    Args:
+        module_name (`str`):
+            The full path to the python module from which to extract classes.
+    """
+    with open(module_name, "r", encoding="utf-8") as file:
+        source_code = file.read()
+    visitor = ClassFinder()
+    cst.parse_module(source_code).visit(visitor)
+    return visitor.classes, visitor.public_classes
+
+
+def find_modular_structure(
+    module_name: str, old_model_infos: ModelInfos, new_cased_name: str
+) -> tuple[str, str, list]:
+    """
+    Build the pieces needed to copy the file `module_name` using modular: the import statement, the subclass
+    definitions (one per class found in the file), and the public class names renamed for the new model.
+
+    Args:
+        module_name (`str`):
+            The full path to the python module to copy with modular (its `.parts` is used, so a `Path`-like object).
+        old_model_infos (`ModelInfos`):
+            The structure containing the class informations of the old model.
+        new_cased_name (`str`):
+            The new cased model name.
+    """
+    class_names, exported_names = find_all_classes_from_file(module_name)
+    # Only the last two path components are kept for the import location, without the `.py` extension
+    relative_module = ".".join(module_name.parts[-2:]).replace(".py", "")
+    old_cased_name = old_model_infos.camelcase_name
+    imports = f"from ..{relative_module} import {', '.join(class_names)}"
+    subclasses = [f"class {name.replace(old_cased_name, new_cased_name)}({name}):\n    pass" for name in class_names]
+    renamed_public = [name.replace(old_cased_name, new_cased_name) for name in exported_names]
+    return imports, "\n\n".join(subclasses), renamed_public
+
+
+def create_modular_file(
+    old_model_infos: ModelInfos,
+    new_lowercase_name: str,
+    filenames_to_add: list[tuple[str, bool]],
+) -> tuple[str, list[str]]:
+    """
+    Create the content of a new modular file which copies the old model by subclassing each of its classes, based on
+    the new name and the filenames (modules) to add. Returns it along with the names of the new public classes.
+
+    Args:
+        old_model_infos (`ModelInfos`):
+            The structure containing the class informations of the old model.
+        new_lowercase_name (`str`):
+            The new lowercase model name.
+        filenames_to_add (`list[tuple[str, bool]]`):
+            A list of tuples of all potential filenames to add for a new model, along a boolean flag describing if we
+            should add this file or not. For example, [(`modeling_xxx.py`, True), (`configuration_xxx.py`, True), (`tokenization_xxx.py`, False),...]
+    """
+    new_cased_name = "".join(x.title() for x in new_lowercase_name.replace("-", "_").split("_"))
+    old_lowercase_name = old_model_infos.lowercase_name
+    old_folder_root = TRANSFORMERS_PATH / "models" / old_lowercase_name
+
+    # Construct the modular file from the original (old) model, by subclassing each class
+    all_imports = ""
+    all_bodies = ""
+    all_public_classes = []
+    for filename, to_add in filenames_to_add:
+        if to_add:
+            imports, body, public_classes = find_modular_structure(
+                old_folder_root / filename, old_model_infos, new_cased_name
+            )
+            all_imports += f"\n{imports}"
+            all_bodies += f"\n\n{body}"
+            all_public_classes.extend(public_classes)
+
+    # Create the __all__ assignment (one entry per line, indented to match the template before it is dedented)
+    public_classes_formatted = "\n            ".join(f"{public_class}," for public_class in all_public_classes)
+    all_statement = textwrap.dedent(
+        f"""
+
+        __all__ = [
+            {public_classes_formatted}
+        ]
+        """
+    )
+    # Create the whole modular file
+    modular_file = COPYRIGHT + all_imports + all_bodies + all_statement
+    # Remove outer explicit quotes "" around the public class names before returning them
+    all_public_classes = [public_class.replace('"', "") for public_class in all_public_classes]
+    return modular_file, all_public_classes
+
+
+def create_test_files(old_model_infos: ModelInfos, new_lowercase_name: str, filenames_to_add: list[tuple[str, bool]]):
+    """
+    Create the test files for the new model, returned as a dict mapping each new test filename to its content. It
+    basically copies over the old test files and adjust the class names.
+
+    Args:
+        old_model_infos (`ModelInfos`):
+            The structure containing the class informations of the old model.
+        new_lowercase_name (`str`):
+            The new lowercase model name.
+        filenames_to_add (`list[tuple[str, bool]]`):
+            A list of tuples of all potential filenames to add for a new model, along a boolean flag describing if we
+            should add this file or not. For example, [(`modeling_xxx.py`, True), (`configuration_xxx.py`, True), (`tokenization_xxx.py`, False),...]
+    """
+    new_cased_name = "".join(x.title() for x in new_lowercase_name.replace("-", "_").split("_"))
+    old_lowercase_name = old_model_infos.lowercase_name
+    old_cased_name = old_model_infos.camelcase_name
+    filenames_to_add = [
+        ("test_" + filename.replace(old_lowercase_name, new_lowercase_name), to_add)
+        for filename, to_add in filenames_to_add[1:]
+    ]
+    # Fast tokenizer/image processor share the test file of the slow one (listed just before): merge their flags
+    corrected_filenames_to_add = []
+    for file, to_add in filenames_to_add:
+        if re.search(rf"test_(?:tokenization|image_processing)_{re.escape(new_lowercase_name)}_fast\.py", file):
+            previous_file, previous_to_add = corrected_filenames_to_add[-1]
+            corrected_filenames_to_add[-1] = (previous_file, previous_to_add or to_add)
+        else:
+            corrected_filenames_to_add.append((file, to_add))
+
+    test_files = {}
+    for new_file, to_add in corrected_filenames_to_add:
+        if to_add:
+            original_test_file = new_file.replace(new_lowercase_name, old_lowercase_name)
+            original_test_path = REPO_PATH / "tests" / "models" / old_lowercase_name / original_test_file
+            # Sometimes, tests may not exist
+            if not original_test_path.is_file():
+                continue
+            test_code = original_test_path.read_text()
+            # Remove old copyright and add new one
+            test_lines = test_code.split("\n")
+            idx = 0
+            while idx < len(test_lines) and test_lines[idx].startswith("#"):
+                idx += 1
+            test_code = COPYRIGHT + "\n".join(test_lines[idx:])
+            test_files[new_file] = test_code.replace(old_cased_name, new_cased_name)
+
+    return test_files
 
 
 def create_new_model_like(
-    model_type: str,
-    new_model_patterns: ModelPatterns,
-    add_copied_from: bool = True,
-    frameworks: Optional[list[str]] = None,
-    old_checkpoint: Optional[str] = None,
-    create_fast_image_processor: bool = False,
+    old_model_infos: ModelInfos,
+    new_lowercase_name: str,
+    new_model_paper_name: str,
+    filenames_to_add: list[tuple[str, bool]],
+    create_fast_image_processor: bool,
 ):
     """
     Creates a new model module like a given model of the Transformers library.
 
     Args:
-        model_type (`str`): The model type to duplicate (like "bert" or "gpt2")
-        new_model_patterns (`ModelPatterns`): The patterns for the new model.
-        add_copied_from (`bool`, *optional*, defaults to `True`):
-            Whether or not to add "Copied from" statements to all classes in the new model modeling files.
-        frameworks (`list[str]`, *optional*):
-            If passed, will limit the duplicate to the frameworks specified.
-        old_checkpoint (`str`, *optional*):
-            The name of the base checkpoint for the old model. Should be passed along when it can't be automatically
-            recovered from the `model_type`.
-        create_fast_image_processor (`bool`, *optional*, defaults to `False`):
-            Whether or not to add a fast image processor to the new model, if the old model had only a slow one.
+        old_model_infos (`ModelInfos`):
+            The structure containing the class informations of the old model.
+        new_lowercase_name (`str`):
+            The new lowercase model name.
+        new_model_paper_name (`str`):
+            The fully cased name (as in the official paper name) of the new model.
+        filenames_to_add (`list[tuple[str, bool]]`):
+            A list of tuples of all potential filenames to add for a new model, along a boolean flag describing if we
+            should add this file or not. For example, [(`modeling_xxx.py`, True), (`configuration_xxx.py`, True), (`tokenization_xxx.py`, False),...]
+        create_fast_image_processor (`bool`):
+            If it makes sense, whether to add a fast processor as well, even if the old model does not have one.
     """
-    # Retrieve all the old model info.
-    model_info = retrieve_info_for_model(model_type, frameworks=frameworks)
-    model_files = model_info["model_files"]
-    old_model_patterns = model_info["model_patterns"]
-    if old_checkpoint is not None:
-        old_model_patterns.checkpoint = old_checkpoint
-    if len(old_model_patterns.checkpoint) == 0:
-        raise ValueError(
-            "The old model checkpoint could not be recovered from the model type. Please pass it to the "
-            "`old_checkpoint` argument."
-        )
+    # As the import was protected, raise if not present (as it's actually a hard dependency for this command)
+    if not is_libcst_available():
+        raise ValueError("You need to install `libcst` to run this command -> `pip install libcst`")
 
-    keep_old_processing = True
-    for processing_attr in [
-        "image_processor_class",
-        "image_processor_fast_class",
-        "feature_extractor_class",
-        "processor_class",
-        "tokenizer_class",
-    ]:
-        if getattr(old_model_patterns, processing_attr) != getattr(new_model_patterns, processing_attr):
-            keep_old_processing = False
+    old_lowercase_name = old_model_infos.lowercase_name
 
-    model_classes = model_info["model_classes"]
+    # 1. We create the folder for our new model
+    new_module_folder = TRANSFORMERS_PATH / "models" / new_lowercase_name
+    os.makedirs(new_module_folder, exist_ok=True)
 
-    # 1. We create the module for our new model.
-    old_module_name = model_files["module_name"]
-    module_folder = TRANSFORMERS_PATH / "models" / new_model_patterns.model_lower_cased
-    os.makedirs(module_folder, exist_ok=True)
+    # 2. Create and add the modular file
+    modular_file, public_classes = create_modular_file(old_model_infos, new_lowercase_name, filenames_to_add)
+    with open(new_module_folder / f"modular_{new_lowercase_name}.py", "w") as f:
+        f.write(modular_file)
 
-    files_to_adapt = model_files["model_files"]
-    if keep_old_processing:
-        files_to_adapt = [
-            f
-            for f in files_to_adapt
-            if "tokenization" not in str(f)
-            and "processing" not in str(f)
-            and "feature_extraction" not in str(f)
-            and "image_processing" not in str(f)
-        ]
+    # 3. Create and add the __init__.py
+    init_file = create_init_file(old_lowercase_name, new_lowercase_name, filenames_to_add)
+    with open(new_module_folder / "__init__.py", "w") as f:
+        f.write(init_file)
 
-    os.makedirs(module_folder, exist_ok=True)
-    for module_file in files_to_adapt:
-        new_module_name = module_file.name.replace(
-            old_model_patterns.model_lower_cased, new_model_patterns.model_lower_cased
-        )
-        dest_file = module_folder / new_module_name
-        duplicate_module(
-            module_file,
-            old_model_patterns,
-            new_model_patterns,
-            dest_file=dest_file,
-            add_copied_from=add_copied_from and "modeling" in new_module_name,
-        )
-
-    clean_frameworks_in_init(
-        module_folder / "__init__.py", frameworks=frameworks, keep_processing=not keep_old_processing
-    )
-
-    # 2. We add our new model to the models init and the main init
+    # 4. Add new model to the models init
     add_content_to_file(
         TRANSFORMERS_PATH / "models" / "__init__.py",
-        f"    {new_model_patterns.model_lower_cased},",
-        add_after=f"    {old_module_name},",
-        exact_match=True,
-    )
-    add_model_to_main_init(
-        old_model_patterns, new_model_patterns, frameworks=frameworks, with_processing=not keep_old_processing
+        new_content=f"    from .{new_lowercase_name} import *\n",
+        add_after="if TYPE_CHECKING:\n",
     )
 
-    # 3. Add test files
-    files_to_adapt = model_files["test_files"]
-    if keep_old_processing:
-        files_to_adapt = [
-            f
-            for f in files_to_adapt
-            if "tokenization" not in str(f)
-            and "processor" not in str(f)
-            and "feature_extraction" not in str(f)
-            and "image_processing" not in str(f)
-        ]
+    # 5. Add model to auto mappings
+    add_model_to_auto_mappings(old_model_infos, new_lowercase_name, new_model_paper_name, filenames_to_add)
 
-    def disable_fx_test(filename: Path) -> bool:
-        with open(filename) as fp:
-            content = fp.read()
-        new_content = re.sub(r"fx_compatible\s*=\s*True", "fx_compatible = False", content)
-        with open(filename, "w") as fp:
-            fp.write(new_content)
-        return content != new_content
-
-    disabled_fx_test = False
-
-    tests_folder = REPO_PATH / "tests" / "models" / new_model_patterns.model_lower_cased
+    # 6. Add test files
+    tests_folder = REPO_PATH / "tests" / "models" / new_lowercase_name
     os.makedirs(tests_folder, exist_ok=True)
+    # Add empty __init__.py
     with open(tests_folder / "__init__.py", "w"):
         pass
+    test_files = create_test_files(old_model_infos, new_lowercase_name, filenames_to_add)
+    for filename, content in test_files.items():
+        with open(tests_folder / filename, "w") as f:
+            f.write(content)
 
-    for test_file in files_to_adapt:
-        new_test_file_name = test_file.name.replace(
-            old_model_patterns.model_lower_cased, new_model_patterns.model_lower_cased
-        )
-        dest_file = test_file.parent.parent / new_model_patterns.model_lower_cased / new_test_file_name
-        duplicate_module(
-            test_file,
-            old_model_patterns,
-            new_model_patterns,
-            dest_file=dest_file,
-            add_copied_from=False,
-            attrs_to_remove=["pipeline_model_mapping", "is_pipeline_test_to_skip"],
-        )
-        disabled_fx_test = disabled_fx_test | disable_fx_test(dest_file)
+    # 7. Add doc file
+    doc_file = create_doc_file(new_model_paper_name, public_classes)
+    with open(REPO_PATH / "docs" / "source" / "en" / "model_doc" / f"{new_lowercase_name}.md", "w") as f:
+        f.write(doc_file)
+    insert_model_in_doc_toc(old_lowercase_name, new_lowercase_name, new_model_paper_name)
 
-    if disabled_fx_test:
-        print(
-            "The tests for symbolic tracing with torch.fx were disabled, you can add those once symbolic tracing works"
-            " for your new model."
-        )
-
-    # 4. Add model to auto classes
-    add_model_to_auto_classes(old_model_patterns, new_model_patterns, model_classes)
-
-    # 5. Add doc file
-    doc_file = REPO_PATH / "docs" / "source" / "en" / "model_doc" / f"{old_model_patterns.model_type}.md"
-    duplicate_doc_file(doc_file, old_model_patterns, new_model_patterns, frameworks=frameworks)
-    insert_model_in_doc_toc(old_model_patterns, new_model_patterns)
-
-    # 6. Add fast image processor if necessary
+    # 8. Add additional fast image processor if necessary
     if create_fast_image_processor:
-        add_fast_image_processor(model_name=new_model_patterns.model_lower_cased)
+        add_fast_image_processor(model_name=new_lowercase_name)
 
-    # 7. Warn the user for duplicate patterns
-    if old_model_patterns.model_type == old_model_patterns.checkpoint:
-        print(
-            "The model you picked has the same name for the model type and the checkpoint name "
-            f"({old_model_patterns.model_type}). As a result, it's possible some places where the new checkpoint "
-            f"should be, you have {new_model_patterns.model_type} instead. You should search for all instances of "
-            f"{new_model_patterns.model_type} in the new files and check they're not badly used as checkpoints."
-        )
-    elif old_model_patterns.model_lower_cased == old_model_patterns.checkpoint:
-        print(
-            "The model you picked has the same name for the model type and the checkpoint name "
-            f"({old_model_patterns.model_lower_cased}). As a result, it's possible some places where the new "
-            f"checkpoint should be, you have {new_model_patterns.model_lower_cased} instead. You should search for "
-            f"all instances of {new_model_patterns.model_lower_cased} in the new files and check they're not badly "
-            "used as checkpoints."
-        )
-    if (
-        old_model_patterns.model_type == old_model_patterns.model_lower_cased
-        and new_model_patterns.model_type != new_model_patterns.model_lower_cased
-    ):
-        print(
-            "The model you picked has the same name for the model type and the lowercased model name "
-            f"({old_model_patterns.model_lower_cased}). As a result, it's possible some places where the new "
-            f"model type should be, you have {new_model_patterns.model_lower_cased} instead. You should search for "
-            f"all instances of {new_model_patterns.model_lower_cased} in the new files and check they're not badly "
-            "used as the model type."
-        )
+    # 9. Run linters
+    model_init_file = TRANSFORMERS_PATH / "models" / "__init__.py"
+    subprocess.run(
+        ["ruff", "check", new_module_folder, tests_folder, model_init_file, "--fix"],
+        cwd=REPO_PATH,
+        stdout=subprocess.DEVNULL,
+    )
+    subprocess.run(
+        ["ruff", "format", new_module_folder, tests_folder, model_init_file],
+        cwd=REPO_PATH,
+        stdout=subprocess.DEVNULL,
+    )
+    subprocess.run(
+        ["python", "utils/check_doc_toc.py", "--fix_and_overwrite"], cwd=REPO_PATH, stdout=subprocess.DEVNULL
+    )
+    subprocess.run(["python", "utils/sort_auto_mappings.py"], cwd=REPO_PATH, stdout=subprocess.DEVNULL)
 
-    if not keep_old_processing and old_model_patterns.tokenizer_class is not None:
-        print(
-            "The constants at the start of the new tokenizer file created needs to be manually fixed. If your new "
-            "model has a tokenizer fast, you will also need to manually add the converter in the "
-            "`SLOW_TO_FAST_CONVERTERS` constant of `convert_slow_tokenizer.py`."
-        )
-
-
-def add_new_model_like_command_factory(args: Namespace):
-    return AddNewModelLikeCommand(config_file=args.config_file, path_to_repo=args.path_to_repo)
-
-
-class AddNewModelLikeCommand(BaseTransformersCLICommand):
-    @staticmethod
-    def register_subcommand(parser: ArgumentParser):
-        add_new_model_like_parser = parser.add_parser("add-new-model-like")
-        add_new_model_like_parser.add_argument(
-            "--config_file", type=str, help="A file with all the information for this model creation."
-        )
-        add_new_model_like_parser.add_argument(
-            "--path_to_repo", type=str, help="When not using an editable install, the path to the Transformers repo."
-        )
-        add_new_model_like_parser.set_defaults(func=add_new_model_like_command_factory)
-
-    def __init__(self, config_file=None, path_to_repo=None, *args):
-        if config_file is not None:
-            with open(config_file, "r", encoding="utf-8") as f:
-                config = json.load(f)
-            self.old_model_type = config["old_model_type"]
-            self.model_patterns = ModelPatterns(**config["new_model_patterns"])
-            self.add_copied_from = config.get("add_copied_from", True)
-            self.frameworks = config.get("frameworks", get_default_frameworks())
-            self.old_checkpoint = config.get("old_checkpoint", None)
-        else:
-            (
-                self.old_model_type,
-                self.model_patterns,
-                self.add_copied_from,
-                self.frameworks,
-                self.old_checkpoint,
-                self.create_fast_image_processor,
-            ) = get_user_input()
-
-        self.path_to_repo = path_to_repo
-
-    def run(self):
-        if self.path_to_repo is not None:
-            # Adapt constants
-            global TRANSFORMERS_PATH
-            global REPO_PATH
-
-            REPO_PATH = Path(self.path_to_repo)
-            TRANSFORMERS_PATH = REPO_PATH / "src" / "transformers"
-
-        create_new_model_like(
-            model_type=self.old_model_type,
-            new_model_patterns=self.model_patterns,
-            add_copied_from=self.add_copied_from,
-            frameworks=self.frameworks,
-            old_checkpoint=self.old_checkpoint,
-            create_fast_image_processor=self.create_fast_image_processor,
-        )
+    # 10. Run the modular conversion
+    subprocess.run(
+        ["python", "utils/modular_model_converter.py", new_lowercase_name], cwd=REPO_PATH, stdout=subprocess.DEVNULL
+    )
 
 
 def get_user_field(
     question: str,
     default_value: Optional[str] = None,
-    is_valid_answer: Optional[Callable] = None,
     convert_to: Optional[Callable] = None,
     fallback_message: Optional[str] = None,
 ) -> Any:
@@ -1575,10 +582,10 @@ def get_user_field(
     answer.
 
     Args:
-        question (`str`): The question to ask the user.
-        default_value (`str`, *optional*): A potential default value that will be used when the answer is empty.
-        is_valid_answer (`Callable`, *optional*):
-            If set, the question will be asked until this function returns `True` on the provided answer.
+        question (`str`):
+            The question to ask the user.
+        default_value (`str`, *optional*):
+            A potential default value that will be used when the answer is empty.
         convert_to (`Callable`, *optional*):
             If set, the answer will be passed to this function. If this function raises an error on the provided
             answer, the question will be asked again.
@@ -1598,9 +605,7 @@ def get_user_field(
         answer = input(question)
         if default_value is not None and len(answer) == 0:
             answer = default_value
-        if is_valid_answer is not None:
-            valid_answer = is_valid_answer(answer)
-        elif convert_to is not None:
+        if convert_to is not None:
             try:
                 answer = convert_to(answer)
                 valid_answer = True
@@ -1630,13 +635,13 @@ def get_user_input():
     """
     Ask the user for the necessary inputs to add the new model.
     """
-    model_types = list(auto_module.configuration_auto.MODEL_NAMES_MAPPING.keys())
+    model_types = list(MODEL_NAMES_MAPPING.keys())
 
     # Get old model type
     valid_model_type = False
     while not valid_model_type:
         old_model_type = input(
-            "What is the model you would like to duplicate? Please provide the lowercase `model_type` (e.g. roberta): "
+            "What model would you like to duplicate? Please provide it as lowercase, e.g. `llama`): "
         )
         if old_model_type in model_types:
             valid_model_type = True
@@ -1648,156 +653,131 @@ def get_user_input():
                     near_choices = " or ".join(near_choices)
                 print(f"Did you mean {near_choices}?")
 
-    old_model_info = retrieve_info_for_model(old_model_type)
-    old_tokenizer_class = old_model_info["model_patterns"].tokenizer_class
-    old_image_processor_class = old_model_info["model_patterns"].image_processor_class
-    old_image_processor_fast_class = old_model_info["model_patterns"].image_processor_fast_class
-    old_feature_extractor_class = old_model_info["model_patterns"].feature_extractor_class
-    old_processor_class = old_model_info["model_patterns"].processor_class
-    old_frameworks = old_model_info["frameworks"]
+    old_model_infos = ModelInfos(old_model_type)
 
-    old_checkpoint = None
-    if len(old_model_info["model_patterns"].checkpoint) == 0:
-        old_checkpoint = get_user_field(
-            "We couldn't find the name of the base checkpoint for that model, please enter it here."
+    # Ask for the new model name
+    new_lowercase_name = get_user_field(
+        "What is the new model name? Please provide it as snake lowercase, e.g. `new_model`?"
+    )
+    new_model_paper_name = get_user_field(
+        "What is the fully cased name you would like to appear in the doc (e.g. `NeW ModEl`)? ",
+        default_value="".join(x.title() for x in new_lowercase_name.split("_")),
+    )
+
+    # Ask if we want to add individual processor classes as well
+    add_tokenizer = False
+    add_fast_tokenizer = False
+    add_image_processor = False
+    add_fast_image_processor = False
+    add_video_processor = False
+    add_feature_extractor = False
+    add_processor = False
+    if old_model_infos.tokenizer_class is not None:
+        add_tokenizer = get_user_field(
+            f"Do you want to create a new tokenizer? If `no`, it will use the same as {old_model_type} (y/n)?",
+            convert_to=convert_to_bool,
+            fallback_message="Please answer yes/no, y/n, true/false or 1/0. ",
+        )
+    if old_model_infos.fast_tokenizer_class is not None:
+        add_fast_tokenizer = get_user_field(
+            f"Do you want to create a new fast tokenizer? If `no`, it will use the same as {old_model_type} (y/n)?",
+            convert_to=convert_to_bool,
+            fallback_message="Please answer yes/no, y/n, true/false or 1/0. ",
+        )
+    if old_model_infos.image_processor_class is not None:
+        add_image_processor = get_user_field(
+            f"Do you want to create a new image processor? If `no`, it will use the same as {old_model_type} (y/n)?",
+            convert_to=convert_to_bool,
+            fallback_message="Please answer yes/no, y/n, true/false or 1/0. ",
+        )
+    if old_model_infos.fast_image_processor_class is not None:
+        add_fast_image_processor = get_user_field(
+            f"Do you want to create a new fast image processor? If `no`, it will use the same as {old_model_type} (y/n)?",
+            convert_to=convert_to_bool,
+            fallback_message="Please answer yes/no, y/n, true/false or 1/0. ",
+        )
+    if old_model_infos.video_processor_class is not None:
+        add_video_processor = get_user_field(
+            f"Do you want to create a new video processor? If `no`, it will use the same as {old_model_type} (y/n)?",
+            convert_to=convert_to_bool,
+            fallback_message="Please answer yes/no, y/n, true/false or 1/0. ",
+        )
+    if old_model_infos.feature_extractor_class is not None:
+        add_feature_extractor = get_user_field(
+            f"Do you want to create a new feature extractor? If `no`, it will use the same as {old_model_type} (y/n)?",
+            convert_to=convert_to_bool,
+            fallback_message="Please answer yes/no, y/n, true/false or 1/0. ",
+        )
+    if old_model_infos.processor_class is not None:
+        add_processor = get_user_field(
+            f"Do you want to create a new processor? If `no`, it will use the same as {old_model_type} (y/n)?",
+            convert_to=convert_to_bool,
+            fallback_message="Please answer yes/no, y/n, true/false or 1/0. ",
         )
 
-    model_name = get_user_field(
-        "What is the name (with no special casing) for your new model in the paper (e.g. RoBERTa)? "
-    )
-    default_patterns = ModelPatterns(model_name, model_name)
-
-    model_type = get_user_field(
-        "What identifier would you like to use for the `model_type` of this model? ",
-        default_value=default_patterns.model_type,
-    )
-    model_lower_cased = get_user_field(
-        "What lowercase name would you like to use for the module (folder) of this model? ",
-        default_value=default_patterns.model_lower_cased,
-    )
-    model_camel_cased = get_user_field(
-        "What prefix (camel-cased) would you like to use for the model classes of this model (e.g. Roberta)? ",
-        default_value=default_patterns.model_camel_cased,
-    )
-    model_upper_cased = get_user_field(
-        "What prefix (upper-cased) would you like to use for the constants relative to this model? ",
-        default_value=default_patterns.model_upper_cased,
-    )
-    config_class = get_user_field(
-        "What will be the name of the config class for this model? ", default_value=f"{model_camel_cased}Config"
-    )
-    checkpoint = get_user_field(
-        "Please give a checkpoint identifier (on the model Hub) for this new model (e.g. facebook/FacebookAI/roberta-base): "
+    old_lowercase_name = old_model_infos.lowercase_name
+    # A list of the old filenames, along with whether we should copy them or not
+    filenames_to_add = (
+        (f"configuration_{old_lowercase_name}.py", True),
+        (f"modeling_{old_lowercase_name}.py", True),
+        (f"tokenization_{old_lowercase_name}.py", add_tokenizer),
+        (f"tokenization_{old_lowercase_name}_fast.py", add_fast_tokenizer),
+        (f"image_processing_{old_lowercase_name}.py", add_image_processor),
+        (f"image_processing_{old_lowercase_name}_fast.py", add_fast_image_processor),
+        (f"video_processing_{old_lowercase_name}.py", add_video_processor),
+        (f"feature_extraction_{old_lowercase_name}.py", add_feature_extractor),
+        (f"processing_{old_lowercase_name}.py", add_processor),
     )
 
-    old_processing_classes = [
-        c if not isinstance(c, tuple) else c[0]
-        for c in [
-            old_image_processor_class,
-            old_image_processor_fast_class,
-            old_feature_extractor_class,
-            old_tokenizer_class,
-            old_processor_class,
-        ]
-        if c is not None
-    ]
-    old_processing_classes = ", ".join(old_processing_classes)
-    keep_processing = get_user_field(
-        f"Will your new model use the same processing class as {old_model_type} ({old_processing_classes}) (yes/no)? ",
-        convert_to=convert_to_bool,
-        fallback_message="Please answer yes/no, y/n, true/false or 1/0. ",
-    )
-    if keep_processing:
-        image_processor_class = old_image_processor_class
-        image_processor_fast_class = old_image_processor_fast_class
-        feature_extractor_class = old_feature_extractor_class
-        processor_class = old_processor_class
-        tokenizer_class = old_tokenizer_class
-        create_fast_image_processor = False
-    else:
-        if old_tokenizer_class is not None:
-            tokenizer_class = get_user_field(
-                "What will be the name of the tokenizer class for this model? ",
-                default_value=f"{model_camel_cased}Tokenizer",
-            )
-        else:
-            tokenizer_class = None
-        if old_image_processor_class is not None:
-            image_processor_class = get_user_field(
-                "What will be the name of the image processor class for this model? ",
-                default_value=f"{model_camel_cased}ImageProcessor",
-            )
-        else:
-            image_processor_class = None
-        if old_image_processor_fast_class is not None:
-            image_processor_fast_class = get_user_field(
-                "What will be the name of the fast image processor class for this model? ",
-                default_value=f"{model_camel_cased}ImageProcessorFast",
-            )
-        else:
-            image_processor_fast_class = None
-        if old_feature_extractor_class is not None:
-            feature_extractor_class = get_user_field(
-                "What will be the name of the feature extractor class for this model? ",
-                default_value=f"{model_camel_cased}FeatureExtractor",
-            )
-        else:
-            feature_extractor_class = None
-        if old_processor_class is not None:
-            processor_class = get_user_field(
-                "What will be the name of the processor class for this model? ",
-                default_value=f"{model_camel_cased}Processor",
-            )
-        else:
-            processor_class = None
-        if old_image_processor_class is not None and old_image_processor_fast_class is None:
-            create_fast_image_processor = get_user_field(
-                "A fast image processor can be created from the slow one, but modifications might be needed. "
-                "Should we add a fast image processor class for this model (recommended, yes/no)? ",
-                convert_to=convert_to_bool,
-                default_value="yes",
-                fallback_message="Please answer yes/no, y/n, true/false or 1/0.",
-            )
-        else:
-            create_fast_image_processor = False
-
-    model_patterns = ModelPatterns(
-        model_name,
-        checkpoint,
-        model_type=model_type,
-        model_lower_cased=model_lower_cased,
-        model_camel_cased=model_camel_cased,
-        model_upper_cased=model_upper_cased,
-        config_class=config_class,
-        tokenizer_class=tokenizer_class,
-        image_processor_class=image_processor_class,
-        image_processor_fast_class=image_processor_fast_class,
-        feature_extractor_class=feature_extractor_class,
-        processor_class=processor_class,
-    )
-
-    add_copied_from = get_user_field(
-        "Should we add # Copied from statements when creating the new modeling file (yes/no)? ",
-        convert_to=convert_to_bool,
-        default_value="yes",
-        fallback_message="Please answer yes/no, y/n, true/false or 1/0.",
-    )
-
-    all_frameworks = get_user_field(
-        "Should we add a version of your new model in all the frameworks implemented by"
-        f" {old_model_type} ({old_frameworks}) (yes/no)? ",
-        convert_to=convert_to_bool,
-        default_value="yes",
-        fallback_message="Please answer yes/no, y/n, true/false or 1/0.",
-    )
-
-    if all_frameworks:
-        frameworks = None
-    else:
-        frameworks = get_user_field(
-            "Please enter the list of frameworks you want (pt, tf, flax) separated by spaces",
-            is_valid_answer=lambda x: all(p in ["pt", "tf", "flax"] for p in x.split(" ")),
+    create_fast_image_processor = False
+    if add_image_processor and not add_fast_image_processor:
+        create_fast_image_processor = get_user_field(
+            "A fast image processor can be created from the slow one, but modifications might be needed. "
+            "Should we add a fast image processor class for this model (recommended) (y/n)? ",
+            convert_to=convert_to_bool,
+            default_value="y",
+            fallback_message="Please answer yes/no, y/n, true/false or 1/0.",
         )
-        frameworks = list(set(frameworks.split(" ")))
 
-    return (old_model_type, model_patterns, add_copied_from, frameworks, old_checkpoint, create_fast_image_processor)
+    return old_model_infos, new_lowercase_name, new_model_paper_name, filenames_to_add, create_fast_image_processor
+
+
+def add_new_model_like_command_factory(args: Namespace):
+    return AddNewModelLikeCommand(path_to_repo=args.path_to_repo)
+
+
+class AddNewModelLikeCommand(BaseTransformersCLICommand):
+    @staticmethod
+    def register_subcommand(parser: ArgumentParser):
+        add_new_model_like_parser = parser.add_parser("add-new-model-like")
+        add_new_model_like_parser.add_argument(
+            "--path_to_repo", type=str, help="When not using an editable install, the path to the Transformers repo."
+        )
+        add_new_model_like_parser.set_defaults(func=add_new_model_like_command_factory)
+
+    def __init__(self, path_to_repo=None, *args):
+        (
+            self.old_model_infos,
+            self.new_lowercase_name,
+            self.new_model_paper_name,
+            self.filenames_to_add,
+            self.create_fast_image_processor,
+        ) = get_user_input()
+        self.path_to_repo = path_to_repo
+
+    def run(self):
+        if self.path_to_repo is not None:
+            # Adapt constants
+            global TRANSFORMERS_PATH
+            global REPO_PATH
+
+            REPO_PATH = Path(self.path_to_repo)
+            TRANSFORMERS_PATH = REPO_PATH / "src" / "transformers"
+
+        create_new_model_like(
+            old_model_infos=self.old_model_infos,
+            new_lowercase_name=self.new_lowercase_name,
+            new_model_paper_name=self.new_model_paper_name,
+            filenames_to_add=self.filenames_to_add,
+            create_fast_image_processor=self.create_fast_image_processor,
+        )
diff --git a/src/transformers/models/auto/image_processing_auto.py b/src/transformers/models/auto/image_processing_auto.py
index d0ad2238c9..d00bfad332 100644
--- a/src/transformers/models/auto/image_processing_auto.py
+++ b/src/transformers/models/auto/image_processing_auto.py
@@ -62,7 +62,7 @@ else:
             ("aimv2", ("CLIPImageProcessor", "CLIPImageProcessorFast")),
             ("aimv2_vision_model", ("CLIPImageProcessor", "CLIPImageProcessorFast")),
             ("align", ("EfficientNetImageProcessor", "EfficientNetImageProcessorFast")),
-            ("aria", ("AriaImageProcessor")),
+            ("aria", ("AriaImageProcessor", None)),
             ("beit", ("BeitImageProcessor", "BeitImageProcessorFast")),
             ("bit", ("BitImageProcessor", "BitImageProcessorFast")),
             ("blip", ("BlipImageProcessor", "BlipImageProcessorFast")),
@@ -72,7 +72,7 @@ else:
             ("chinese_clip", ("ChineseCLIPImageProcessor", "ChineseCLIPImageProcessorFast")),
             ("clip", ("CLIPImageProcessor", "CLIPImageProcessorFast")),
             ("clipseg", ("ViTImageProcessor", "ViTImageProcessorFast")),
-            ("cohere2_vision", ("Cohere2VisionImageProcessorFast",)),
+            ("cohere2_vision", (None, "Cohere2VisionImageProcessorFast")),
             ("conditional_detr", ("ConditionalDetrImageProcessor", "ConditionalDetrImageProcessorFast")),
             ("convnext", ("ConvNextImageProcessor", "ConvNextImageProcessorFast")),
             ("convnextv2", ("ConvNextImageProcessor", "ConvNextImageProcessorFast")),
@@ -84,52 +84,52 @@ else:
             ("deit", ("DeiTImageProcessor", "DeiTImageProcessorFast")),
             ("depth_anything", ("DPTImageProcessor", "DPTImageProcessorFast")),
             ("depth_pro", ("DepthProImageProcessor", "DepthProImageProcessorFast")),
-            ("deta", ("DetaImageProcessor",)),
+            ("deta", ("DetaImageProcessor", None)),
             ("detr", ("DetrImageProcessor", "DetrImageProcessorFast")),
             ("dinat", ("ViTImageProcessor", "ViTImageProcessorFast")),
             ("dinov2", ("BitImageProcessor", "BitImageProcessorFast")),
             ("donut-swin", ("DonutImageProcessor", "DonutImageProcessorFast")),
             ("dpt", ("DPTImageProcessor", "DPTImageProcessorFast")),
-            ("efficientformer", ("EfficientFormerImageProcessor",)),
-            ("efficientloftr", ("EfficientLoFTRImageProcessor",)),
+            ("efficientformer", ("EfficientFormerImageProcessor", None)),
+            ("efficientloftr", ("EfficientLoFTRImageProcessor", None)),
             ("efficientnet", ("EfficientNetImageProcessor", "EfficientNetImageProcessorFast")),
             ("eomt", ("EomtImageProcessor", "EomtImageProcessorFast")),
             ("flava", ("FlavaImageProcessor", "FlavaImageProcessorFast")),
             ("focalnet", ("BitImageProcessor", "BitImageProcessorFast")),
-            ("fuyu", ("FuyuImageProcessor",)),
+            ("fuyu", ("FuyuImageProcessor", None)),
             ("gemma3", ("Gemma3ImageProcessor", "Gemma3ImageProcessorFast")),
             ("gemma3n", ("SiglipImageProcessor", "SiglipImageProcessorFast")),
             ("git", ("CLIPImageProcessor", "CLIPImageProcessorFast")),
             ("glm4v", ("Glm4vImageProcessor", "Glm4vImageProcessorFast")),
-            ("glpn", ("GLPNImageProcessor",)),
+            ("glpn", ("GLPNImageProcessor", None)),
             ("got_ocr2", ("GotOcr2ImageProcessor", "GotOcr2ImageProcessorFast")),
             ("grounding-dino", ("GroundingDinoImageProcessor", "GroundingDinoImageProcessorFast")),
             ("groupvit", ("CLIPImageProcessor", "CLIPImageProcessorFast")),
             ("hiera", ("BitImageProcessor", "BitImageProcessorFast")),
-            ("idefics", ("IdeficsImageProcessor",)),
+            ("idefics", ("IdeficsImageProcessor", None)),
             ("idefics2", ("Idefics2ImageProcessor", "Idefics2ImageProcessorFast")),
             ("idefics3", ("Idefics3ImageProcessor", "Idefics3ImageProcessorFast")),
             ("ijepa", ("ViTImageProcessor", "ViTImageProcessorFast")),
-            ("imagegpt", ("ImageGPTImageProcessor",)),
+            ("imagegpt", ("ImageGPTImageProcessor", None)),
             ("instructblip", ("BlipImageProcessor", "BlipImageProcessorFast")),
-            ("instructblipvideo", ("InstructBlipVideoImageProcessor",)),
+            ("instructblipvideo", ("InstructBlipVideoImageProcessor", None)),
             ("janus", ("JanusImageProcessor", "JanusImageProcessorFast")),
             ("kosmos-2", ("CLIPImageProcessor", "CLIPImageProcessorFast")),
             ("layoutlmv2", ("LayoutLMv2ImageProcessor", "LayoutLMv2ImageProcessorFast")),
             ("layoutlmv3", ("LayoutLMv3ImageProcessor", "LayoutLMv3ImageProcessorFast")),
             ("levit", ("LevitImageProcessor", "LevitImageProcessorFast")),
-            ("lightglue", ("LightGlueImageProcessor",)),
+            ("lightglue", ("LightGlueImageProcessor", None)),
             ("llama4", ("Llama4ImageProcessor", "Llama4ImageProcessorFast")),
             ("llava", ("LlavaImageProcessor", "LlavaImageProcessorFast")),
             ("llava_next", ("LlavaNextImageProcessor", "LlavaNextImageProcessorFast")),
-            ("llava_next_video", ("LlavaNextVideoImageProcessor",)),
+            ("llava_next_video", ("LlavaNextVideoImageProcessor", None)),
             ("llava_onevision", ("LlavaOnevisionImageProcessor", "LlavaOnevisionImageProcessorFast")),
             ("mask2former", ("Mask2FormerImageProcessor", "Mask2FormerImageProcessorFast")),
             ("maskformer", ("MaskFormerImageProcessor", "MaskFormerImageProcessorFast")),
             ("mgp-str", ("ViTImageProcessor", "ViTImageProcessorFast")),
             ("mistral3", ("PixtralImageProcessor", "PixtralImageProcessorFast")),
             ("mlcd", ("CLIPImageProcessor", "CLIPImageProcessorFast")),
-            ("mllama", ("MllamaImageProcessor",)),
+            ("mllama", ("MllamaImageProcessor", None)),
             ("mm-grounding-dino", ("GroundingDinoImageProcessor", "GroundingDinoImageProcessorFast")),
             ("mobilenet_v1", ("MobileNetV1ImageProcessor", "MobileNetV1ImageProcessorFast")),
             ("mobilenet_v2", ("MobileNetV2ImageProcessor", "MobileNetV2ImageProcessorFast")),
@@ -142,12 +142,12 @@ else:
             ("owlvit", ("OwlViTImageProcessor", "OwlViTImageProcessorFast")),
             ("paligemma", ("SiglipImageProcessor", "SiglipImageProcessorFast")),
             ("perceiver", ("PerceiverImageProcessor", "PerceiverImageProcessorFast")),
-            ("perception_lm", ("PerceptionLMImageProcessorFast",)),
-            ("phi4_multimodal", ("Phi4MultimodalImageProcessorFast",)),
-            ("pix2struct", ("Pix2StructImageProcessor",)),
+            ("perception_lm", (None, "PerceptionLMImageProcessorFast")),
+            ("phi4_multimodal", (None, "Phi4MultimodalImageProcessorFast")),
+            ("pix2struct", ("Pix2StructImageProcessor", None)),
             ("pixtral", ("PixtralImageProcessor", "PixtralImageProcessorFast")),
             ("poolformer", ("PoolFormerImageProcessor", "PoolFormerImageProcessorFast")),
-            ("prompt_depth_anything", ("PromptDepthAnythingImageProcessor",)),
+            ("prompt_depth_anything", ("PromptDepthAnythingImageProcessor", None)),
             ("pvt", ("PvtImageProcessor", "PvtImageProcessorFast")),
             ("pvt_v2", ("PvtImageProcessor", "PvtImageProcessorFast")),
             ("qwen2_5_vl", ("Qwen2VLImageProcessor", "Qwen2VLImageProcessorFast")),
@@ -157,39 +157,31 @@ else:
             ("rt_detr", ("RTDetrImageProcessor", "RTDetrImageProcessorFast")),
             ("sam", ("SamImageProcessor", "SamImageProcessorFast")),
             ("sam_hq", ("SamImageProcessor", "SamImageProcessorFast")),
-            ("segformer", ("SegformerImageProcessor",)),
             ("segformer", ("SegformerImageProcessor", "SegformerImageProcessorFast")),
-            ("seggpt", ("SegGptImageProcessor",)),
+            ("seggpt", ("SegGptImageProcessor", None)),
             ("shieldgemma2", ("Gemma3ImageProcessor", "Gemma3ImageProcessorFast")),
             ("siglip", ("SiglipImageProcessor", "SiglipImageProcessorFast")),
             ("siglip2", ("Siglip2ImageProcessor", "Siglip2ImageProcessorFast")),
             ("smolvlm", ("SmolVLMImageProcessor", "SmolVLMImageProcessorFast")),
-            ("superglue", ("SuperGlueImageProcessor",)),
-            (
-                "superpoint",
-                (
-                    "SuperPointImageProcessor",
-                    "SuperPointImageProcessorFast",
-                ),
-            ),
+            ("superglue", ("SuperGlueImageProcessor", None)),
+            ("superpoint", ("SuperPointImageProcessor", "SuperPointImageProcessorFast")),
             ("swiftformer", ("ViTImageProcessor", "ViTImageProcessorFast")),
             ("swin", ("ViTImageProcessor", "ViTImageProcessorFast")),
             ("swin2sr", ("Swin2SRImageProcessor", "Swin2SRImageProcessorFast")),
             ("swinv2", ("ViTImageProcessor", "ViTImageProcessorFast")),
-            ("table-transformer", ("DetrImageProcessor",)),
-            ("timesformer", ("VideoMAEImageProcessor",)),
-            ("timm_wrapper", ("TimmWrapperImageProcessor",)),
-            ("tvlt", ("TvltImageProcessor",)),
-            ("tvp", ("TvpImageProcessor",)),
+            ("table-transformer", ("DetrImageProcessor", None)),
+            ("timesformer", ("VideoMAEImageProcessor", None)),
+            ("timm_wrapper", ("TimmWrapperImageProcessor", None)),
+            ("tvlt", ("TvltImageProcessor", None)),
+            ("tvp", ("TvpImageProcessor", None)),
             ("udop", ("LayoutLMv3ImageProcessor", "LayoutLMv3ImageProcessorFast")),
-            ("udop", ("LayoutLMv3ImageProcessor",)),
             ("upernet", ("SegformerImageProcessor", "SegformerImageProcessorFast")),
             ("van", ("ConvNextImageProcessor", "ConvNextImageProcessorFast")),
-            ("videomae", ("VideoMAEImageProcessor",)),
+            ("videomae", ("VideoMAEImageProcessor", None)),
             ("vilt", ("ViltImageProcessor", "ViltImageProcessorFast")),
             ("vipllava", ("CLIPImageProcessor", "CLIPImageProcessorFast")),
             ("vit", ("ViTImageProcessor", "ViTImageProcessorFast")),
-            ("vit_hybrid", ("ViTHybridImageProcessor",)),
+            ("vit_hybrid", ("ViTHybridImageProcessor", None)),
             ("vit_mae", ("ViTImageProcessor", "ViTImageProcessorFast")),
             ("vit_msn", ("ViTImageProcessor", "ViTImageProcessorFast")),
             ("vitmatte", ("VitMatteImageProcessor", "VitMatteImageProcessorFast")),
@@ -199,18 +191,14 @@ else:
         ]
     )
 
-for model_type, image_processors in IMAGE_PROCESSOR_MAPPING_NAMES.items():
-    slow_image_processor_class, *fast_image_processor_class = image_processors
+# Override to None if the packages are not available
+for model_type, (slow_class, fast_class) in IMAGE_PROCESSOR_MAPPING_NAMES.items():
     if not is_vision_available():
-        slow_image_processor_class = None
+        slow_class = None
+    if not is_torchvision_available():
+        fast_class = None
 
-    # If the fast image processor is not defined, or torchvision is not available, we set it to None
-    if not fast_image_processor_class or fast_image_processor_class[0] is None or not is_torchvision_available():
-        fast_image_processor_class = None
-    else:
-        fast_image_processor_class = fast_image_processor_class[0]
-
-    IMAGE_PROCESSOR_MAPPING_NAMES[model_type] = (slow_image_processor_class, fast_image_processor_class)
+    IMAGE_PROCESSOR_MAPPING_NAMES[model_type] = (slow_class, fast_class)
 
 IMAGE_PROCESSOR_MAPPING = _LazyAutoMapping(CONFIG_MAPPING_NAMES, IMAGE_PROCESSOR_MAPPING_NAMES)
 
diff --git a/src/transformers/utils/__init__.py b/src/transformers/utils/__init__.py
index c45a93e406..bb2920b403 100644
--- a/src/transformers/utils/__init__.py
+++ b/src/transformers/utils/__init__.py
@@ -179,6 +179,7 @@ from .import_utils import (
     is_keras_nlp_available,
     is_kernels_available,
     is_levenshtein_available,
+    is_libcst_available,
     is_librosa_available,
     is_liger_kernel_available,
     is_lomo_available,
diff --git a/src/transformers/utils/import_utils.py b/src/transformers/utils/import_utils.py
index 106e8abe11..9fa7c5253d 100644
--- a/src/transformers/utils/import_utils.py
+++ b/src/transformers/utils/import_utils.py
@@ -120,6 +120,7 @@ _vptq_available, _vptq_version = _is_package_available("vptq", return_version=Tr
 _av_available = importlib.util.find_spec("av") is not None
 _decord_available = importlib.util.find_spec("decord") is not None
 _torchcodec_available = importlib.util.find_spec("torchcodec") is not None
+_libcst_available = _is_package_available("libcst")
 _bitsandbytes_available = _is_package_available("bitsandbytes")
 _eetq_available = _is_package_available("eetq")
 _fbgemm_gpu_available = _is_package_available("fbgemm_gpu")
@@ -379,6 +380,10 @@ def is_torch_available():
     return _torch_available
 
 
+def is_libcst_available():
+    return _libcst_available
+
+
 def is_accelerate_available(min_version: str = ACCELERATE_MIN_VERSION):
     return _accelerate_available and version.parse(_accelerate_version) >= version.parse(min_version)
 
diff --git a/tests/models/align/test_processor_align.py b/tests/models/align/test_processing_align.py
similarity index 100%
rename from tests/models/align/test_processor_align.py
rename to tests/models/align/test_processing_align.py
diff --git a/tests/models/altclip/test_processor_altclip.py b/tests/models/altclip/test_processing_altclip.py
similarity index 100%
rename from tests/models/altclip/test_processor_altclip.py
rename to tests/models/altclip/test_processing_altclip.py
diff --git a/tests/models/aria/test_processor_aria.py b/tests/models/aria/test_processing_aria.py
similarity index 99%
rename from tests/models/aria/test_processor_aria.py
rename to tests/models/aria/test_processing_aria.py
index 4c228d3c16..a78c372f0e 100644
--- a/tests/models/aria/test_processor_aria.py
+++ b/tests/models/aria/test_processing_aria.py
@@ -95,7 +95,7 @@ class AriaProcessorTest(ProcessorTesterMixin, unittest.TestCase):
     def tearDownClass(cls):
         shutil.rmtree(cls.tmpdirname, ignore_errors=True)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/aya_vision/test_processor_aya_vision.py b/tests/models/aya_vision/test_processing_aya_vision.py
similarity index 98%
rename from tests/models/aya_vision/test_processor_aya_vision.py
rename to tests/models/aya_vision/test_processing_aya_vision.py
index b768f08a03..33b7da48f2 100644
--- a/tests/models/aya_vision/test_processor_aya_vision.py
+++ b/tests/models/aya_vision/test_processing_aya_vision.py
@@ -80,7 +80,7 @@ class AyaVisionProcessorTest(ProcessorTesterMixin, unittest.TestCase):
     def tearDownClass(cls):
         shutil.rmtree(cls.tmpdirname, ignore_errors=True)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/bark/test_processor_bark.py b/tests/models/bark/test_processing_bark.py
similarity index 100%
rename from tests/models/bark/test_processor_bark.py
rename to tests/models/bark/test_processing_bark.py
diff --git a/tests/models/blip/test_processor_blip.py b/tests/models/blip/test_processing_blip.py
similarity index 100%
rename from tests/models/blip/test_processor_blip.py
rename to tests/models/blip/test_processing_blip.py
diff --git a/tests/models/blip_2/test_processor_blip_2.py b/tests/models/blip_2/test_processing_blip_2.py
similarity index 100%
rename from tests/models/blip_2/test_processor_blip_2.py
rename to tests/models/blip_2/test_processing_blip_2.py
diff --git a/tests/models/bridgetower/test_processor_bridgetower.py b/tests/models/bridgetower/test_processing_bridgetower.py
similarity index 100%
rename from tests/models/bridgetower/test_processor_bridgetower.py
rename to tests/models/bridgetower/test_processing_bridgetower.py
diff --git a/tests/models/chameleon/test_processor_chameleon.py b/tests/models/chameleon/test_processing_chameleon.py
similarity index 96%
rename from tests/models/chameleon/test_processor_chameleon.py
rename to tests/models/chameleon/test_processing_chameleon.py
index 57f3b810af..71da4431e7 100644
--- a/tests/models/chameleon/test_processor_chameleon.py
+++ b/tests/models/chameleon/test_processing_chameleon.py
@@ -75,7 +75,7 @@ class ChameleonProcessorTest(ProcessorTesterMixin, unittest.TestCase):
     def prepare_processor_dict():
         return {"image_seq_length": 2}  # fmt: skip
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/chinese_clip/test_processor_chinese_clip.py b/tests/models/chinese_clip/test_processing_chinese_clip.py
similarity index 100%
rename from tests/models/chinese_clip/test_processor_chinese_clip.py
rename to tests/models/chinese_clip/test_processing_chinese_clip.py
diff --git a/tests/models/clap/test_processor_clap.py b/tests/models/clap/test_processing_clap.py
similarity index 100%
rename from tests/models/clap/test_processor_clap.py
rename to tests/models/clap/test_processing_clap.py
diff --git a/tests/models/clip/test_processor_clip.py b/tests/models/clip/test_processing_clip.py
similarity index 100%
rename from tests/models/clip/test_processor_clip.py
rename to tests/models/clip/test_processing_clip.py
diff --git a/tests/models/clipseg/test_processor_clipseg.py b/tests/models/clipseg/test_processing_clipseg.py
similarity index 100%
rename from tests/models/clipseg/test_processor_clipseg.py
rename to tests/models/clipseg/test_processing_clipseg.py
diff --git a/tests/models/clvp/test_processor_clvp.py b/tests/models/clvp/test_processing_clvp.py
similarity index 91%
rename from tests/models/clvp/test_processor_clvp.py
rename to tests/models/clvp/test_processing_clvp.py
index 817cbbff88..d03f7f75ed 100644
--- a/tests/models/clvp/test_processor_clvp.py
+++ b/tests/models/clvp/test_processing_clvp.py
@@ -35,15 +35,15 @@ class ClvpProcessorTest(unittest.TestCase):
         shutil.rmtree(self.tmpdirname)
         gc.collect()
 
-    # Copied from transformers.tests.models.whisper.test_processor_whisper.WhisperProcessorTest.get_tokenizer with Whisper->Clvp
+    # Copied from transformers.tests.models.whisper.test_processing_whisper.WhisperProcessorTest.get_tokenizer with Whisper->Clvp
     def get_tokenizer(self, **kwargs):
         return ClvpTokenizer.from_pretrained(self.checkpoint, **kwargs)
 
-    # Copied from transformers.tests.models.whisper.test_processor_whisper.WhisperProcessorTest.get_feature_extractor with Whisper->Clvp
+    # Copied from transformers.tests.models.whisper.test_processing_whisper.WhisperProcessorTest.get_feature_extractor with Whisper->Clvp
     def get_feature_extractor(self, **kwargs):
         return ClvpFeatureExtractor.from_pretrained(self.checkpoint, **kwargs)
 
-    # Copied from transformers.tests.models.whisper.test_processor_whisper.WhisperProcessorTest.test_save_load_pretrained_default with Whisper->Clvp
+    # Copied from transformers.tests.models.whisper.test_processing_whisper.WhisperProcessorTest.test_save_load_pretrained_default with Whisper->Clvp
     def test_save_load_pretrained_default(self):
         tokenizer = self.get_tokenizer()
         feature_extractor = self.get_feature_extractor()
@@ -59,7 +59,7 @@ class ClvpProcessorTest(unittest.TestCase):
         self.assertEqual(processor.feature_extractor.to_json_string(), feature_extractor.to_json_string())
         self.assertIsInstance(processor.feature_extractor, ClvpFeatureExtractor)
 
-    # Copied from transformers.tests.models.whisper.test_processor_whisper.WhisperProcessorTest.test_feature_extractor with Whisper->Clvp,processor(raw_speech->processor(raw_speech=raw_speech
+    # Copied from transformers.tests.models.whisper.test_processing_whisper.WhisperProcessorTest.test_feature_extractor with Whisper->Clvp,processor(raw_speech->processor(raw_speech=raw_speech
     def test_feature_extractor(self):
         feature_extractor = self.get_feature_extractor()
         tokenizer = self.get_tokenizer()
@@ -74,7 +74,7 @@ class ClvpProcessorTest(unittest.TestCase):
         for key in input_feat_extract:
             self.assertAlmostEqual(input_feat_extract[key].sum(), input_processor[key].sum(), delta=1e-2)
 
-    # Copied from transformers.tests.models.whisper.test_processor_whisper.WhisperProcessorTest.test_tokenizer with Whisper->Clvp
+    # Copied from transformers.tests.models.whisper.test_processing_whisper.WhisperProcessorTest.test_tokenizer with Whisper->Clvp
     def test_tokenizer(self):
         feature_extractor = self.get_feature_extractor()
         tokenizer = self.get_tokenizer()
@@ -90,7 +90,7 @@ class ClvpProcessorTest(unittest.TestCase):
         for key in encoded_tok:
             self.assertListEqual(encoded_tok[key], encoded_processor[key])
 
-    # Copied from transformers.tests.models.whisper.test_processor_whisper.WhisperProcessorTest.test_tokenizer_decode with Whisper->Clvp
+    # Copied from transformers.tests.models.whisper.test_processing_whisper.WhisperProcessorTest.test_tokenizer_decode with Whisper->Clvp
     def test_tokenizer_decode(self):
         feature_extractor = self.get_feature_extractor()
         tokenizer = self.get_tokenizer()
diff --git a/tests/models/colpali/test_processing_colpali.py b/tests/models/colpali/test_processing_colpali.py
index 539b604a35..aa4fad517b 100644
--- a/tests/models/colpali/test_processing_colpali.py
+++ b/tests/models/colpali/test_processing_colpali.py
@@ -54,7 +54,7 @@ class ColPaliProcessorTest(ProcessorTesterMixin, unittest.TestCase):
     def tearDownClass(cls):
         shutil.rmtree(cls.tmpdirname, ignore_errors=True)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/colqwen2/test_processing_colqwen2.py b/tests/models/colqwen2/test_processing_colqwen2.py
index 25e6b523c8..300cc680fe 100644
--- a/tests/models/colqwen2/test_processing_colqwen2.py
+++ b/tests/models/colqwen2/test_processing_colqwen2.py
@@ -57,7 +57,7 @@ class ColQwen2ProcessorTest(ProcessorTesterMixin, unittest.TestCase):
     def tearDownClass(cls):
         shutil.rmtree(cls.tmpdirname)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/csm/test_processor_csm.py b/tests/models/csm/test_processing_csm.py
similarity index 100%
rename from tests/models/csm/test_processor_csm.py
rename to tests/models/csm/test_processing_csm.py
diff --git a/tests/models/deepseek_vl/test_processor_deepseek_vl.py b/tests/models/deepseek_vl/test_processing_deepseek_vl.py
similarity index 100%
rename from tests/models/deepseek_vl/test_processor_deepseek_vl.py
rename to tests/models/deepseek_vl/test_processing_deepseek_vl.py
diff --git a/tests/models/deepseek_vl_hybrid/test_processor_deepseek_vl_hybrid.py b/tests/models/deepseek_vl_hybrid/test_processing_deepseek_vl_hybrid.py
similarity index 100%
rename from tests/models/deepseek_vl_hybrid/test_processor_deepseek_vl_hybrid.py
rename to tests/models/deepseek_vl_hybrid/test_processing_deepseek_vl_hybrid.py
diff --git a/tests/models/dia/test_processor_dia.py b/tests/models/dia/test_processing_dia.py
similarity index 100%
rename from tests/models/dia/test_processor_dia.py
rename to tests/models/dia/test_processing_dia.py
diff --git a/tests/models/donut/test_processor_donut.py b/tests/models/donut/test_processing_donut.py
similarity index 100%
rename from tests/models/donut/test_processor_donut.py
rename to tests/models/donut/test_processing_donut.py
diff --git a/tests/models/emu3/test_processor_emu3.py b/tests/models/emu3/test_processing_emu3.py
similarity index 97%
rename from tests/models/emu3/test_processor_emu3.py
rename to tests/models/emu3/test_processing_emu3.py
index bb7c8187e5..a62107892a 100644
--- a/tests/models/emu3/test_processor_emu3.py
+++ b/tests/models/emu3/test_processing_emu3.py
@@ -91,7 +91,7 @@ class Emu3ProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         # For an image where pixels go from 0 to 255 the diff can be 1 due to some numerical precision errors when scaling and unscaling
         self.assertTrue(np.abs(orig_image - unnormalized_images).max() >= 1)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/evolla/test_processor_evolla.py b/tests/models/evolla/test_processing_evolla.py
similarity index 100%
rename from tests/models/evolla/test_processor_evolla.py
rename to tests/models/evolla/test_processing_evolla.py
diff --git a/tests/models/flava/test_processor_flava.py b/tests/models/flava/test_processing_flava.py
similarity index 100%
rename from tests/models/flava/test_processor_flava.py
rename to tests/models/flava/test_processing_flava.py
diff --git a/tests/models/fuyu/test_processor_fuyu.py b/tests/models/fuyu/test_processing_fuyu.py
similarity index 99%
rename from tests/models/fuyu/test_processor_fuyu.py
rename to tests/models/fuyu/test_processing_fuyu.py
index 6fb935cbec..6f38e9a0e8 100644
--- a/tests/models/fuyu/test_processor_fuyu.py
+++ b/tests/models/fuyu/test_processing_fuyu.py
@@ -64,7 +64,7 @@ class FuyuProcessingTest(ProcessorTesterMixin, unittest.TestCase):
     def get_image_processor(self, **kwargs):
         return AutoProcessor.from_pretrained(self.tmpdirname, **kwargs).image_processor
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/gemma3/test_processing_gemma3.py b/tests/models/gemma3/test_processing_gemma3.py
index 98984a3c08..16789e8096 100644
--- a/tests/models/gemma3/test_processing_gemma3.py
+++ b/tests/models/gemma3/test_processing_gemma3.py
@@ -58,7 +58,7 @@ class Gemma3ProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         processor.save_pretrained(cls.tmpdirname)
         cls.image_token = processor.boi_token
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/git/test_processor_git.py b/tests/models/git/test_processing_git.py
similarity index 100%
rename from tests/models/git/test_processor_git.py
rename to tests/models/git/test_processing_git.py
diff --git a/tests/models/got_ocr2/test_processor_got_ocr2.py b/tests/models/got_ocr2/test_processing_got_ocr2.py
similarity index 100%
rename from tests/models/got_ocr2/test_processor_got_ocr2.py
rename to tests/models/got_ocr2/test_processing_got_ocr2.py
diff --git a/tests/models/granite_speech/test_processor_granite_speech.py b/tests/models/granite_speech/test_processing_granite_speech.py
similarity index 100%
rename from tests/models/granite_speech/test_processor_granite_speech.py
rename to tests/models/granite_speech/test_processing_granite_speech.py
diff --git a/tests/models/grounding_dino/test_processor_grounding_dino.py b/tests/models/grounding_dino/test_processing_grounding_dino.py
similarity index 91%
rename from tests/models/grounding_dino/test_processor_grounding_dino.py
rename to tests/models/grounding_dino/test_processing_grounding_dino.py
index 89f14153b1..5aaa4f8b31 100644
--- a/tests/models/grounding_dino/test_processor_grounding_dino.py
+++ b/tests/models/grounding_dino/test_processing_grounding_dino.py
@@ -94,17 +94,17 @@ class GroundingDinoProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         return [labels, labels_longer] + [labels] * (batch_size - 2)
 
     @classmethod
-    # Copied from tests.models.clip.test_processor_clip.CLIPProcessorTest.get_tokenizer with CLIP->Bert
+    # Copied from tests.models.clip.test_processing_clip.CLIPProcessorTest.get_tokenizer with CLIP->Bert
     def get_tokenizer(cls, **kwargs):
         return BertTokenizer.from_pretrained(cls.tmpdirname, **kwargs)
 
     @classmethod
-    # Copied from tests.models.clip.test_processor_clip.CLIPProcessorTest.get_rust_tokenizer with CLIP->Bert
+    # Copied from tests.models.clip.test_processing_clip.CLIPProcessorTest.get_rust_tokenizer with CLIP->Bert
     def get_rust_tokenizer(cls, **kwargs):
         return BertTokenizerFast.from_pretrained(cls.tmpdirname, **kwargs)
 
     @classmethod
-    # Copied from tests.models.clip.test_processor_clip.CLIPProcessorTest.get_image_processor with CLIP->GroundingDino
+    # Copied from tests.models.clip.test_processing_clip.CLIPProcessorTest.get_image_processor with CLIP->GroundingDino
     def get_image_processor(cls, **kwargs):
         return GroundingDinoImageProcessor.from_pretrained(cls.tmpdirname, **kwargs)
 
@@ -145,7 +145,7 @@ class GroundingDinoProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         expected_box_slice = torch.tensor([0.6908, 0.4354, 1.0737, 1.3947])
         torch.testing.assert_close(post_processed[0]["boxes"][0], expected_box_slice, rtol=1e-4, atol=1e-4)
 
-    # Copied from tests.models.clip.test_processor_clip.CLIPProcessorTest.test_save_load_pretrained_default with CLIP->GroundingDino,GroundingDinoTokenizer->BertTokenizer
+    # Copied from tests.models.clip.test_processing_clip.CLIPProcessorTest.test_save_load_pretrained_default with CLIP->GroundingDino,GroundingDinoTokenizer->BertTokenizer
     def test_save_load_pretrained_default(self):
         tokenizer_slow = self.get_tokenizer()
         tokenizer_fast = self.get_rust_tokenizer()
@@ -171,7 +171,7 @@ class GroundingDinoProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         self.assertIsInstance(processor_slow.image_processor, GroundingDinoImageProcessor)
         self.assertIsInstance(processor_fast.image_processor, GroundingDinoImageProcessor)
 
-    # Copied from tests.models.clip.test_processor_clip.CLIPProcessorTest.test_save_load_pretrained_additional_features with CLIP->GroundingDino,GroundingDinoTokenizer->BertTokenizer
+    # Copied from tests.models.clip.test_processing_clip.CLIPProcessorTest.test_save_load_pretrained_additional_features with CLIP->GroundingDino,GroundingDinoTokenizer->BertTokenizer
     def test_save_load_pretrained_additional_features(self):
         with tempfile.TemporaryDirectory() as tmpdir:
             processor = GroundingDinoProcessor(
@@ -194,7 +194,7 @@ class GroundingDinoProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         self.assertEqual(processor.image_processor.to_json_string(), image_processor_add_kwargs.to_json_string())
         self.assertIsInstance(processor.image_processor, GroundingDinoImageProcessor)
 
-    # Copied from tests.models.clip.test_processor_clip.CLIPProcessorTest.test_image_processor with CLIP->GroundingDino
+    # Copied from tests.models.clip.test_processing_clip.CLIPProcessorTest.test_image_processor with CLIP->GroundingDino
     def test_image_processor(self):
         image_processor = self.get_image_processor()
         tokenizer = self.get_tokenizer()
@@ -209,7 +209,7 @@ class GroundingDinoProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         for key in input_image_proc:
             self.assertAlmostEqual(input_image_proc[key].sum(), input_processor[key].sum(), delta=1e-2)
 
-    # Copied from tests.models.clip.test_processor_clip.CLIPProcessorTest.test_tokenizer with CLIP->GroundingDino
+    # Copied from tests.models.clip.test_processing_clip.CLIPProcessorTest.test_tokenizer with CLIP->GroundingDino
     def test_tokenizer(self):
         image_processor = self.get_image_processor()
         tokenizer = self.get_tokenizer()
@@ -244,7 +244,7 @@ class GroundingDinoProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         with pytest.raises(ValueError):
             processor()
 
-    # Copied from tests.models.clip.test_processor_clip.CLIPProcessorTest.test_tokenizer_decode with CLIP->GroundingDino
+    # Copied from tests.models.clip.test_processing_clip.CLIPProcessorTest.test_tokenizer_decode with CLIP->GroundingDino
     def test_tokenizer_decode(self):
         image_processor = self.get_image_processor()
         tokenizer = self.get_tokenizer()
@@ -258,7 +258,7 @@ class GroundingDinoProcessorTest(ProcessorTesterMixin, unittest.TestCase):
 
         self.assertListEqual(decoded_tok, decoded_processor)
 
-    # Copied from tests.models.clip.test_processor_clip.CLIPProcessorTest.test_model_input_names with CLIP->GroundingDino
+    # Copied from tests.models.clip.test_processing_clip.CLIPProcessorTest.test_model_input_names with CLIP->GroundingDino
     def test_model_input_names(self):
         image_processor = self.get_image_processor()
         tokenizer = self.get_tokenizer()
diff --git a/tests/models/idefics/test_processor_idefics.py b/tests/models/idefics/test_processing_idefics.py
similarity index 100%
rename from tests/models/idefics/test_processor_idefics.py
rename to tests/models/idefics/test_processing_idefics.py
diff --git a/tests/models/idefics2/test_processor_idefics2.py b/tests/models/idefics2/test_processing_idefics2.py
similarity index 100%
rename from tests/models/idefics2/test_processor_idefics2.py
rename to tests/models/idefics2/test_processing_idefics2.py
diff --git a/tests/models/idefics3/test_processor_idefics3.py b/tests/models/idefics3/test_processing_idefics3.py
similarity index 98%
rename from tests/models/idefics3/test_processor_idefics3.py
rename to tests/models/idefics3/test_processing_idefics3.py
index 7020a24398..780a6899d5 100644
--- a/tests/models/idefics3/test_processor_idefics3.py
+++ b/tests/models/idefics3/test_processing_idefics3.py
@@ -84,7 +84,7 @@ class Idefics3ProcessorTest(ProcessorTesterMixin, unittest.TestCase):
     def prepare_processor_dict():
         return {"image_seq_len": 2}
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
@@ -284,7 +284,7 @@ class Idefics3ProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         self.assertEqual(np.array(inputs["pixel_values"]).shape, (2, 2, 3, 364, 364))
         self.assertEqual(np.array(inputs["pixel_attention_mask"]).shape, (2, 2, 364, 364))
 
-    # Copied from tests.models.idefics2.test_processor_idefics2.Idefics2ProcessorTest.test_process_interleaved_images_prompts_image_error
+    # Copied from tests.models.idefics2.test_processing_idefics2.Idefics2ProcessorTest.test_process_interleaved_images_prompts_image_error
     def test_process_interleaved_images_prompts_image_error(self):
         processor = self.get_processor()
 
diff --git a/tests/models/instructblip/test_processor_instructblip.py b/tests/models/instructblip/test_processing_instructblip.py
similarity index 100%
rename from tests/models/instructblip/test_processor_instructblip.py
rename to tests/models/instructblip/test_processing_instructblip.py
diff --git a/tests/models/instructblipvideo/test_processor_instructblipvideo.py b/tests/models/instructblipvideo/test_processing_instructblipvideo.py
similarity index 100%
rename from tests/models/instructblipvideo/test_processor_instructblipvideo.py
rename to tests/models/instructblipvideo/test_processing_instructblipvideo.py
diff --git a/tests/models/internvl/test_processor_internvl.py b/tests/models/internvl/test_processing_internvl.py
similarity index 99%
rename from tests/models/internvl/test_processor_internvl.py
rename to tests/models/internvl/test_processing_internvl.py
index d192a6c049..b5cf23c8d2 100644
--- a/tests/models/internvl/test_processor_internvl.py
+++ b/tests/models/internvl/test_processing_internvl.py
@@ -97,7 +97,7 @@ class InternVLProcessorTest(ProcessorTesterMixin, unittest.TestCase):
     def tearDownClass(cls):
         shutil.rmtree(cls.tmpdirname, ignore_errors=True)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/internvl/test_video_processor_internvl.py b/tests/models/internvl/test_video_processing_internvl.py
similarity index 100%
rename from tests/models/internvl/test_video_processor_internvl.py
rename to tests/models/internvl/test_video_processing_internvl.py
diff --git a/tests/models/janus/test_processor_janus.py b/tests/models/janus/test_processing_janus.py
similarity index 100%
rename from tests/models/janus/test_processor_janus.py
rename to tests/models/janus/test_processing_janus.py
diff --git a/tests/models/kosmos2/test_processor_kosmos2.py b/tests/models/kosmos2/test_processing_kosmos2.py
similarity index 100%
rename from tests/models/kosmos2/test_processor_kosmos2.py
rename to tests/models/kosmos2/test_processing_kosmos2.py
diff --git a/tests/models/layoutlmv2/test_processor_layoutlmv2.py b/tests/models/layoutlmv2/test_processing_layoutlmv2.py
similarity index 100%
rename from tests/models/layoutlmv2/test_processor_layoutlmv2.py
rename to tests/models/layoutlmv2/test_processing_layoutlmv2.py
diff --git a/tests/models/layoutlmv3/test_processor_layoutlmv3.py b/tests/models/layoutlmv3/test_processing_layoutlmv3.py
similarity index 100%
rename from tests/models/layoutlmv3/test_processor_layoutlmv3.py
rename to tests/models/layoutlmv3/test_processing_layoutlmv3.py
diff --git a/tests/models/layoutxlm/test_processor_layoutxlm.py b/tests/models/layoutxlm/test_processing_layoutxlm.py
similarity index 100%
rename from tests/models/layoutxlm/test_processor_layoutxlm.py
rename to tests/models/layoutxlm/test_processing_layoutxlm.py
diff --git a/tests/models/llama4/test_processor_llama4.py b/tests/models/llama4/test_processing_llama4.py
similarity index 100%
rename from tests/models/llama4/test_processor_llama4.py
rename to tests/models/llama4/test_processing_llama4.py
diff --git a/tests/models/llava/test_processor_llava.py b/tests/models/llava/test_processing_llava.py
similarity index 100%
rename from tests/models/llava/test_processor_llava.py
rename to tests/models/llava/test_processing_llava.py
diff --git a/tests/models/llava_next/test_processor_llava_next.py b/tests/models/llava_next/test_processing_llava_next.py
similarity index 96%
rename from tests/models/llava_next/test_processor_llava_next.py
rename to tests/models/llava_next/test_processing_llava_next.py
index 46d385d2d8..915ea238b2 100644
--- a/tests/models/llava_next/test_processor_llava_next.py
+++ b/tests/models/llava_next/test_processing_llava_next.py
@@ -66,7 +66,7 @@ class LlavaNextProcessorTest(ProcessorTesterMixin, unittest.TestCase):
             "vision_feature_select_strategy": "default"
         }  # fmt: skip
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
@@ -79,7 +79,7 @@ class LlavaNextProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         self.assertTrue("num_image_patches" in output)
         self.assertEqual(len(output["num_image_patches"]), 3)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_chat_template_is_saved
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_chat_template_is_saved
     def test_chat_template_is_saved(self):
         processor_loaded = self.processor_class.from_pretrained(self.tmpdirname)
         processor_dict_loaded = json.loads(processor_loaded.to_json_string())
diff --git a/tests/models/llava_next_video/test_processor_llava_next_video.py b/tests/models/llava_next_video/test_processing_llava_next_video.py
similarity index 96%
rename from tests/models/llava_next_video/test_processor_llava_next_video.py
rename to tests/models/llava_next_video/test_processing_llava_next_video.py
index 3426d1e453..bf5d608205 100644
--- a/tests/models/llava_next_video/test_processor_llava_next_video.py
+++ b/tests/models/llava_next_video/test_processing_llava_next_video.py
@@ -75,7 +75,7 @@ class LlavaNextVideoProcessorTest(ProcessorTesterMixin, unittest.TestCase):
             "vision_feature_select_strategy": "default",
         }
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
@@ -88,7 +88,7 @@ class LlavaNextVideoProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         self.assertTrue("num_image_patches" in output)
         self.assertEqual(len(output["num_image_patches"]), 3)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_chat_template_is_saved
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_chat_template_is_saved
     def test_chat_template_is_saved(self):
         processor_loaded = self.processor_class.from_pretrained(self.tmpdirname)
         processor_dict_loaded = json.loads(processor_loaded.to_json_string())
diff --git a/tests/models/llava_onevision/test_processor_llava_onevision.py b/tests/models/llava_onevision/test_processing_llava_onevision.py
similarity index 96%
rename from tests/models/llava_onevision/test_processor_llava_onevision.py
rename to tests/models/llava_onevision/test_processing_llava_onevision.py
index 577ba19cd8..d7e03443ab 100644
--- a/tests/models/llava_onevision/test_processor_llava_onevision.py
+++ b/tests/models/llava_onevision/test_processing_llava_onevision.py
@@ -79,7 +79,7 @@ class LlavaOnevisionProcessorTest(ProcessorTesterMixin, unittest.TestCase):
             "vision_feature_select_strategy": "default"
         }  # fmt: skip
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
@@ -92,7 +92,7 @@ class LlavaOnevisionProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         self.assertTrue("num_image_patches" in output)
         self.assertEqual(len(output["num_image_patches"]), 3)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_chat_template_is_saved
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_chat_template_is_saved
     def test_chat_template_is_saved(self):
         processor_loaded = self.processor_class.from_pretrained(self.tmpdirname)
         processor_dict_loaded = json.loads(processor_loaded.to_json_string())
diff --git a/tests/models/markuplm/test_processor_markuplm.py b/tests/models/markuplm/test_processing_markuplm.py
similarity index 100%
rename from tests/models/markuplm/test_processor_markuplm.py
rename to tests/models/markuplm/test_processing_markuplm.py
diff --git a/tests/models/mgp_str/test_processor_mgp_str.py b/tests/models/mgp_str/test_processing_mgp_str.py
similarity index 100%
rename from tests/models/mgp_str/test_processor_mgp_str.py
rename to tests/models/mgp_str/test_processing_mgp_str.py
diff --git a/tests/models/mistral3/test_processor_mistral3.py b/tests/models/mistral3/test_processing_mistral3.py
similarity index 100%
rename from tests/models/mistral3/test_processor_mistral3.py
rename to tests/models/mistral3/test_processing_mistral3.py
diff --git a/tests/models/mllama/test_processor_mllama.py b/tests/models/mllama/test_processing_mllama.py
similarity index 100%
rename from tests/models/mllama/test_processor_mllama.py
rename to tests/models/mllama/test_processing_mllama.py
diff --git a/tests/models/musicgen/test_processor_musicgen.py b/tests/models/musicgen/test_processing_musicgen.py
similarity index 100%
rename from tests/models/musicgen/test_processor_musicgen.py
rename to tests/models/musicgen/test_processing_musicgen.py
diff --git a/tests/models/musicgen_melody/test_processor_musicgen_melody.py b/tests/models/musicgen_melody/test_processing_musicgen_melody.py
similarity index 97%
rename from tests/models/musicgen_melody/test_processor_musicgen_melody.py
rename to tests/models/musicgen_melody/test_processing_musicgen_melody.py
index fbeee0543b..f6bf6ea17c 100644
--- a/tests/models/musicgen_melody/test_processor_musicgen_melody.py
+++ b/tests/models/musicgen_melody/test_processing_musicgen_melody.py
@@ -50,7 +50,7 @@ def floats_list(shape, scale=1.0, rng=None, name=None):
 @require_torch
 @require_sentencepiece
 @require_torchaudio
-# Copied from tests.models.musicgen.test_processor_musicgen.MusicgenProcessorTest with Musicgen->MusicgenMelody, Encodec->MusicgenMelody, padding_mask->attention_mask, input_values->input_features
+# Copied from tests.models.musicgen.test_processing_musicgen.MusicgenProcessorTest with Musicgen->MusicgenMelody, Encodec->MusicgenMelody, padding_mask->attention_mask, input_values->input_features
 class MusicgenMelodyProcessorTest(unittest.TestCase):
     def setUp(self):
         # Ignore copy
diff --git a/tests/models/omdet_turbo/test_processor_omdet_turbo.py b/tests/models/omdet_turbo/test_processing_omdet_turbo.py
similarity index 100%
rename from tests/models/omdet_turbo/test_processor_omdet_turbo.py
rename to tests/models/omdet_turbo/test_processing_omdet_turbo.py
diff --git a/tests/models/oneformer/test_processor_oneformer.py b/tests/models/oneformer/test_processing_oneformer.py
similarity index 100%
rename from tests/models/oneformer/test_processor_oneformer.py
rename to tests/models/oneformer/test_processing_oneformer.py
diff --git a/tests/models/owlv2/test_processor_owlv2.py b/tests/models/owlv2/test_processing_owlv2.py
similarity index 100%
rename from tests/models/owlv2/test_processor_owlv2.py
rename to tests/models/owlv2/test_processing_owlv2.py
diff --git a/tests/models/owlvit/test_processor_owlvit.py b/tests/models/owlvit/test_processing_owlvit.py
similarity index 100%
rename from tests/models/owlvit/test_processor_owlvit.py
rename to tests/models/owlvit/test_processing_owlvit.py
diff --git a/tests/models/paligemma/test_processor_paligemma.py b/tests/models/paligemma/test_processing_paligemma.py
similarity index 98%
rename from tests/models/paligemma/test_processor_paligemma.py
rename to tests/models/paligemma/test_processing_paligemma.py
index 821e18d550..25f33bfada 100644
--- a/tests/models/paligemma/test_processor_paligemma.py
+++ b/tests/models/paligemma/test_processing_paligemma.py
@@ -48,7 +48,7 @@ class PaliGemmaProcessorTest(ProcessorTesterMixin, unittest.TestCase):
     def tearDownClass(cls):
         shutil.rmtree(cls.tmpdirname, ignore_errors=True)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/perception_lm/test_processor_perception_lm.py b/tests/models/perception_lm/test_processing_perception_lm.py
similarity index 100%
rename from tests/models/perception_lm/test_processor_perception_lm.py
rename to tests/models/perception_lm/test_processing_perception_lm.py
diff --git a/tests/models/phi4_multimodal/test_feature_extractor_phi4_multimodal.py b/tests/models/phi4_multimodal/test_feature_extraction_phi4_multimodal.py
similarity index 100%
rename from tests/models/phi4_multimodal/test_feature_extractor_phi4_multimodal.py
rename to tests/models/phi4_multimodal/test_feature_extraction_phi4_multimodal.py
diff --git a/tests/models/pix2struct/test_processor_pix2struct.py b/tests/models/pix2struct/test_processing_pix2struct.py
similarity index 100%
rename from tests/models/pix2struct/test_processor_pix2struct.py
rename to tests/models/pix2struct/test_processing_pix2struct.py
diff --git a/tests/models/pixtral/test_processor_pixtral.py b/tests/models/pixtral/test_processing_pixtral.py
similarity index 100%
rename from tests/models/pixtral/test_processor_pixtral.py
rename to tests/models/pixtral/test_processing_pixtral.py
diff --git a/tests/models/pop2piano/test_processor_pop2piano.py b/tests/models/pop2piano/test_processing_pop2piano.py
similarity index 100%
rename from tests/models/pop2piano/test_processor_pop2piano.py
rename to tests/models/pop2piano/test_processing_pop2piano.py
diff --git a/tests/models/qwen2_5_omni/test_processor_qwen2_5_omni.py b/tests/models/qwen2_5_omni/test_processing_qwen2_5_omni.py
similarity index 100%
rename from tests/models/qwen2_5_omni/test_processor_qwen2_5_omni.py
rename to tests/models/qwen2_5_omni/test_processing_qwen2_5_omni.py
diff --git a/tests/models/qwen2_5_vl/test_processor_qwen2_5_vl.py b/tests/models/qwen2_5_vl/test_processing_qwen2_5_vl.py
similarity index 99%
rename from tests/models/qwen2_5_vl/test_processor_qwen2_5_vl.py
rename to tests/models/qwen2_5_vl/test_processing_qwen2_5_vl.py
index 5b8a3beb1d..e05238d588 100644
--- a/tests/models/qwen2_5_vl/test_processor_qwen2_5_vl.py
+++ b/tests/models/qwen2_5_vl/test_processing_qwen2_5_vl.py
@@ -65,7 +65,7 @@ class Qwen2_5_VLProcessorTest(ProcessorTesterMixin, unittest.TestCase):
     def tearDownClass(cls):
         shutil.rmtree(cls.tmpdirname, ignore_errors=True)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/qwen2_audio/test_processor_qwen2_audio.py b/tests/models/qwen2_audio/test_processing_qwen2_audio.py
similarity index 100%
rename from tests/models/qwen2_audio/test_processor_qwen2_audio.py
rename to tests/models/qwen2_audio/test_processing_qwen2_audio.py
diff --git a/tests/models/qwen2_vl/test_processor_qwen2_vl.py b/tests/models/qwen2_vl/test_processing_qwen2_vl.py
similarity index 99%
rename from tests/models/qwen2_vl/test_processor_qwen2_vl.py
rename to tests/models/qwen2_vl/test_processing_qwen2_vl.py
index ccc9b3834f..05a82f5fc9 100644
--- a/tests/models/qwen2_vl/test_processor_qwen2_vl.py
+++ b/tests/models/qwen2_vl/test_processing_qwen2_vl.py
@@ -68,7 +68,7 @@ class Qwen2VLProcessorTest(ProcessorTesterMixin, unittest.TestCase):
     def tearDownClass(cls):
         shutil.rmtree(cls.tmpdirname, ignore_errors=True)
 
-    # Copied from tests.models.llava.test_processor_llava.LlavaProcessorTest.test_get_num_vision_tokens
+    # Copied from tests.models.llava.test_processing_llava.LlavaProcessorTest.test_get_num_vision_tokens
     def test_get_num_vision_tokens(self):
         "Tests general functionality of the helper used internally in vLLM"
 
diff --git a/tests/models/sam/test_processor_sam.py b/tests/models/sam/test_processing_sam.py
similarity index 100%
rename from tests/models/sam/test_processor_sam.py
rename to tests/models/sam/test_processing_sam.py
diff --git a/tests/models/sam_hq/test_processor_samhq.py b/tests/models/sam_hq/test_processing_samhq.py
similarity index 100%
rename from tests/models/sam_hq/test_processor_samhq.py
rename to tests/models/sam_hq/test_processing_samhq.py
diff --git a/tests/models/seamless_m4t/test_processor_seamless_m4t.py b/tests/models/seamless_m4t/test_processing_seamless_m4t.py
similarity index 92%
rename from tests/models/seamless_m4t/test_processor_seamless_m4t.py
rename to tests/models/seamless_m4t/test_processing_seamless_m4t.py
index f963fa2098..929255a82f 100644
--- a/tests/models/seamless_m4t/test_processor_seamless_m4t.py
+++ b/tests/models/seamless_m4t/test_processing_seamless_m4t.py
@@ -76,7 +76,7 @@ class SeamlessM4TProcessorTest(unittest.TestCase):
         tokenizer_instance = isinstance(processor.tokenizer, (SeamlessM4TTokenizerFast, SeamlessM4TTokenizer))
         self.assertTrue(tokenizer_instance)
 
-    # Copied from test.models.whisper.test_processor_whisper.WhisperProcessorTest.test_feature_extractor with Whisper->SeamlessM4T
+    # Copied from test.models.whisper.test_processing_whisper.WhisperProcessorTest.test_feature_extractor with Whisper->SeamlessM4T
     def test_feature_extractor(self):
         feature_extractor = self.get_feature_extractor()
         tokenizer = self.get_tokenizer()
@@ -91,7 +91,7 @@ class SeamlessM4TProcessorTest(unittest.TestCase):
         for key in input_feat_extract:
             self.assertAlmostEqual(input_feat_extract[key].sum(), input_processor[key].sum(), delta=1e-2)
 
-    # Copied from test.models.whisper.test_processor_whisper.WhisperProcessorTest.test_tokenizer with Whisper->SeamlessM4T
+    # Copied from test.models.whisper.test_processing_whisper.WhisperProcessorTest.test_tokenizer with Whisper->SeamlessM4T
     def test_tokenizer(self):
         feature_extractor = self.get_feature_extractor()
         tokenizer = self.get_tokenizer()
@@ -107,7 +107,7 @@ class SeamlessM4TProcessorTest(unittest.TestCase):
         for key in encoded_tok:
             self.assertListEqual(encoded_tok[key], encoded_processor[key])
 
-    # Copied from test.models.whisper.test_processor_whisper.WhisperProcessorTest.test_tokenizer_decode with Whisper->SeamlessM4T
+    # Copied from test.models.whisper.test_processing_whisper.WhisperProcessorTest.test_tokenizer_decode with Whisper->SeamlessM4T
     def test_tokenizer_decode(self):
         feature_extractor = self.get_feature_extractor()
         tokenizer = self.get_tokenizer()
diff --git a/tests/models/smolvlm/test_processor_smolvlm.py b/tests/models/smolvlm/test_processing_smolvlm.py
similarity index 99%
rename from tests/models/smolvlm/test_processor_smolvlm.py
rename to tests/models/smolvlm/test_processing_smolvlm.py
index 9a75575bd9..88f1c79902 100644
--- a/tests/models/smolvlm/test_processor_smolvlm.py
+++ b/tests/models/smolvlm/test_processing_smolvlm.py
@@ -297,7 +297,7 @@ class SmolVLMProcessorTest(ProcessorTesterMixin, unittest.TestCase):
         self.assertEqual(np.array(inputs["pixel_values"]).shape, (2, 2, 3, 512, 512))
         self.assertEqual(np.array(inputs["pixel_attention_mask"]).shape, (2, 2, 512, 512))
 
-    # Copied from tests.models.idefics2.test_processor_idefics2.Idefics2ProcessorTest.test_process_interleaved_images_prompts_image_error
+    # Copied from tests.models.idefics2.test_processing_idefics2.Idefics2ProcessorTest.test_process_interleaved_images_prompts_image_error
     def test_process_interleaved_images_prompts_image_error(self):
         processor = self.get_processor()
 
diff --git a/tests/models/speech_to_text/test_processor_speech_to_text.py b/tests/models/speech_to_text/test_processing_speech_to_text.py
similarity index 100%
rename from tests/models/speech_to_text/test_processor_speech_to_text.py
rename to tests/models/speech_to_text/test_processing_speech_to_text.py
diff --git a/tests/models/speecht5/test_processor_speecht5.py b/tests/models/speecht5/test_processing_speecht5.py
similarity index 100%
rename from tests/models/speecht5/test_processor_speecht5.py
rename to tests/models/speecht5/test_processing_speecht5.py
diff --git a/tests/models/trocr/test_processor_trocr.py b/tests/models/trocr/test_processing_trocr.py
similarity index 100%
rename from tests/models/trocr/test_processor_trocr.py
rename to tests/models/trocr/test_processing_trocr.py
diff --git a/tests/models/udop/test_processor_udop.py b/tests/models/udop/test_processing_udop.py
similarity index 100%
rename from tests/models/udop/test_processor_udop.py
rename to tests/models/udop/test_processing_udop.py
diff --git a/tests/models/vision_text_dual_encoder/test_processor_vision_text_dual_encoder.py b/tests/models/vision_text_dual_encoder/test_processing_vision_text_dual_encoder.py
similarity index 100%
rename from tests/models/vision_text_dual_encoder/test_processor_vision_text_dual_encoder.py
rename to tests/models/vision_text_dual_encoder/test_processing_vision_text_dual_encoder.py
diff --git a/tests/models/wav2vec2/test_processor_wav2vec2.py b/tests/models/wav2vec2/test_processing_wav2vec2.py
similarity index 100%
rename from tests/models/wav2vec2/test_processor_wav2vec2.py
rename to tests/models/wav2vec2/test_processing_wav2vec2.py
diff --git a/tests/models/wav2vec2_bert/test_processor_wav2vec2_bert.py b/tests/models/wav2vec2_bert/test_processing_wav2vec2_bert.py
similarity index 100%
rename from tests/models/wav2vec2_bert/test_processor_wav2vec2_bert.py
rename to tests/models/wav2vec2_bert/test_processing_wav2vec2_bert.py
diff --git a/tests/models/wav2vec2_with_lm/test_processor_wav2vec2_with_lm.py b/tests/models/wav2vec2_with_lm/test_processing_wav2vec2_with_lm.py
similarity index 100%
rename from tests/models/wav2vec2_with_lm/test_processor_wav2vec2_with_lm.py
rename to tests/models/wav2vec2_with_lm/test_processing_wav2vec2_with_lm.py
diff --git a/tests/models/whisper/test_processor_whisper.py b/tests/models/whisper/test_processing_whisper.py
similarity index 100%
rename from tests/models/whisper/test_processor_whisper.py
rename to tests/models/whisper/test_processing_whisper.py
diff --git a/tests/utils/test_add_new_model_like.py b/tests/utils/test_add_new_model_like.py
index a8e005b6a5..dffe718978 100644
--- a/tests/utils/test_add_new_model_like.py
+++ b/tests/utils/test_add_new_model_like.py
@@ -12,1229 +12,815 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 import os
-import re
+import shutil
 import tempfile
+import textwrap
 import unittest
+from datetime import date
+from pathlib import Path
 
-from transformers.commands.add_new_model_like import (
-    ModelPatterns,
-    _re_class_func,
-    add_content_to_file,
-    add_content_to_text,
-    clean_frameworks_in_init,
-    duplicate_doc_file,
-    duplicate_module,
-    filter_framework_files,
-    find_base_model_checkpoint,
-    get_model_files,
-    get_module_from_file,
-    parse_module_content,
-    replace_model_patterns,
-    retrieve_info_for_model,
-    retrieve_model_classes,
-    simplify_replacements,
-)
+import transformers.commands.add_new_model_like
+from transformers.commands.add_new_model_like import ModelInfos, create_new_model_like
 from transformers.testing_utils import require_torch
 
 
-BERT_MODEL_FILES = {
-    "transformers/models/bert/__init__.py",
-    "transformers/models/bert/configuration_bert.py",
-    "transformers/models/bert/tokenization_bert.py",
-    "transformers/models/bert/tokenization_bert_fast.py",
-    "transformers/models/bert/tokenization_bert_tf.py",
-    "transformers/models/bert/modeling_bert.py",
-    "transformers/models/bert/modeling_flax_bert.py",
-    "transformers/models/bert/modeling_tf_bert.py",
-    "transformers/models/bert/convert_bert_original_tf_checkpoint_to_pytorch.py",
-    "transformers/models/bert/convert_bert_original_tf2_checkpoint_to_pytorch.py",
-    "transformers/models/bert/convert_bert_pytorch_checkpoint_to_original_tf.py",
-    "transformers/models/bert/convert_bert_token_dropping_original_tf2_checkpoint_to_pytorch.py",
-}
-
-VIT_MODEL_FILES = {
-    "transformers/models/vit/__init__.py",
-    "transformers/models/vit/configuration_vit.py",
-    "transformers/models/vit/convert_dino_to_pytorch.py",
-    "transformers/models/vit/convert_vit_timm_to_pytorch.py",
-    "transformers/models/vit/feature_extraction_vit.py",
-    "transformers/models/vit/image_processing_vit.py",
-    "transformers/models/vit/image_processing_vit_fast.py",
-    "transformers/models/vit/modeling_vit.py",
-    "transformers/models/vit/modeling_tf_vit.py",
-    "transformers/models/vit/modeling_flax_vit.py",
-}
-
-WAV2VEC2_MODEL_FILES = {
-    "transformers/models/wav2vec2/__init__.py",
-    "transformers/models/wav2vec2/configuration_wav2vec2.py",
-    "transformers/models/wav2vec2/convert_wav2vec2_original_pytorch_checkpoint_to_pytorch.py",
-    "transformers/models/wav2vec2/convert_wav2vec2_original_s3prl_checkpoint_to_pytorch.py",
-    "transformers/models/wav2vec2/feature_extraction_wav2vec2.py",
-    "transformers/models/wav2vec2/modeling_wav2vec2.py",
-    "transformers/models/wav2vec2/modeling_tf_wav2vec2.py",
-    "transformers/models/wav2vec2/modeling_flax_wav2vec2.py",
-    "transformers/models/wav2vec2/processing_wav2vec2.py",
-    "transformers/models/wav2vec2/tokenization_wav2vec2.py",
-}
-
-
-def get_last_n_components_of_path(path, n):
-    """
-    Get the last `components` of the path. E.g. `get_last_n_components_of_path("/foo/bar/baz", 2)` returns `bar/baz`
-    """
-    return os.path.sep.join(os.path.normpath(path).split(os.path.sep)[-n:])
+REPO_PATH = os.path.dirname(os.path.dirname(os.path.dirname(__file__)))  # tests/utils/<this file> -> repo root
+MODELS_TO_COPY = ("auto", "llama", "phi4_multimodal")  # model folders mirrored into the fake repo by setUpClass
+CURRENT_YEAR = date.today().year
 
 
 @require_torch
 class TestAddNewModelLike(unittest.TestCase):
-    def init_file(self, file_name, content):
-        with open(file_name, "w", encoding="utf-8") as f:
-            f.write(content)
+    @classmethod
+    def setUpClass(cls):
+        """
+        Create a temporary repo with the same structure as Transformers, with only the models in `MODELS_TO_COPY`.
+        """
+        cls.FAKE_REPO = tempfile.mkdtemp()  # a discarded `TemporaryDirectory()` deletes its folder when finalized
+        os.makedirs(os.path.join(cls.FAKE_REPO, "src", "transformers", "models"), exist_ok=True)
+        os.makedirs(os.path.join(cls.FAKE_REPO, "tests", "models"), exist_ok=True)
+        os.makedirs(os.path.join(cls.FAKE_REPO, "docs", "source", "en", "model_doc"), exist_ok=True)
 
-    def check_result(self, file_name, expected_result):
-        with open(file_name, encoding="utf-8") as f:
-            result = f.read()
-            self.assertEqual(result, expected_result)
+        # We need to copy the utils to run the cleanup commands
+        utils_src = os.path.join(REPO_PATH, "utils")
+        shutil.copytree(utils_src, utils_src.replace(REPO_PATH, cls.FAKE_REPO))
+        # Copy the __init__ files
+        model_init = os.path.join(REPO_PATH, "src", "transformers", "models", "__init__.py")
+        shutil.copy(model_init, model_init.replace(REPO_PATH, cls.FAKE_REPO))
+        doc_toc = os.path.join(REPO_PATH, "docs", "source", "en", "_toctree.yml")
+        shutil.copy(doc_toc, doc_toc.replace(REPO_PATH, cls.FAKE_REPO))
+        # We need the pyproject for ruff as well
+        pyproject = os.path.join(REPO_PATH, "pyproject.toml")
+        shutil.copy(pyproject, pyproject.replace(REPO_PATH, cls.FAKE_REPO))
+        # Copy over all the specific model files
+        for model in MODELS_TO_COPY:
+            model_src = os.path.join(REPO_PATH, "src", "transformers", "models", model)
+            shutil.copytree(model_src, model_src.replace(REPO_PATH, cls.FAKE_REPO))
 
-    def test_re_class_func(self):
-        self.assertEqual(_re_class_func.search("def my_function(x, y):").groups()[0], "my_function")
-        self.assertEqual(_re_class_func.search("class MyClass:").groups()[0], "MyClass")
-        self.assertEqual(_re_class_func.search("class MyClass(SuperClass):").groups()[0], "MyClass")
+            test_src = os.path.join(REPO_PATH, "tests", "models", model)
+            shutil.copytree(test_src, test_src.replace(REPO_PATH, cls.FAKE_REPO))
 
-    def test_model_patterns_defaults(self):
-        model_patterns = ModelPatterns("GPT-New new", "huggingface/gpt-new-base")
+            if model != "auto":
+                doc_src = os.path.join(REPO_PATH, "docs", "source", "en", "model_doc", f"{model}.md")
+                shutil.copy(doc_src, doc_src.replace(REPO_PATH, cls.FAKE_REPO))
 
-        self.assertEqual(model_patterns.model_type, "gpt-new-new")
-        self.assertEqual(model_patterns.model_lower_cased, "gpt_new_new")
-        self.assertEqual(model_patterns.model_camel_cased, "GPTNewNew")
-        self.assertEqual(model_patterns.model_upper_cased, "GPT_NEW_NEW")
-        self.assertEqual(model_patterns.config_class, "GPTNewNewConfig")
-        self.assertIsNone(model_patterns.tokenizer_class)
-        self.assertIsNone(model_patterns.feature_extractor_class)
-        self.assertIsNone(model_patterns.processor_class)
+        # Replace the globals
+        cls.ORIGINAL_REPO = transformers.commands.add_new_model_like.REPO_PATH
+        cls.ORIGINAL_TRANSFORMERS_REPO = transformers.commands.add_new_model_like.TRANSFORMERS_PATH
+        transformers.commands.add_new_model_like.REPO_PATH = Path(cls.FAKE_REPO)
+        transformers.commands.add_new_model_like.TRANSFORMERS_PATH = Path(cls.FAKE_REPO) / "src" / "transformers"
 
-    def test_parse_module_content(self):
-        test_code = """SOME_CONSTANT = a constant
+        # For convenience
+        cls.MODEL_PATH = os.path.join(cls.FAKE_REPO, "src", "transformers", "models")
+        cls.TESTS_MODEL_PATH = os.path.join(cls.FAKE_REPO, "tests", "models")
+        cls.DOC_PATH = os.path.join(cls.FAKE_REPO, "docs", "source", "en")
 
-CONSTANT_DEFINED_ON_SEVERAL_LINES = [
-    first_item,
-    second_item
-]
+    @classmethod
+    def tearDownClass(cls):
+        transformers.commands.add_new_model_like.REPO_PATH = cls.ORIGINAL_REPO
+        transformers.commands.add_new_model_like.TRANSFORMERS_PATH = cls.ORIGINAL_TRANSFORMERS_REPO
+        shutil.rmtree(cls.FAKE_REPO, ignore_errors=True)  # actually delete the fake repo from disk
 
-def function(args):
-    some code
+    def assertFileIsEqual(self, text: str, filepath: str):
+        with open(filepath, "r", encoding="utf-8") as f:  # explicit encoding: don't depend on the platform locale
+            file_text = f.read()
+        self.assertEqual(file_text.strip(), text.strip())
 
-# Copied from transformers.some_module
-class SomeClass:
-    some code
-"""
+    def assertInFile(self, text: str, filepath: str):
+        with open(filepath, "r", encoding="utf-8") as f:  # explicit encoding: don't depend on the platform locale
+            file_text = f.read()
+        self.assertIn(text, file_text)  # reports both operands on failure, unlike assertTrue
 
-        expected_parts = [
-            "SOME_CONSTANT = a constant\n",
-            "CONSTANT_DEFINED_ON_SEVERAL_LINES = [\n    first_item,\n    second_item\n]",
-            "",
-            "def function(args):\n    some code\n",
-            "# Copied from transformers.some_module\nclass SomeClass:\n    some code\n",
-        ]
-        self.assertEqual(parse_module_content(test_code), expected_parts)
-
-    def test_add_content_to_text(self):
-        test_text = """all_configs = {
-    "gpt": "GPTConfig",
-    "bert": "BertConfig",
-    "t5": "T5Config",
-}"""
-
-        expected = """all_configs = {
-    "gpt": "GPTConfig",
-    "gpt2": "GPT2Config",
-    "bert": "BertConfig",
-    "t5": "T5Config",
-}"""
-        line = '    "gpt2": "GPT2Config",'
-
-        self.assertEqual(add_content_to_text(test_text, line, add_before="bert"), expected)
-        self.assertEqual(add_content_to_text(test_text, line, add_before="bert", exact_match=True), test_text)
-        self.assertEqual(
-            add_content_to_text(test_text, line, add_before='    "bert": "BertConfig",', exact_match=True), expected
+    def test_llama_without_tokenizers(self):
+        # This is the structure without adding the tokenizers
+        filenames_to_add = (
+            ("configuration_llama.py", True),
+            ("modeling_llama.py", True),
+            ("tokenization_llama.py", False),
+            ("tokenization_llama_fast.py", False),
+            ("image_processing_llama.py", False),
+            ("image_processing_llama_fast.py", False),
+            ("video_processing_llama.py", False),
+            ("feature_extraction_llama.py", False),
+            ("processing_llama.py", False),
         )
-        self.assertEqual(add_content_to_text(test_text, line, add_before=re.compile(r'^\s*"bert":')), expected)
-
-        self.assertEqual(add_content_to_text(test_text, line, add_after="gpt"), expected)
-        self.assertEqual(add_content_to_text(test_text, line, add_after="gpt", exact_match=True), test_text)
-        self.assertEqual(
-            add_content_to_text(test_text, line, add_after='    "gpt": "GPTConfig",', exact_match=True), expected
-        )
-        self.assertEqual(add_content_to_text(test_text, line, add_after=re.compile(r'^\s*"gpt":')), expected)
-
-    def test_add_content_to_file(self):
-        test_text = """all_configs = {
-    "gpt": "GPTConfig",
-    "bert": "BertConfig",
-    "t5": "T5Config",
-}"""
-
-        expected = """all_configs = {
-    "gpt": "GPTConfig",
-    "gpt2": "GPT2Config",
-    "bert": "BertConfig",
-    "t5": "T5Config",
-}"""
-        line = '    "gpt2": "GPT2Config",'
-
-        with tempfile.TemporaryDirectory() as tmp_dir:
-            file_name = os.path.join(tmp_dir, "code.py")
-
-            self.init_file(file_name, test_text)
-            add_content_to_file(file_name, line, add_before="bert")
-            self.check_result(file_name, expected)
-
-            self.init_file(file_name, test_text)
-            add_content_to_file(file_name, line, add_before="bert", exact_match=True)
-            self.check_result(file_name, test_text)
-
-            self.init_file(file_name, test_text)
-            add_content_to_file(file_name, line, add_before='    "bert": "BertConfig",', exact_match=True)
-            self.check_result(file_name, expected)
-
-            self.init_file(file_name, test_text)
-            add_content_to_file(file_name, line, add_before=re.compile(r'^\s*"bert":'))
-            self.check_result(file_name, expected)
-
-            self.init_file(file_name, test_text)
-            add_content_to_file(file_name, line, add_after="gpt")
-            self.check_result(file_name, expected)
-
-            self.init_file(file_name, test_text)
-            add_content_to_file(file_name, line, add_after="gpt", exact_match=True)
-            self.check_result(file_name, test_text)
-
-            self.init_file(file_name, test_text)
-            add_content_to_file(file_name, line, add_after='    "gpt": "GPTConfig",', exact_match=True)
-            self.check_result(file_name, expected)
-
-            self.init_file(file_name, test_text)
-            add_content_to_file(file_name, line, add_after=re.compile(r'^\s*"gpt":'))
-            self.check_result(file_name, expected)
-
-    def test_simplify_replacements(self):
-        self.assertEqual(simplify_replacements([("Bert", "NewBert")]), [("Bert", "NewBert")])
-        self.assertEqual(
-            simplify_replacements([("Bert", "NewBert"), ("bert", "new-bert")]),
-            [("Bert", "NewBert"), ("bert", "new-bert")],
-        )
-        self.assertEqual(
-            simplify_replacements([("BertConfig", "NewBertConfig"), ("Bert", "NewBert"), ("bert", "new-bert")]),
-            [("Bert", "NewBert"), ("bert", "new-bert")],
+        # Run the command
+        create_new_model_like(
+            old_model_infos=ModelInfos("llama"),
+            new_lowercase_name="my_test",
+            new_model_paper_name="MyTest",
+            filenames_to_add=filenames_to_add,
+            create_fast_image_processor=False,
         )
 
-    def test_replace_model_patterns(self):
-        bert_model_patterns = ModelPatterns("Bert", "google-bert/bert-base-cased")
-        new_bert_model_patterns = ModelPatterns("New Bert", "huggingface/bert-new-base")
-        bert_test = '''class TFBertPreTrainedModel(PreTrainedModel):
-    """
-    An abstract class to handle weights initialization and a simple interface for downloading and loading pretrained
-    models.
-    """
+        # First assert that all files were created correctly
+        model_repo = os.path.join(self.MODEL_PATH, "my_test")
+        tests_repo = os.path.join(self.TESTS_MODEL_PATH, "my_test")
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "modular_my_test.py")))
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "modeling_my_test.py")))
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "configuration_my_test.py")))
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "__init__.py")))
+        self.assertTrue(os.path.isfile(os.path.join(self.DOC_PATH, "model_doc", "my_test.md")))
+        self.assertTrue(os.path.isfile(os.path.join(tests_repo, "__init__.py")))
+        self.assertTrue(os.path.isfile(os.path.join(tests_repo, "test_modeling_my_test.py")))
 
-    config_class = BertConfig
-    load_tf_weights = load_tf_weights_in_bert
-    base_model_prefix = "bert"
-    is_parallelizable = True
-    supports_gradient_checkpointing = True
-    model_type = "bert"
-
-BERT_CONSTANT = "value"
-'''
-        bert_expected = '''class TFNewBertPreTrainedModel(PreTrainedModel):
-    """
-    An abstract class to handle weights initialization and a simple interface for downloading and loading pretrained
-    models.
-    """
-
-    config_class = NewBertConfig
-    load_tf_weights = load_tf_weights_in_new_bert
-    base_model_prefix = "new_bert"
-    is_parallelizable = True
-    supports_gradient_checkpointing = True
-    model_type = "new-bert"
-
-NEW_BERT_CONSTANT = "value"
-'''
-
-        bert_converted, replacements = replace_model_patterns(bert_test, bert_model_patterns, new_bert_model_patterns)
-        self.assertEqual(bert_converted, bert_expected)
-        # Replacements are empty here since bert as been replaced by bert_new in some instances and bert-new
-        # in others.
-        self.assertEqual(replacements, "")
-
-        # If we remove the model type, we will get replacements
-        bert_test = bert_test.replace('    model_type = "bert"\n', "")
-        bert_expected = bert_expected.replace('    model_type = "new-bert"\n', "")
-        bert_converted, replacements = replace_model_patterns(bert_test, bert_model_patterns, new_bert_model_patterns)
-        self.assertEqual(bert_converted, bert_expected)
-        self.assertEqual(replacements, "BERT->NEW_BERT,Bert->NewBert,bert->new_bert")
-
-        gpt_model_patterns = ModelPatterns("GPT2", "gpt2")
-        new_gpt_model_patterns = ModelPatterns("GPT-New new", "huggingface/gpt-new-base")
-        gpt_test = '''class GPT2PreTrainedModel(PreTrainedModel):
-    """
-    An abstract class to handle weights initialization and a simple interface for downloading and loading pretrained
-    models.
-    """
-
-    config_class = GPT2Config
-    load_tf_weights = load_tf_weights_in_gpt2
-    base_model_prefix = "transformer"
-    is_parallelizable = True
-    supports_gradient_checkpointing = True
-
-GPT2_CONSTANT = "value"
-'''
-
-        gpt_expected = '''class GPTNewNewPreTrainedModel(PreTrainedModel):
-    """
-    An abstract class to handle weights initialization and a simple interface for downloading and loading pretrained
-    models.
-    """
-
-    config_class = GPTNewNewConfig
-    load_tf_weights = load_tf_weights_in_gpt_new_new
-    base_model_prefix = "transformer"
-    is_parallelizable = True
-    supports_gradient_checkpointing = True
-
-GPT_NEW_NEW_CONSTANT = "value"
-'''
-
-        gpt_converted, replacements = replace_model_patterns(gpt_test, gpt_model_patterns, new_gpt_model_patterns)
-        self.assertEqual(gpt_converted, gpt_expected)
-        # Replacements are empty here since GPT2 as been replaced by GPTNewNew in some instances and GPT_NEW_NEW
-        # in others.
-        self.assertEqual(replacements, "")
-
-        roberta_model_patterns = ModelPatterns("RoBERTa", "FacebookAI/roberta-base", model_camel_cased="Roberta")
-        new_roberta_model_patterns = ModelPatterns(
-            "RoBERTa-New", "huggingface/roberta-new-base", model_camel_cased="RobertaNew"
+        # Now assert the correct imports/auto mappings/toctree were added
+        self.assertInFile(
+            "from .my_test import *\n",
+            os.path.join(self.MODEL_PATH, "__init__.py"),
         )
-        roberta_test = '''# Copied from transformers.models.bert.BertModel with Bert->Roberta
-class RobertaModel(RobertaPreTrainedModel):
-    """ The base RoBERTa model. """
-    checkpoint = FacebookAI/roberta-base
-    base_model_prefix = "roberta"
-        '''
-        roberta_expected = '''# Copied from transformers.models.bert.BertModel with Bert->RobertaNew
-class RobertaNewModel(RobertaNewPreTrainedModel):
-    """ The base RoBERTa-New model. """
-    checkpoint = huggingface/roberta-new-base
-    base_model_prefix = "roberta_new"
-        '''
-        roberta_converted, replacements = replace_model_patterns(
-            roberta_test, roberta_model_patterns, new_roberta_model_patterns
+        self.assertInFile(
+            '("my_test", "MyTestConfig"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "configuration_auto.py"),
         )
-        self.assertEqual(roberta_converted, roberta_expected)
-
-    def test_get_module_from_file(self):
-        self.assertEqual(
-            get_module_from_file("/git/transformers/src/transformers/models/bert/modeling_tf_bert.py"),
-            "transformers.models.bert.modeling_tf_bert",
+        self.assertInFile(
+            '("my_test", "MyTest"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "configuration_auto.py"),
         )
-        self.assertEqual(
-            get_module_from_file("/transformers/models/gpt2/modeling_gpt2.py"),
-            "transformers.models.gpt2.modeling_gpt2",
+        self.assertInFile(
+            '("my_test", "MyTestModel"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "modeling_auto.py"),
         )
-        with self.assertRaises(ValueError):
-            get_module_from_file("/models/gpt2/modeling_gpt2.py")
-
-    def test_duplicate_module(self):
-        bert_model_patterns = ModelPatterns("Bert", "google-bert/bert-base-cased")
-        new_bert_model_patterns = ModelPatterns("New Bert", "huggingface/bert-new-base")
-        bert_test = '''class TFBertPreTrainedModel(PreTrainedModel):
-    """
-    An abstract class to handle weights initialization and a simple interface for downloading and loading pretrained
-    models.
-    """
-
-    config_class = BertConfig
-    load_tf_weights = load_tf_weights_in_bert
-    base_model_prefix = "bert"
-    is_parallelizable = True
-    supports_gradient_checkpointing = True
-
-BERT_CONSTANT = "value"
-'''
-        bert_expected = '''class TFNewBertPreTrainedModel(PreTrainedModel):
-    """
-    An abstract class to handle weights initialization and a simple interface for downloading and loading pretrained
-    models.
-    """
-
-    config_class = NewBertConfig
-    load_tf_weights = load_tf_weights_in_new_bert
-    base_model_prefix = "new_bert"
-    is_parallelizable = True
-    supports_gradient_checkpointing = True
-
-NEW_BERT_CONSTANT = "value"
-'''
-        bert_expected_with_copied_from = (
-            "# Copied from transformers.bert_module.TFBertPreTrainedModel with Bert->NewBert,bert->new_bert\n"
-            + bert_expected
+        self.assertInFile(
+            '("my_test", "MyTestForCausalLM"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "modeling_auto.py"),
         )
-        with tempfile.TemporaryDirectory() as tmp_dir:
-            work_dir = os.path.join(tmp_dir, "transformers")
-            os.makedirs(work_dir)
-            file_name = os.path.join(work_dir, "bert_module.py")
-            dest_file_name = os.path.join(work_dir, "new_bert_module.py")
-
-            self.init_file(file_name, bert_test)
-            duplicate_module(file_name, bert_model_patterns, new_bert_model_patterns)
-            self.check_result(dest_file_name, bert_expected_with_copied_from)
-
-            self.init_file(file_name, bert_test)
-            duplicate_module(file_name, bert_model_patterns, new_bert_model_patterns, add_copied_from=False)
-            self.check_result(dest_file_name, bert_expected)
-
-    def test_duplicate_module_with_copied_from(self):
-        bert_model_patterns = ModelPatterns("Bert", "google-bert/bert-base-cased")
-        new_bert_model_patterns = ModelPatterns("New Bert", "huggingface/bert-new-base")
-        bert_test = '''# Copied from transformers.models.xxx.XxxModel with Xxx->Bert
-class TFBertPreTrainedModel(PreTrainedModel):
-    """
-    An abstract class to handle weights initialization and a simple interface for downloading and loading pretrained
-    models.
-    """
-
-    config_class = BertConfig
-    load_tf_weights = load_tf_weights_in_bert
-    base_model_prefix = "bert"
-    is_parallelizable = True
-    supports_gradient_checkpointing = True
-
-BERT_CONSTANT = "value"
-'''
-        bert_expected = '''# Copied from transformers.models.xxx.XxxModel with Xxx->NewBert
-class TFNewBertPreTrainedModel(PreTrainedModel):
-    """
-    An abstract class to handle weights initialization and a simple interface for downloading and loading pretrained
-    models.
-    """
-
-    config_class = NewBertConfig
-    load_tf_weights = load_tf_weights_in_new_bert
-    base_model_prefix = "new_bert"
-    is_parallelizable = True
-    supports_gradient_checkpointing = True
-
-NEW_BERT_CONSTANT = "value"
-'''
-        with tempfile.TemporaryDirectory() as tmp_dir:
-            work_dir = os.path.join(tmp_dir, "transformers")
-            os.makedirs(work_dir)
-            file_name = os.path.join(work_dir, "bert_module.py")
-            dest_file_name = os.path.join(work_dir, "new_bert_module.py")
-
-            self.init_file(file_name, bert_test)
-            duplicate_module(file_name, bert_model_patterns, new_bert_model_patterns)
-            # There should not be a new Copied from statement, the old one should be adapted.
-            self.check_result(dest_file_name, bert_expected)
-
-            self.init_file(file_name, bert_test)
-            duplicate_module(file_name, bert_model_patterns, new_bert_model_patterns, add_copied_from=False)
-            self.check_result(dest_file_name, bert_expected)
-
-    def test_filter_framework_files(self):
-        files = ["modeling_bert.py", "modeling_tf_bert.py", "modeling_flax_bert.py", "configuration_bert.py"]
-        self.assertEqual(set(filter_framework_files(files, ["pt", "tf", "flax"])), set(files))
-
-        self.assertEqual(set(filter_framework_files(files, ["pt"])), {"modeling_bert.py", "configuration_bert.py"})
-        self.assertEqual(set(filter_framework_files(files, ["tf"])), {"modeling_tf_bert.py", "configuration_bert.py"})
-        self.assertEqual(
-            set(filter_framework_files(files, ["flax"])), {"modeling_flax_bert.py", "configuration_bert.py"}
+        self.assertInFile(
+            '("my_test", "MyTestForSequenceClassification"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "modeling_auto.py"),
+        )
+        self.assertInFile(
+            '("my_test", "MyTestForQuestionAnswering"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "modeling_auto.py"),
+        )
+        self.assertInFile(
+            '("my_test", "MyTestForTokenClassification"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "modeling_auto.py"),
+        )
+        self.assertInFile(
+            "- local: model_doc/my_test\n        title: MyTest\n",
+            os.path.join(self.DOC_PATH, "_toctree.yml"),
         )
 
-        self.assertEqual(
-            set(filter_framework_files(files, ["pt", "tf"])),
-            {"modeling_tf_bert.py", "modeling_bert.py", "configuration_bert.py"},
-        )
-        self.assertEqual(
-            set(filter_framework_files(files, ["tf", "flax"])),
-            {"modeling_tf_bert.py", "modeling_flax_bert.py", "configuration_bert.py"},
-        )
-        self.assertEqual(
-            set(filter_framework_files(files, ["pt", "flax"])),
-            {"modeling_bert.py", "modeling_flax_bert.py", "configuration_bert.py"},
-        )
-
-    def test_get_model_files_only_pt(self):
-        # BERT
-        bert_files = get_model_files("bert", frameworks=["pt"])
-
-        doc_file = get_last_n_components_of_path(bert_files["doc_file"], n=5)
-        self.assertEqual(doc_file, "docs/source/en/model_doc/bert.md")
-
-        model_files = {get_last_n_components_of_path(f, n=4) for f in bert_files["model_files"]}
-        bert_model_files = BERT_MODEL_FILES - {
-            "transformers/models/bert/modeling_tf_bert.py",
-            "transformers/models/bert/modeling_flax_bert.py",
-        }
-        self.assertEqual(model_files, bert_model_files)
-
-        self.assertEqual(bert_files["module_name"], "bert")
-
-        # TODO: failing in CI, fix me
-        # test_files = {get_last_n_components_of_path(f, n=4) for f in bert_files["test_files"]}
-        # bert_test_files = {
-        #     "tests/models/bert/test_tokenization_bert.py",
-        #     "tests/models/bert/test_modeling_bert.py",
-        # }
-        # self.assertEqual(test_files, bert_test_files)
-
-        # VIT
-        vit_files = get_model_files("vit", frameworks=["pt"])
-        doc_file = get_last_n_components_of_path(vit_files["doc_file"], n=5)
-        self.assertEqual(doc_file, "docs/source/en/model_doc/vit.md")
-
-        model_files = {get_last_n_components_of_path(f, n=4) for f in vit_files["model_files"]}
-        vit_model_files = VIT_MODEL_FILES - {
-            "transformers/models/vit/modeling_tf_vit.py",
-            "transformers/models/vit/modeling_flax_vit.py",
-        }
-        self.assertEqual(model_files, vit_model_files)
-
-        self.assertEqual(vit_files["module_name"], "vit")
-
-        # TODO: failing in CI, fix me
-        # test_files = {get_last_n_components_of_path(f, n=4) for f in vit_files["test_files"]}
-        # vit_test_files = {
-        #     "tests/models/vit/test_image_processing_vit.py",
-        #     "tests/models/vit/test_modeling_vit.py",
-        # }
-        # self.assertEqual(test_files, vit_test_files)
-
-        # Wav2Vec2
-        wav2vec2_files = get_model_files("wav2vec2", frameworks=["pt"])
-        doc_file = get_last_n_components_of_path(wav2vec2_files["doc_file"], n=5)
-        self.assertEqual(doc_file, "docs/source/en/model_doc/wav2vec2.md")
-
-        model_files = {get_last_n_components_of_path(f, n=4) for f in wav2vec2_files["model_files"]}
-        wav2vec2_model_files = WAV2VEC2_MODEL_FILES - {
-            "transformers/models/wav2vec2/modeling_tf_wav2vec2.py",
-            "transformers/models/wav2vec2/modeling_flax_wav2vec2.py",
-        }
-        self.assertEqual(model_files, wav2vec2_model_files)
-
-        self.assertEqual(wav2vec2_files["module_name"], "wav2vec2")
-
-        # TODO: failing in CI, fix me
-        # test_files = {get_last_n_components_of_path(f, n=4) for f in wav2vec2_files["test_files"]}
-        # wav2vec2_test_files = {
-        #     "tests/models/wav2vec2/test_feature_extraction_wav2vec2.py",
-        #     "tests/models/wav2vec2/test_modeling_wav2vec2.py",
-        #     "tests/models/wav2vec2/test_processor_wav2vec2.py",
-        #     "tests/models/wav2vec2/test_tokenization_wav2vec2.py",
-        # }
-        # self.assertEqual(test_files, wav2vec2_test_files)
-
-    def test_find_base_model_checkpoint(self):
-        self.assertEqual(find_base_model_checkpoint("bert"), "google-bert/bert-base-uncased")
-        self.assertEqual(find_base_model_checkpoint("gpt2"), "openai-community/gpt2")
-
-    def test_retrieve_model_classes(self):
-        gpt_classes = {k: set(v) for k, v in retrieve_model_classes("gpt2", frameworks=["pt"]).items()}
-        expected_gpt_classes = {
-            "pt": {
-                "GPT2ForTokenClassification",
-                "GPT2Model",
-                "GPT2LMHeadModel",
-                "GPT2ForSequenceClassification",
-                "GPT2ForQuestionAnswering",
-            },
-        }
-        self.assertEqual(gpt_classes, expected_gpt_classes)
-
-    def test_retrieve_info_for_model_with_bert(self):
-        bert_info = retrieve_info_for_model("bert", frameworks=["pt"])
-        bert_classes = [
-            "BertForTokenClassification",
-            "BertForQuestionAnswering",
-            "BertForNextSentencePrediction",
-            "BertForSequenceClassification",
-            "BertForMaskedLM",
-            "BertForMultipleChoice",
-            "BertModel",
-            "BertForPreTraining",
-            "BertLMHeadModel",
-        ]
-        expected_model_classes = {
-            "pt": set(bert_classes),
-        }
-
-        self.assertEqual(set(bert_info["frameworks"]), {"pt"})
-        model_classes = {k: set(v) for k, v in bert_info["model_classes"].items()}
-        self.assertEqual(model_classes, expected_model_classes)
-
-        all_bert_files = bert_info["model_files"]
-        model_files = {get_last_n_components_of_path(f, 4) for f in all_bert_files["model_files"]}
-        bert_model_files = BERT_MODEL_FILES - {
-            "transformers/models/bert/modeling_tf_bert.py",
-            "transformers/models/bert/modeling_flax_bert.py",
-        }
-        self.assertEqual(model_files, bert_model_files)
-
-        # TODO: failing in CI, fix me
-        # test_files = {get_last_n_components_of_path(f, n=4) for f in all_bert_files["test_files"]}
-        # bert_test_files = {
-        #     "tests/models/bert/test_tokenization_bert.py",
-        #     "tests/models/bert/test_modeling_bert.py",
-        # }
-        # self.assertEqual(test_files, bert_test_files)
-
-        doc_file = get_last_n_components_of_path(all_bert_files["doc_file"], n=5)
-        self.assertEqual(doc_file, "docs/source/en/model_doc/bert.md")
-
-        self.assertEqual(all_bert_files["module_name"], "bert")
-
-        bert_model_patterns = bert_info["model_patterns"]
-        self.assertEqual(bert_model_patterns.model_name, "BERT")
-        self.assertEqual(bert_model_patterns.checkpoint, "google-bert/bert-base-uncased")
-        self.assertEqual(bert_model_patterns.model_type, "bert")
-        self.assertEqual(bert_model_patterns.model_lower_cased, "bert")
-        self.assertEqual(bert_model_patterns.model_camel_cased, "Bert")
-        self.assertEqual(bert_model_patterns.model_upper_cased, "BERT")
-        self.assertEqual(bert_model_patterns.config_class, "BertConfig")
-        self.assertEqual(bert_model_patterns.tokenizer_class, "BertTokenizer")
-        self.assertIsNone(bert_model_patterns.feature_extractor_class)
-        self.assertIsNone(bert_model_patterns.processor_class)
-
-    def test_retrieve_info_for_model_with_vit(self):
-        vit_info = retrieve_info_for_model("vit", frameworks=["pt"])
-        vit_classes = ["ViTForImageClassification", "ViTModel"]
-        pt_only_classes = ["ViTForMaskedImageModeling"]
-        expected_model_classes = {
-            "pt": set(vit_classes + pt_only_classes),
-        }
-
-        self.assertEqual(set(vit_info["frameworks"]), {"pt"})
-        model_classes = {k: set(v) for k, v in vit_info["model_classes"].items()}
-        self.assertEqual(model_classes, expected_model_classes)
-
-        all_vit_files = vit_info["model_files"]
-        model_files = {get_last_n_components_of_path(f, 4) for f in all_vit_files["model_files"]}
-        vit_model_files = VIT_MODEL_FILES - {
-            "transformers/models/vit/modeling_tf_vit.py",
-            "transformers/models/vit/modeling_flax_vit.py",
-        }
-        self.assertEqual(model_files, vit_model_files)
-
-        # TODO: failing in CI, fix me
-        # test_files = {get_last_n_components_of_path(f, n=4) for f in all_vit_files["test_files"]}
-        # vit_test_files = {
-        #     "tests/models/vit/test_image_processing_vit.py",
-        #     "tests/models/vit/test_modeling_vit.py",
-        # }
-        # self.assertEqual(test_files, vit_test_files)
-
-        doc_file = get_last_n_components_of_path(all_vit_files["doc_file"], n=5)
-        self.assertEqual(doc_file, "docs/source/en/model_doc/vit.md")
-
-        self.assertEqual(all_vit_files["module_name"], "vit")
-
-        vit_model_patterns = vit_info["model_patterns"]
-        self.assertEqual(vit_model_patterns.model_name, "ViT")
-        self.assertEqual(vit_model_patterns.checkpoint, "google/vit-base-patch16-224")
-        self.assertEqual(vit_model_patterns.model_type, "vit")
-        self.assertEqual(vit_model_patterns.model_lower_cased, "vit")
-        self.assertEqual(vit_model_patterns.model_camel_cased, "ViT")
-        self.assertEqual(vit_model_patterns.model_upper_cased, "VIT")
-        self.assertEqual(vit_model_patterns.config_class, "ViTConfig")
-        self.assertEqual(vit_model_patterns.feature_extractor_class, "ViTFeatureExtractor")
-        self.assertEqual(vit_model_patterns.image_processor_class, "ViTImageProcessor")
-        self.assertIsNone(vit_model_patterns.tokenizer_class)
-        self.assertIsNone(vit_model_patterns.processor_class)
-
-    def test_retrieve_info_for_model_with_wav2vec2(self):
-        wav2vec2_info = retrieve_info_for_model("wav2vec2", frameworks=["pt"])
-        wav2vec2_classes = [
-            "Wav2Vec2Model",
-            "Wav2Vec2ForPreTraining",
-            "Wav2Vec2ForAudioFrameClassification",
-            "Wav2Vec2ForCTC",
-            "Wav2Vec2ForMaskedLM",
-            "Wav2Vec2ForSequenceClassification",
-            "Wav2Vec2ForXVector",
-        ]
-        expected_model_classes = {
-            "pt": set(wav2vec2_classes),
-        }
-
-        self.assertEqual(set(wav2vec2_info["frameworks"]), {"pt"})
-        model_classes = {k: set(v) for k, v in wav2vec2_info["model_classes"].items()}
-        self.assertEqual(model_classes, expected_model_classes)
-
-        all_wav2vec2_files = wav2vec2_info["model_files"]
-        model_files = {get_last_n_components_of_path(f, 4) for f in all_wav2vec2_files["model_files"]}
-        wav2vec2_model_files = WAV2VEC2_MODEL_FILES - {
-            "transformers/models/wav2vec2/modeling_tf_wav2vec2.py",
-            "transformers/models/wav2vec2/modeling_flax_wav2vec2.py",
-        }
-        self.assertEqual(model_files, wav2vec2_model_files)
-
-        # TODO: failing in CI, fix me
-        # test_files = {get_last_n_components_of_path(f, n=4) for f in all_wav2vec2_files["test_files"]}
-        # wav2vec2_test_files = {
-        #     "tests/models/wav2vec2/test_feature_extraction_wav2vec2.py",
-        #     "tests/models/wav2vec2/test_modeling_wav2vec2.py",
-        #     "tests/models/wav2vec2/test_processor_wav2vec2.py",
-        #     "tests/models/wav2vec2/test_tokenization_wav2vec2.py",
-        # }
-        # self.assertEqual(test_files, wav2vec2_test_files)
-
-        doc_file = get_last_n_components_of_path(all_wav2vec2_files["doc_file"], n=5)
-        self.assertEqual(doc_file, "docs/source/en/model_doc/wav2vec2.md")
-
-        self.assertEqual(all_wav2vec2_files["module_name"], "wav2vec2")
-
-        wav2vec2_model_patterns = wav2vec2_info["model_patterns"]
-        self.assertEqual(wav2vec2_model_patterns.model_name, "Wav2Vec2")
-        self.assertEqual(wav2vec2_model_patterns.checkpoint, "facebook/wav2vec2-base-960h")
-        self.assertEqual(wav2vec2_model_patterns.model_type, "wav2vec2")
-        self.assertEqual(wav2vec2_model_patterns.model_lower_cased, "wav2vec2")
-        self.assertEqual(wav2vec2_model_patterns.model_camel_cased, "Wav2Vec2")
-        self.assertEqual(wav2vec2_model_patterns.model_upper_cased, "WAV2VEC2")
-        self.assertEqual(wav2vec2_model_patterns.config_class, "Wav2Vec2Config")
-        self.assertEqual(wav2vec2_model_patterns.feature_extractor_class, "Wav2Vec2FeatureExtractor")
-        self.assertEqual(wav2vec2_model_patterns.processor_class, "Wav2Vec2Processor")
-        self.assertEqual(wav2vec2_model_patterns.tokenizer_class, "Wav2Vec2CTCTokenizer")
-
-    def test_clean_frameworks_in_init_with_gpt(self):
-        test_init = """
-from typing import TYPE_CHECKING
-
-from ...utils import _LazyModule, is_flax_available, is_tf_available, is_tokenizers_available, is_torch_available
-
-_import_structure = {
-    "configuration_gpt2": ["GPT2Config", "GPT2OnnxConfig"],
-    "tokenization_gpt2": ["GPT2Tokenizer"],
-}
-
-try:
-    if not is_tokenizers_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["tokenization_gpt2_fast"] = ["GPT2TokenizerFast"]
-
-try:
-    if not is_torch_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["modeling_gpt2"] = ["GPT2Model"]
-
-try:
-    if not is_tf_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["modeling_tf_gpt2"] = ["TFGPT2Model"]
-
-try:
-    if not is_flax_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["modeling_flax_gpt2"] = ["FlaxGPT2Model"]
-
-if TYPE_CHECKING:
-    from .configuration_gpt2 import GPT2Config, GPT2OnnxConfig
-    from .tokenization_gpt2 import GPT2Tokenizer
-
-    try:
-        if not is_tokenizers_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .tokenization_gpt2_fast import GPT2TokenizerFast
-
-    try:
-        if not is_torch_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .modeling_gpt2 import GPT2Model
-
-    try:
-        if not is_tf_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .modeling_tf_gpt2 import TFGPT2Model
-
-    try:
-        if not is_flax_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .modeling_flax_gpt2 import FlaxGPT2Model
-
-else:
-    import sys
-
-    sys.modules[__name__] = _LazyModule(__name__, globals()["__file__"], _import_structure)
-"""
-
-        init_pt_only = """
-from typing import TYPE_CHECKING
-
-from ...utils import _LazyModule, is_tokenizers_available, is_torch_available
-
-_import_structure = {
-    "configuration_gpt2": ["GPT2Config", "GPT2OnnxConfig"],
-    "tokenization_gpt2": ["GPT2Tokenizer"],
-}
-
-try:
-    if not is_tokenizers_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["tokenization_gpt2_fast"] = ["GPT2TokenizerFast"]
-
-try:
-    if not is_torch_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["modeling_gpt2"] = ["GPT2Model"]
-
-if TYPE_CHECKING:
-    from .configuration_gpt2 import GPT2Config, GPT2OnnxConfig
-    from .tokenization_gpt2 import GPT2Tokenizer
-
-    try:
-        if not is_tokenizers_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .tokenization_gpt2_fast import GPT2TokenizerFast
-
-    try:
-        if not is_torch_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .modeling_gpt2 import GPT2Model
-
-else:
-    import sys
-
-    sys.modules[__name__] = _LazyModule(__name__, globals()["__file__"], _import_structure)
-"""
-
-        init_pt_only_no_tokenizer = """
-from typing import TYPE_CHECKING
-
-from ...utils import _LazyModule, is_torch_available
-
-_import_structure = {
-    "configuration_gpt2": ["GPT2Config", "GPT2OnnxConfig"],
-}
-
-try:
-    if not is_torch_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["modeling_gpt2"] = ["GPT2Model"]
-
-if TYPE_CHECKING:
-    from .configuration_gpt2 import GPT2Config, GPT2OnnxConfig
-
-    try:
-        if not is_torch_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .modeling_gpt2 import GPT2Model
-
-else:
-    import sys
-
-    sys.modules[__name__] = _LazyModule(__name__, globals()["__file__"], _import_structure)
-"""
-
-        with tempfile.TemporaryDirectory() as tmp_dir:
-            file_name = os.path.join(tmp_dir, "../__init__.py")
-
-            self.init_file(file_name, test_init)
-            clean_frameworks_in_init(file_name, frameworks=["pt"])
-            self.check_result(file_name, init_pt_only)
-
-            self.init_file(file_name, test_init)
-            clean_frameworks_in_init(file_name, frameworks=["pt"], keep_processing=False)
-            self.check_result(file_name, init_pt_only_no_tokenizer)
-
-    def test_clean_frameworks_in_init_with_vit(self):
-        test_init = """
-from typing import TYPE_CHECKING
-
-from ...utils import _LazyModule, is_flax_available, is_tf_available, is_torch_available, is_vision_available
-
-_import_structure = {
-    "configuration_vit": ["ViTConfig"],
-}
-
-try:
-    if not is_vision_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["image_processing_vit"] = ["ViTImageProcessor"]
-
-try:
-    if not is_torch_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["modeling_vit"] = ["ViTModel"]
-
-try:
-    if not is_tf_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["modeling_tf_vit"] = ["TFViTModel"]
-
-try:
-    if not is_flax_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["modeling_flax_vit"] = ["FlaxViTModel"]
-
-if TYPE_CHECKING:
-    from .configuration_vit import ViTConfig
-
-    try:
-        if not is_vision_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .image_processing_vit import ViTImageProcessor
-
-    try:
-        if not is_torch_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .modeling_vit import ViTModel
-
-    try:
-        if not is_tf_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .modeling_tf_vit import TFViTModel
-
-    try:
-        if not is_flax_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .modeling_flax_vit import FlaxViTModel
-
-else:
-    import sys
-
-    sys.modules[__name__] = _LazyModule(__name__, globals()["__file__"], _import_structure)
-"""
-
-        init_pt_only = """
-from typing import TYPE_CHECKING
-
-from ...utils import _LazyModule, is_torch_available, is_vision_available
-
-_import_structure = {
-    "configuration_vit": ["ViTConfig"],
-}
-
-try:
-    if not is_vision_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["image_processing_vit"] = ["ViTImageProcessor"]
-
-try:
-    if not is_torch_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["modeling_vit"] = ["ViTModel"]
-
-if TYPE_CHECKING:
-    from .configuration_vit import ViTConfig
-
-    try:
-        if not is_vision_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .image_processing_vit import ViTImageProcessor
-
-    try:
-        if not is_torch_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .modeling_vit import ViTModel
-
-else:
-    import sys
-
-    sys.modules[__name__] = _LazyModule(__name__, globals()["__file__"], _import_structure)
-"""
-
-        init_pt_only_no_feature_extractor = """
-from typing import TYPE_CHECKING
-
-from ...utils import _LazyModule, is_torch_available
-
-_import_structure = {
-    "configuration_vit": ["ViTConfig"],
-}
-
-try:
-    if not is_torch_available():
-        raise OptionalDependencyNotAvailable()
-except OptionalDependencyNotAvailable:
-    pass
-else:
-    _import_structure["modeling_vit"] = ["ViTModel"]
-
-if TYPE_CHECKING:
-    from .configuration_vit import ViTConfig
-
-    try:
-        if not is_torch_available():
-            raise OptionalDependencyNotAvailable()
-    except OptionalDependencyNotAvailable:
-        pass
-    else:
-        from .modeling_vit import ViTModel
-
-else:
-    import sys
-
-    sys.modules[__name__] = _LazyModule(__name__, globals()["__file__"], _import_structure)
-"""
-
-        with tempfile.TemporaryDirectory() as tmp_dir:
-            file_name = os.path.join(tmp_dir, "../__init__.py")
-
-            self.init_file(file_name, test_init)
-            clean_frameworks_in_init(file_name, frameworks=["pt"])
-            self.check_result(file_name, init_pt_only)
-
-            self.init_file(file_name, test_init)
-            clean_frameworks_in_init(file_name, frameworks=["pt"], keep_processing=False)
-            self.check_result(file_name, init_pt_only_no_feature_extractor)
-
-    def test_duplicate_doc_file(self):
-        test_doc = """
-# GPT2
-
-## Overview
-
-Overview of the model.
-
-## GPT2Config
-
-[[autodoc]] GPT2Config
-
-## GPT2Tokenizer
-
-[[autodoc]] GPT2Tokenizer
-    - save_vocabulary
-
-## GPT2TokenizerFast
-
-[[autodoc]] GPT2TokenizerFast
-
-## GPT2 specific outputs
-
-[[autodoc]] models.gpt2.modeling_gpt2.GPT2DoubleHeadsModelOutput
-
-[[autodoc]] models.gpt2.modeling_tf_gpt2.TFGPT2DoubleHeadsModelOutput
-
-## GPT2Model
-
-[[autodoc]] GPT2Model
-    - forward
-
-## TFGPT2Model
-
-[[autodoc]] TFGPT2Model
-    - call
-
-## FlaxGPT2Model
-
-[[autodoc]] FlaxGPT2Model
-    - __call__
-
-"""
-        test_new_doc = """
-# GPT-New New
-
-## Overview
-
-The GPT-New New model was proposed in [<INSERT PAPER NAME HERE>](<INSERT PAPER LINK HERE>) by <INSERT AUTHORS HERE>.
-<INSERT SHORT SUMMARY HERE>
-
-The abstract from the paper is the following:
-
-*<INSERT PAPER ABSTRACT HERE>*
-
-Tips:
-
-<INSERT TIPS ABOUT MODEL HERE>
-
-This model was contributed by [INSERT YOUR HF USERNAME HERE](https://huggingface.co/<INSERT YOUR HF USERNAME HERE>).
-The original code can be found [here](<INSERT LINK TO GITHUB REPO HERE>).
-
-
-## GPTNewNewConfig
-
-[[autodoc]] GPTNewNewConfig
-
-## GPTNewNewTokenizer
-
-[[autodoc]] GPTNewNewTokenizer
-    - save_vocabulary
-
-## GPTNewNewTokenizerFast
-
-[[autodoc]] GPTNewNewTokenizerFast
-
-## GPTNewNew specific outputs
-
-[[autodoc]] models.gpt_new_new.modeling_gpt_new_new.GPTNewNewDoubleHeadsModelOutput
-
-[[autodoc]] models.gpt_new_new.modeling_tf_gpt_new_new.TFGPTNewNewDoubleHeadsModelOutput
-
-## GPTNewNewModel
-
-[[autodoc]] GPTNewNewModel
-    - forward
-
-## TFGPTNewNewModel
-
-[[autodoc]] TFGPTNewNewModel
-    - call
-
-## FlaxGPTNewNewModel
-
-[[autodoc]] FlaxGPTNewNewModel
-    - __call__
-
-"""
-
-        with tempfile.TemporaryDirectory() as tmp_dir:
-            doc_file = os.path.join(tmp_dir, "gpt2.md")
-            new_doc_file = os.path.join(tmp_dir, "gpt-new-new.md")
-
-            gpt2_model_patterns = ModelPatterns("GPT2", "gpt2", tokenizer_class="GPT2Tokenizer")
-            new_model_patterns = ModelPatterns(
-                "GPT-New New", "huggingface/gpt-new-new", tokenizer_class="GPTNewNewTokenizer"
+        # Check some exact file creation. For model definition, only check modular as modeling/config/etc... are created
+        # directly from it
+        EXPECTED_MODULAR = textwrap.dedent(
+            f"""
+            # coding=utf-8
+            # Copyright {CURRENT_YEAR} the HuggingFace Team. All rights reserved.
+            #
+            # Licensed under the Apache License, Version 2.0 (the "License");
+            # you may not use this file except in compliance with the License.
+            # You may obtain a copy of the License at
+            #
+            #     http://www.apache.org/licenses/LICENSE-2.0
+            #
+            # Unless required by applicable law or agreed to in writing, software
+            # distributed under the License is distributed on an "AS IS" BASIS,
+            # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+            # See the License for the specific language governing permissions and
+            # limitations under the License.
+
+            from ..llama.configuration_llama import LlamaConfig
+            from ..llama.modeling_llama import (
+                LlamaAttention,
+                LlamaDecoderLayer,
+                LlamaForCausalLM,
+                LlamaForQuestionAnswering,
+                LlamaForSequenceClassification,
+                LlamaForTokenClassification,
+                LlamaMLP,
+                LlamaModel,
+                LlamaPreTrainedModel,
+                LlamaRMSNorm,
+                LlamaRotaryEmbedding,
             )
 
-            self.init_file(doc_file, test_doc)
-            duplicate_doc_file(doc_file, gpt2_model_patterns, new_model_patterns, frameworks=["pt", "tf", "flax"])
-            self.check_result(new_doc_file, test_new_doc)
 
-            test_new_doc_pt_only = test_new_doc.replace(
-                """
-## TFGPTNewNewModel
+            class MyTestConfig(LlamaConfig):
+                pass
 
-[[autodoc]] TFGPTNewNewModel
-    - call
 
-## FlaxGPTNewNewModel
+            class MyTestRMSNorm(LlamaRMSNorm):
+                pass
 
-[[autodoc]] FlaxGPTNewNewModel
-    - __call__
 
-""",
-                "",
+            class MyTestRotaryEmbedding(LlamaRotaryEmbedding):
+                pass
+
+
+            class MyTestMLP(LlamaMLP):
+                pass
+
+
+            class MyTestAttention(LlamaAttention):
+                pass
+
+
+            class MyTestDecoderLayer(LlamaDecoderLayer):
+                pass
+
+
+            class MyTestPreTrainedModel(LlamaPreTrainedModel):
+                pass
+
+
+            class MyTestModel(LlamaModel):
+                pass
+
+
+            class MyTestForCausalLM(LlamaForCausalLM):
+                pass
+
+
+            class MyTestForSequenceClassification(LlamaForSequenceClassification):
+                pass
+
+
+            class MyTestForQuestionAnswering(LlamaForQuestionAnswering):
+                pass
+
+
+            class MyTestForTokenClassification(LlamaForTokenClassification):
+                pass
+
+
+            __all__ = [
+                "MyTestConfig",
+                "MyTestForCausalLM",
+                "MyTestModel",
+                "MyTestPreTrainedModel",
+                "MyTestForSequenceClassification",
+                "MyTestForQuestionAnswering",
+                "MyTestForTokenClassification",
+            ]
+            """
+        )
+        self.assertFileIsEqual(EXPECTED_MODULAR, os.path.join(model_repo, "modular_my_test.py"))
+
+        EXPECTED_INIT = textwrap.dedent(
+            f"""
+            # coding=utf-8
+            # Copyright {CURRENT_YEAR} the HuggingFace Team. All rights reserved.
+            #
+            # Licensed under the Apache License, Version 2.0 (the "License");
+            # you may not use this file except in compliance with the License.
+            # You may obtain a copy of the License at
+            #
+            #     http://www.apache.org/licenses/LICENSE-2.0
+            #
+            # Unless required by applicable law or agreed to in writing, software
+            # distributed under the License is distributed on an "AS IS" BASIS,
+            # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+            # See the License for the specific language governing permissions and
+            # limitations under the License.
+
+            from typing import TYPE_CHECKING
+
+            from ...utils import _LazyModule
+            from ...utils.import_utils import define_import_structure
+
+
+            if TYPE_CHECKING:
+                from .configuration_my_test import *
+                from .modeling_my_test import *
+            else:
+                import sys
+
+                _file = globals()["__file__"]
+                sys.modules[__name__] = _LazyModule(__name__, _file, define_import_structure(_file), module_spec=__spec__)
+
+            """
+        )
+        self.assertFileIsEqual(EXPECTED_INIT, os.path.join(model_repo, "__init__.py"))
+
+        EXPECTED_DOC = textwrap.dedent(
+            f"""
+            <!--Copyright {CURRENT_YEAR} the HuggingFace Team. All rights reserved.
+
+            Licensed under the Apache License, Version 2.0 (the "License");
+            you may not use this file except in compliance with the License.
+            You may obtain a copy of the License at
+
+                http://www.apache.org/licenses/LICENSE-2.0
+
+            Unless required by applicable law or agreed to in writing, software
+            distributed under the License is distributed on an "AS IS" BASIS,
+            WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+            See the License for the specific language governing permissions and
+            limitations under the License.
+
+
+            ⚠️ Note that this file is in Markdown but contain specific syntax for our doc-builder (similar to MDX) that may not be rendered properly in your Markdown viewer.
+
+            -->
+
+
+            # MyTest
+
+            ## Overview
+
+            The MyTest model was proposed in [<INSERT PAPER NAME HERE>](<INSERT PAPER LINK HERE>) by <INSERT AUTHORS HERE>.
+            <INSERT SHORT SUMMARY HERE>
+
+            The abstract from the paper is the following:
+
+            <INSERT PAPER ABSTRACT HERE>
+
+            Tips:
+
+            <INSERT TIPS ABOUT MODEL HERE>
+
+            This model was contributed by [INSERT YOUR HF USERNAME HERE](https://huggingface.co/<INSERT YOUR HF USERNAME HERE>).
+            The original code can be found [here](<INSERT LINK TO GITHUB REPO HERE>).
+
+            ## Usage examples
+
+            <INSERT SOME NICE EXAMPLES HERE>
+
+            ## MyTestConfig
+
+            [[autodoc]] MyTestConfig
+
+            ## MyTestForCausalLM
+
+            [[autodoc]] MyTestForCausalLM
+
+            ## MyTestModel
+
+            [[autodoc]] MyTestModel
+                - forward
+
+            ## MyTestPreTrainedModel
+
+            [[autodoc]] MyTestPreTrainedModel
+                - forward
+
+            ## MyTestForSequenceClassification
+
+            [[autodoc]] MyTestForSequenceClassification
+
+            ## MyTestForQuestionAnswering
+
+            [[autodoc]] MyTestForQuestionAnswering
+
+            ## MyTestForTokenClassification
+
+            [[autodoc]] MyTestForTokenClassification
+            """
+        )
+        self.assertFileIsEqual(EXPECTED_DOC, os.path.join(self.DOC_PATH, "model_doc", "my_test.md"))
+
+    def test_phi4_with_all_processors(self):
+        # This is the structure without adding the tokenizers
+        filenames_to_add = (
+            ("configuration_phi4_multimodal.py", True),
+            ("modeling_phi4_multimodal.py", True),
+            ("tokenization_phi4_multimodal.py", False),
+            ("tokenization_phi4_multimodal_fast.py", False),
+            ("image_processing_phi4_multimodal.py", False),
+            ("image_processing_phi4_multimodal_fast.py", True),
+            ("video_processing_phi4_multimodal.py", False),
+            ("feature_extraction_phi4_multimodal.py", True),
+            ("processing_phi4_multimodal.py", True),
+        )
+        # Run the command
+        create_new_model_like(
+            old_model_infos=ModelInfos("phi4_multimodal"),
+            new_lowercase_name="my_test2",
+            new_model_paper_name="MyTest2",
+            filenames_to_add=filenames_to_add,
+            create_fast_image_processor=False,
+        )
+
+        # First assert that all files were created correctly
+        model_repo = os.path.join(self.MODEL_PATH, "my_test2")
+        tests_repo = os.path.join(self.TESTS_MODEL_PATH, "my_test2")
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "modular_my_test2.py")))
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "modeling_my_test2.py")))
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "configuration_my_test2.py")))
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "image_processing_my_test2_fast.py")))
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "feature_extraction_my_test2.py")))
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "processing_my_test2.py")))
+        self.assertTrue(os.path.isfile(os.path.join(model_repo, "__init__.py")))
+        self.assertTrue(os.path.isfile(os.path.join(self.DOC_PATH, "model_doc", "my_test2.md")))
+        self.assertTrue(os.path.isfile(os.path.join(tests_repo, "__init__.py")))
+        self.assertTrue(os.path.isfile(os.path.join(tests_repo, "test_modeling_my_test2.py")))
+        self.assertTrue(os.path.isfile(os.path.join(tests_repo, "test_feature_extraction_my_test2.py")))
+        self.assertTrue(os.path.isfile(os.path.join(tests_repo, "test_image_processing_my_test2.py")))
+
+        # Now assert the correct imports/auto mappings/toctree were added
+        self.assertInFile(
+            "from .my_test2 import *\n",
+            os.path.join(self.MODEL_PATH, "__init__.py"),
+        )
+        self.assertInFile(
+            '("my_test2", "MyTest2Config"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "configuration_auto.py"),
+        )
+        self.assertInFile(
+            '("my_test2", "MyTest2"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "configuration_auto.py"),
+        )
+        self.assertInFile(
+            '("my_test2", "MyTest2Model"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "modeling_auto.py"),
+        )
+        self.assertInFile(
+            '("my_test2", "MyTest2ForCausalLM"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "modeling_auto.py"),
+        )
+        self.assertInFile(
+            '("my_test2", (None, "MyTest2ImageProcessorFast")),\n',
+            os.path.join(self.MODEL_PATH, "auto", "image_processing_auto.py"),
+        )
+        self.assertInFile(
+            '("my_test2", "MyTest2FeatureExtractor"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "feature_extraction_auto.py"),
+        )
+        self.assertInFile(
+            '("my_test2", "MyTest2Processor"),\n',
+            os.path.join(self.MODEL_PATH, "auto", "processing_auto.py"),
+        )
+        self.assertInFile(
+            "- local: model_doc/my_test2\n        title: MyTest2\n",
+            os.path.join(self.DOC_PATH, "_toctree.yml"),
+        )
+
+        # Check some exact file creation. For model definition, only check modular as modeling/config/etc... are created
+        # directly from it
+        EXPECTED_MODULAR = textwrap.dedent(
+            f"""
+            # coding=utf-8
+            # Copyright {CURRENT_YEAR} the HuggingFace Team. All rights reserved.
+            #
+            # Licensed under the Apache License, Version 2.0 (the "License");
+            # you may not use this file except in compliance with the License.
+            # You may obtain a copy of the License at
+            #
+            #     http://www.apache.org/licenses/LICENSE-2.0
+            #
+            # Unless required by applicable law or agreed to in writing, software
+            # distributed under the License is distributed on an "AS IS" BASIS,
+            # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+            # See the License for the specific language governing permissions and
+            # limitations under the License.
+
+            from ..phi4_multimodal.configuration_phi4_multimodal import (
+                Phi4MultimodalAudioConfig,
+                Phi4MultimodalConfig,
+                Phi4MultimodalVisionConfig,
             )
-            self.init_file(doc_file, test_doc)
-            duplicate_doc_file(doc_file, gpt2_model_patterns, new_model_patterns, frameworks=["pt"])
-            self.check_result(new_doc_file, test_new_doc_pt_only)
-
-            test_new_doc_no_tok = test_new_doc.replace(
-                """
-## GPTNewNewTokenizer
-
-[[autodoc]] GPTNewNewTokenizer
-    - save_vocabulary
-
-## GPTNewNewTokenizerFast
-
-[[autodoc]] GPTNewNewTokenizerFast
-""",
-                "",
+            from ..phi4_multimodal.feature_extraction_phi4_multimodal import Phi4MultimodalFeatureExtractor
+            from ..phi4_multimodal.image_processing_phi4_multimodal_fast import (
+                Phi4MultimodalFastImageProcessorKwargs,
+                Phi4MultimodalImageProcessorFast,
             )
-            new_model_patterns = ModelPatterns(
-                "GPT-New New", "huggingface/gpt-new-new", tokenizer_class="GPT2Tokenizer"
+            from ..phi4_multimodal.modeling_phi4_multimodal import (
+                Phi4MultimodalAttention,
+                Phi4MultimodalAudioAttention,
+                Phi4MultimodalAudioConformerEncoderLayer,
+                Phi4MultimodalAudioConvModule,
+                Phi4MultimodalAudioDepthWiseSeperableConv1d,
+                Phi4MultimodalAudioEmbedding,
+                Phi4MultimodalAudioGluPointWiseConv,
+                Phi4MultimodalAudioMeanVarianceNormLayer,
+                Phi4MultimodalAudioMLP,
+                Phi4MultimodalAudioModel,
+                Phi4MultimodalAudioNemoConvSubsampling,
+                Phi4MultimodalAudioPreTrainedModel,
+                Phi4MultimodalAudioRelativeAttentionBias,
+                Phi4MultimodalDecoderLayer,
+                Phi4MultimodalFeatureEmbedding,
+                Phi4MultimodalForCausalLM,
+                Phi4MultimodalImageEmbedding,
+                Phi4MultimodalMLP,
+                Phi4MultimodalModel,
+                Phi4MultimodalPreTrainedModel,
+                Phi4MultimodalRMSNorm,
+                Phi4MultimodalRotaryEmbedding,
+                Phi4MultimodalVisionAttention,
+                Phi4MultimodalVisionEmbeddings,
+                Phi4MultimodalVisionEncoder,
+                Phi4MultimodalVisionEncoderLayer,
+                Phi4MultimodalVisionMLP,
+                Phi4MultimodalVisionModel,
+                Phi4MultimodalVisionMultiheadAttentionPoolingHead,
+                Phi4MultimodalVisionPreTrainedModel,
             )
-            self.init_file(doc_file, test_doc)
-            duplicate_doc_file(doc_file, gpt2_model_patterns, new_model_patterns, frameworks=["pt", "tf", "flax"])
-            print(test_new_doc_no_tok)
-            self.check_result(new_doc_file, test_new_doc_no_tok)
+            from ..phi4_multimodal.processing_phi4_multimodal import Phi4MultimodalProcessor, Phi4MultimodalProcessorKwargs
 
-            test_new_doc_pt_only_no_tok = test_new_doc_no_tok.replace(
-                """
-## TFGPTNewNewModel
 
-[[autodoc]] TFGPTNewNewModel
-    - call
+            class MyTest2VisionConfig(Phi4MultimodalVisionConfig):
+                pass
 
-## FlaxGPTNewNewModel
 
-[[autodoc]] FlaxGPTNewNewModel
-    - __call__
+            class MyTest2AudioConfig(Phi4MultimodalAudioConfig):
+                pass
 
-""",
-                "",
-            )
-            self.init_file(doc_file, test_doc)
-            duplicate_doc_file(doc_file, gpt2_model_patterns, new_model_patterns, frameworks=["pt"])
-            self.check_result(new_doc_file, test_new_doc_pt_only_no_tok)
+
+            class MyTest2Config(Phi4MultimodalConfig):
+                pass
+
+
+            class MyTest2VisionMLP(Phi4MultimodalVisionMLP):
+                pass
+
+
+            class MyTest2VisionAttention(Phi4MultimodalVisionAttention):
+                pass
+
+
+            class MyTest2VisionEncoderLayer(Phi4MultimodalVisionEncoderLayer):
+                pass
+
+
+            class MyTest2VisionEncoder(Phi4MultimodalVisionEncoder):
+                pass
+
+
+            class MyTest2VisionPreTrainedModel(Phi4MultimodalVisionPreTrainedModel):
+                pass
+
+
+            class MyTest2VisionEmbeddings(Phi4MultimodalVisionEmbeddings):
+                pass
+
+
+            class MyTest2VisionMultiheadAttentionPoolingHead(Phi4MultimodalVisionMultiheadAttentionPoolingHead):
+                pass
+
+
+            class MyTest2VisionModel(Phi4MultimodalVisionModel):
+                pass
+
+
+            class MyTest2ImageEmbedding(Phi4MultimodalImageEmbedding):
+                pass
+
+
+            class MyTest2AudioMLP(Phi4MultimodalAudioMLP):
+                pass
+
+
+            class MyTest2AudioAttention(Phi4MultimodalAudioAttention):
+                pass
+
+
+            class MyTest2AudioDepthWiseSeperableConv1d(Phi4MultimodalAudioDepthWiseSeperableConv1d):
+                pass
+
+
+            class MyTest2AudioGluPointWiseConv(Phi4MultimodalAudioGluPointWiseConv):
+                pass
+
+
+            class MyTest2AudioConvModule(Phi4MultimodalAudioConvModule):
+                pass
+
+
+            class MyTest2AudioConformerEncoderLayer(Phi4MultimodalAudioConformerEncoderLayer):
+                pass
+
+
+            class MyTest2AudioNemoConvSubsampling(Phi4MultimodalAudioNemoConvSubsampling):
+                pass
+
+
+            class MyTest2AudioRelativeAttentionBias(Phi4MultimodalAudioRelativeAttentionBias):
+                pass
+
+
+            class MyTest2AudioMeanVarianceNormLayer(Phi4MultimodalAudioMeanVarianceNormLayer):
+                pass
+
+
+            class MyTest2AudioPreTrainedModel(Phi4MultimodalAudioPreTrainedModel):
+                pass
+
+
+            class MyTest2AudioModel(Phi4MultimodalAudioModel):
+                pass
+
+
+            class MyTest2AudioEmbedding(Phi4MultimodalAudioEmbedding):
+                pass
+
+
+            class MyTest2RMSNorm(Phi4MultimodalRMSNorm):
+                pass
+
+
+            class MyTest2MLP(Phi4MultimodalMLP):
+                pass
+
+
+            class MyTest2Attention(Phi4MultimodalAttention):
+                pass
+
+
+            class MyTest2DecoderLayer(Phi4MultimodalDecoderLayer):
+                pass
+
+
+            class MyTest2FeatureEmbedding(Phi4MultimodalFeatureEmbedding):
+                pass
+
+
+            class MyTest2RotaryEmbedding(Phi4MultimodalRotaryEmbedding):
+                pass
+
+
+            class MyTest2PreTrainedModel(Phi4MultimodalPreTrainedModel):
+                pass
+
+
+            class MyTest2Model(Phi4MultimodalModel):
+                pass
+
+
+            class MyTest2ForCausalLM(Phi4MultimodalForCausalLM):
+                pass
+
+
+            class MyTest2FastImageProcessorKwargs(Phi4MultimodalFastImageProcessorKwargs):
+                pass
+
+
+            class MyTest2ImageProcessorFast(Phi4MultimodalImageProcessorFast):
+                pass
+
+
+            class MyTest2FeatureExtractor(Phi4MultimodalFeatureExtractor):
+                pass
+
+
+            class MyTest2ProcessorKwargs(Phi4MultimodalProcessorKwargs):
+                pass
+
+
+            class MyTest2Processor(Phi4MultimodalProcessor):
+                pass
+
+
+            __all__ = [
+                "MyTest2VisionConfig",
+                "MyTest2AudioConfig",
+                "MyTest2Config",
+                "MyTest2AudioPreTrainedModel",
+                "MyTest2AudioModel",
+                "MyTest2VisionPreTrainedModel",
+                "MyTest2VisionModel",
+                "MyTest2PreTrainedModel",
+                "MyTest2Model",
+                "MyTest2ForCausalLM",
+                "MyTest2ImageProcessorFast",
+                "MyTest2FeatureExtractor",
+                "MyTest2Processor",
+            ]
+            """
+        )
+        self.assertFileIsEqual(EXPECTED_MODULAR, os.path.join(model_repo, "modular_my_test2.py"))
+
+        EXPECTED_INIT = textwrap.dedent(
+            f"""
+            # coding=utf-8
+            # Copyright {CURRENT_YEAR} the HuggingFace Team. All rights reserved.
+            #
+            # Licensed under the Apache License, Version 2.0 (the "License");
+            # you may not use this file except in compliance with the License.
+            # You may obtain a copy of the License at
+            #
+            #     http://www.apache.org/licenses/LICENSE-2.0
+            #
+            # Unless required by applicable law or agreed to in writing, software
+            # distributed under the License is distributed on an "AS IS" BASIS,
+            # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+            # See the License for the specific language governing permissions and
+            # limitations under the License.
+
+            from typing import TYPE_CHECKING
+
+            from ...utils import _LazyModule
+            from ...utils.import_utils import define_import_structure
+
+
+            if TYPE_CHECKING:
+                from .configuration_my_test2 import *
+                from .feature_extraction_my_test2 import *
+                from .image_processing_my_test2_fast import *
+                from .modeling_my_test2 import *
+                from .processing_my_test2 import *
+            else:
+                import sys
+
+                _file = globals()["__file__"]
+                sys.modules[__name__] = _LazyModule(__name__, _file, define_import_structure(_file), module_spec=__spec__)
+            """
+        )
+        self.assertFileIsEqual(EXPECTED_INIT, os.path.join(model_repo, "__init__.py"))
+
+        EXPECTED_DOC = textwrap.dedent(
+            f"""
+            <!--Copyright {CURRENT_YEAR} the HuggingFace Team. All rights reserved.
+
+            Licensed under the Apache License, Version 2.0 (the "License");
+            you may not use this file except in compliance with the License.
+            You may obtain a copy of the License at
+
+                http://www.apache.org/licenses/LICENSE-2.0
+
+            Unless required by applicable law or agreed to in writing, software
+            distributed under the License is distributed on an "AS IS" BASIS,
+            WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+            See the License for the specific language governing permissions and
+            limitations under the License.
+
+
+            ⚠️ Note that this file is in Markdown but contain specific syntax for our doc-builder (similar to MDX) that may not be rendered properly in your Markdown viewer.
+
+            -->
+
+
+            # MyTest2
+
+            ## Overview
+
+            The MyTest2 model was proposed in [<INSERT PAPER NAME HERE>](<INSERT PAPER LINK HERE>) by <INSERT AUTHORS HERE>.
+            <INSERT SHORT SUMMARY HERE>
+
+            The abstract from the paper is the following:
+
+            <INSERT PAPER ABSTRACT HERE>
+
+            Tips:
+
+            <INSERT TIPS ABOUT MODEL HERE>
+
+            This model was contributed by [INSERT YOUR HF USERNAME HERE](https://huggingface.co/<INSERT YOUR HF USERNAME HERE>).
+            The original code can be found [here](<INSERT LINK TO GITHUB REPO HERE>).
+
+            ## Usage examples
+
+            <INSERT SOME NICE EXAMPLES HERE>
+
+            ## MyTest2VisionConfig
+
+            [[autodoc]] MyTest2VisionConfig
+
+            ## MyTest2AudioConfig
+
+            [[autodoc]] MyTest2AudioConfig
+
+            ## MyTest2Config
+
+            [[autodoc]] MyTest2Config
+
+            ## MyTest2AudioPreTrainedModel
+
+            [[autodoc]] MyTest2AudioPreTrainedModel
+                - forward
+
+            ## MyTest2AudioModel
+
+            [[autodoc]] MyTest2AudioModel
+                - forward
+
+            ## MyTest2VisionPreTrainedModel
+
+            [[autodoc]] MyTest2VisionPreTrainedModel
+                - forward
+
+            ## MyTest2VisionModel
+
+            [[autodoc]] MyTest2VisionModel
+                - forward
+
+            ## MyTest2PreTrainedModel
+
+            [[autodoc]] MyTest2PreTrainedModel
+                - forward
+
+            ## MyTest2Model
+
+            [[autodoc]] MyTest2Model
+                - forward
+
+            ## MyTest2ForCausalLM
+
+            [[autodoc]] MyTest2ForCausalLM
+
+            ## MyTest2ImageProcessorFast
+
+            [[autodoc]] MyTest2ImageProcessorFast
+
+            ## MyTest2FeatureExtractor
+
+            [[autodoc]] MyTest2FeatureExtractor
+
+            ## MyTest2Processor
+
+            [[autodoc]] MyTest2Processor
+            """
+        )
+        self.assertFileIsEqual(EXPECTED_DOC, os.path.join(self.DOC_PATH, "model_doc", "my_test2.md"))
diff --git a/utils/modular_model_converter.py b/utils/modular_model_converter.py
index ade3589868..fd553cc3b9 100644
--- a/utils/modular_model_converter.py
+++ b/utils/modular_model_converter.py
@@ -17,12 +17,12 @@ import glob
 import importlib
 import os
 import re
+import subprocess
 from abc import ABC, abstractmethod
 from collections import Counter, defaultdict, deque
 from typing import Optional, Union
 
 import libcst as cst
-from check_copies import run_ruff
 from create_dependency_mapping import find_priority_list
 from libcst import ClassDef, CSTVisitor
 from libcst import matchers as m
@@ -1676,6 +1676,16 @@ def create_modules(modular_mapper: ModularFileMapper) -> dict[str, cst.Module]:
     return files
 
 
+def run_ruff(code, check=False):
+    """Pipe `code` through ruff on stdin (`check --fix` if `check`, else `format`) and return ruff's stdout."""
+    if check:
+        ruff_args = ["ruff", "check", "-", "--fix", "--exit-zero"]
+    else:
+        ruff_args = ["ruff", "format", "-", "--config", "pyproject.toml", "--silent"]
+    completed = subprocess.run(ruff_args, input=code.encode(), stdout=subprocess.PIPE, stderr=subprocess.PIPE)
+    return completed.stdout.decode()
+
+
 def convert_modular_file(modular_file):
     pattern = re.search(r"modular_(.*)(?=\.py$)", modular_file)
     output = {}