Update all references to canonical models (#29001)

* Script & Manual edition
* Update
2024-02-16 08:16:58 +01:00
parent 1e402b957d
commit f497f564bb
561 changed files with 2682 additions and 2687 deletions
--- a/tests/trainer/test_trainer.py
+++ b/tests/trainer/test_trainer.py
@@ -1537,7 +1537,7 @@ class TrainerIntegrationTest(TestCasePlus, TrainerIntegrationCommon):
        with tempfile.TemporaryDirectory() as tmpdir:
            testargs = f"""
                run_glue.py
-                --model_name_or_path distilbert-base-uncased
+                --model_name_or_path distilbert/distilbert-base-uncased
                --task_name mrpc
                --do_train
                --do_eval
@@ -1886,7 +1886,7 @@ class TrainerIntegrationTest(TestCasePlus, TrainerIntegrationCommon):

    @slow
    def test_trainer_eval_mrpc(self):
-        MODEL_ID = "bert-base-cased-finetuned-mrpc"
+        MODEL_ID = "google-bert/bert-base-cased-finetuned-mrpc"
        tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
        model = AutoModelForSequenceClassification.from_pretrained(MODEL_ID)
        data_args = GlueDataTrainingArguments(
@@ -1901,7 +1901,7 @@ class TrainerIntegrationTest(TestCasePlus, TrainerIntegrationCommon):

    @slow
    def test_trainer_eval_multiple(self):
-        MODEL_ID = "gpt2"
+        MODEL_ID = "openai-community/gpt2"
        tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
        model = AutoModelForCausalLM.from_pretrained(MODEL_ID)
        dataset = LineByLineTextDataset(
@@ -1930,7 +1930,7 @@ class TrainerIntegrationTest(TestCasePlus, TrainerIntegrationCommon):

    @slow
    def test_trainer_eval_lm(self):
-        MODEL_ID = "distilroberta-base"
+        MODEL_ID = "distilbert/distilroberta-base"
        tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
        dataset = LineByLineTextDataset(
            tokenizer=tokenizer,
@@ -2384,7 +2384,7 @@ class TrainerIntegrationTest(TestCasePlus, TrainerIntegrationCommon):
                "launch",
                script_path,
                "--model_name_or_path",
-                "t5-small",
+                "google-t5/t5-small",
                "--per_device_train_batch_size",
                "1",
                "--output_dir",