From 32eb29fef9e73a0ade63dcc86c1fceb0bba68a5b Mon Sep 17 00:00:00 2001 From: Yih-Dar <2521628+ydshieh@users.noreply.github.com> Date: Mon, 13 Dec 2021 12:50:02 +0100 Subject: [PATCH] Fix doc examples: modify config before super().__init__ (#14697) Co-authored-by: ydshieh --- src/transformers/models/bart/modeling_bart.py | 2 +- .../models/bigbird_pegasus/modeling_bigbird_pegasus.py | 2 +- src/transformers/models/blenderbot/modeling_blenderbot.py | 2 +- .../models/blenderbot_small/modeling_blenderbot_small.py | 2 +- src/transformers/models/marian/modeling_marian.py | 2 +- src/transformers/models/mbart/modeling_mbart.py | 2 +- src/transformers/models/pegasus/modeling_pegasus.py | 2 +- .../models/speech_to_text_2/modeling_speech_to_text_2.py | 2 +- src/transformers/models/trocr/modeling_trocr.py | 2 +- .../modeling_{{cookiecutter.lowercase_modelname}}.py | 2 +- 10 files changed, 10 insertions(+), 10 deletions(-) diff --git a/src/transformers/models/bart/modeling_bart.py b/src/transformers/models/bart/modeling_bart.py index ef019ebebb..81fa8a354e 100755 --- a/src/transformers/models/bart/modeling_bart.py +++ b/src/transformers/models/bart/modeling_bart.py @@ -1662,10 +1662,10 @@ class BartDecoderWrapper(BartPretrainedModel): class BartForCausalLM(BartPretrainedModel): def __init__(self, config): - super().__init__(config) config = copy.deepcopy(config) config.is_decoder = True config.is_encoder_decoder = False + super().__init__(config) self.model = BartDecoderWrapper(config) self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False) diff --git a/src/transformers/models/bigbird_pegasus/modeling_bigbird_pegasus.py b/src/transformers/models/bigbird_pegasus/modeling_bigbird_pegasus.py index 71a8d70d1a..96c7bcf300 100755 --- a/src/transformers/models/bigbird_pegasus/modeling_bigbird_pegasus.py +++ b/src/transformers/models/bigbird_pegasus/modeling_bigbird_pegasus.py @@ -2865,10 +2865,10 @@ class BigBirdPegasusDecoderWrapper(BigBirdPegasusPreTrainedModel): # Copied from transformers.models.bart.modeling_bart.BartForCausalLM with Bart->BigBirdPegasus, 'facebook/bart-large'->"google/bigbird-pegasus-large-arxiv" class BigBirdPegasusForCausalLM(BigBirdPegasusPreTrainedModel): def __init__(self, config): - super().__init__(config) config = copy.deepcopy(config) config.is_decoder = True config.is_encoder_decoder = False + super().__init__(config) self.model = BigBirdPegasusDecoderWrapper(config) self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False) diff --git a/src/transformers/models/blenderbot/modeling_blenderbot.py b/src/transformers/models/blenderbot/modeling_blenderbot.py index 574fc67b79..208d997f2b 100755 --- a/src/transformers/models/blenderbot/modeling_blenderbot.py +++ b/src/transformers/models/blenderbot/modeling_blenderbot.py @@ -1400,10 +1400,10 @@ class BlenderbotDecoderWrapper(BlenderbotPreTrainedModel): # Copied from transformers.models.bart.modeling_bart.BartForCausalLM with Bart->Blenderbot class BlenderbotForCausalLM(BlenderbotPreTrainedModel): def __init__(self, config): - super().__init__(config) config = copy.deepcopy(config) config.is_decoder = True config.is_encoder_decoder = False + super().__init__(config) self.model = BlenderbotDecoderWrapper(config) self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False) diff --git a/src/transformers/models/blenderbot_small/modeling_blenderbot_small.py b/src/transformers/models/blenderbot_small/modeling_blenderbot_small.py index b0e6bec192..541b955914 100755 --- a/src/transformers/models/blenderbot_small/modeling_blenderbot_small.py +++ b/src/transformers/models/blenderbot_small/modeling_blenderbot_small.py @@ -1374,10 +1374,10 @@ class BlenderbotSmallDecoderWrapper(BlenderbotSmallPreTrainedModel): # Copied from transformers.models.bart.modeling_bart.BartForCausalLM with Bart->BlenderbotSmall class BlenderbotSmallForCausalLM(BlenderbotSmallPreTrainedModel): def __init__(self, config): - super().__init__(config) config = copy.deepcopy(config) config.is_decoder = True config.is_encoder_decoder = False + super().__init__(config) self.model = BlenderbotSmallDecoderWrapper(config) self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False) diff --git a/src/transformers/models/marian/modeling_marian.py b/src/transformers/models/marian/modeling_marian.py index dc839b8983..9827f4caee 100755 --- a/src/transformers/models/marian/modeling_marian.py +++ b/src/transformers/models/marian/modeling_marian.py @@ -1397,10 +1397,10 @@ class MarianDecoderWrapper(MarianPreTrainedModel): # Copied from transformers.models.bart.modeling_bart.BartForCausalLM with Bart->Marian class MarianForCausalLM(MarianPreTrainedModel): def __init__(self, config): - super().__init__(config) config = copy.deepcopy(config) config.is_decoder = True config.is_encoder_decoder = False + super().__init__(config) self.model = MarianDecoderWrapper(config) self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False) diff --git a/src/transformers/models/mbart/modeling_mbart.py b/src/transformers/models/mbart/modeling_mbart.py index ecea4674e0..3cd5ba3ddc 100755 --- a/src/transformers/models/mbart/modeling_mbart.py +++ b/src/transformers/models/mbart/modeling_mbart.py @@ -1665,10 +1665,10 @@ class MBartDecoderWrapper(MBartPreTrainedModel): # Copied from transformers.models.bart.modeling_bart.BartForCausalLM with Bart->MBart class MBartForCausalLM(MBartPreTrainedModel): def __init__(self, config): - super().__init__(config) config = copy.deepcopy(config) config.is_decoder = True config.is_encoder_decoder = False + super().__init__(config) self.model = MBartDecoderWrapper(config) self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False) diff --git a/src/transformers/models/pegasus/modeling_pegasus.py b/src/transformers/models/pegasus/modeling_pegasus.py index ff2d4f10b6..e898826950 100755 --- a/src/transformers/models/pegasus/modeling_pegasus.py +++ b/src/transformers/models/pegasus/modeling_pegasus.py @@ -1486,10 +1486,10 @@ class PegasusDecoderWrapper(PegasusPreTrainedModel): class PegasusForCausalLM(PegasusPreTrainedModel): def __init__(self, config): - super().__init__(config) config = copy.deepcopy(config) config.is_decoder = True config.is_encoder_decoder = False + super().__init__(config) self.model = PegasusDecoderWrapper(config) self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False) diff --git a/src/transformers/models/speech_to_text_2/modeling_speech_to_text_2.py b/src/transformers/models/speech_to_text_2/modeling_speech_to_text_2.py index a6b4e5b542..4aee66b534 100755 --- a/src/transformers/models/speech_to_text_2/modeling_speech_to_text_2.py +++ b/src/transformers/models/speech_to_text_2/modeling_speech_to_text_2.py @@ -744,10 +744,10 @@ class Speech2Text2DecoderWrapper(Speech2Text2PreTrainedModel): ) class Speech2Text2ForCausalLM(Speech2Text2PreTrainedModel): def __init__(self, config): - super().__init__(config) config = copy.deepcopy(config) config.is_decoder = True config.is_encoder_decoder = False + super().__init__(config) self.model = Speech2Text2DecoderWrapper(config) self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False) diff --git a/src/transformers/models/trocr/modeling_trocr.py b/src/transformers/models/trocr/modeling_trocr.py index 5b8943a26a..5cc566b2cb 100644 --- a/src/transformers/models/trocr/modeling_trocr.py +++ b/src/transformers/models/trocr/modeling_trocr.py @@ -777,10 +777,10 @@ class TrOCRDecoderWrapper(TrOCRPreTrainedModel): ) class TrOCRForCausalLM(TrOCRPreTrainedModel): def __init__(self, config): - super().__init__(config) config = copy.deepcopy(config) config.is_decoder = True config.is_encoder_decoder = False + super().__init__(config) self.model = TrOCRDecoderWrapper(config) self.output_projection = nn.Linear(config.hidden_size, config.vocab_size, bias=False) diff --git a/templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/modeling_{{cookiecutter.lowercase_modelname}}.py b/templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/modeling_{{cookiecutter.lowercase_modelname}}.py index a866859285..38320ee1b6 100755 --- a/templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/modeling_{{cookiecutter.lowercase_modelname}}.py +++ b/templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/modeling_{{cookiecutter.lowercase_modelname}}.py @@ -3173,10 +3173,10 @@ class {{cookiecutter.camelcase_modelname}}DecoderWrapper({{cookiecutter.camelcas # Copied from transformers.models.bart.modeling_bart.BartForCausalLM with Bart->{{cookiecutter.camelcase_modelname}} class {{cookiecutter.camelcase_modelname}}ForCausalLM({{cookiecutter.camelcase_modelname}}PreTrainedModel): def __init__(self, config): - super().__init__(config) config = copy.deepcopy(config) config.is_decoder = True config.is_encoder_decoder = False + super().__init__(config) self.model = {{cookiecutter.camelcase_modelname}}DecoderWrapper(config) self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False)