From 2b574e7c60dfdd12eb1d54709b326672d798eb08 Mon Sep 17 00:00:00 2001 From: Sam Shleifer Date: Tue, 6 Oct 2020 11:33:51 -0400 Subject: [PATCH] [bart] fix config.classif_dropout (#7593) --- notebooks/05-benchmark.ipynb | 2 +- src/transformers/configuration_bart.py | 2 +- src/transformers/modeling_bart.py | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/notebooks/05-benchmark.ipynb b/notebooks/05-benchmark.ipynb index 455b80b8c3..d6d7d5743b 100644 --- a/notebooks/05-benchmark.ipynb +++ b/notebooks/05-benchmark.ipynb @@ -1658,7 +1658,7 @@ " 'add_final_layer_norm': False,\n", " 'attention_dropout': 0.0,\n", " 'bos_token_id': 0,\n", - " 'classif_dropout': 0.0,\n", + " 'classifier_dropout': 0.0,\n", " 'd_model': 1024,\n", " 'decoder_attention_heads': 16,\n", " 'decoder_ffn_dim': 4096,\n", diff --git a/src/transformers/configuration_bart.py b/src/transformers/configuration_bart.py index cd58d24a62..684df61562 100644 --- a/src/transformers/configuration_bart.py +++ b/src/transformers/configuration_bart.py @@ -195,7 +195,7 @@ class BartConfig(PretrainedConfig): self.dropout = dropout # Classifier stuff - self.classif_dropout = classifier_dropout + self.classifier_dropout = classifier_dropout # pos embedding offset self.extra_pos_embeddings = self.pad_token_id + 1 diff --git a/src/transformers/modeling_bart.py b/src/transformers/modeling_bart.py index 10bcf6d3cc..6d5b56199f 100644 --- a/src/transformers/modeling_bart.py +++ b/src/transformers/modeling_bart.py @@ -1176,7 +1176,7 @@ class BartForSequenceClassification(PretrainedBartModel): config.d_model, config.d_model, config.num_labels, - config.classif_dropout, + config.classifier_dropout, ) self.model._init_weights(self.classification_head.dense) self.model._init_weights(self.classification_head.out_proj)