consistent ignore keys + make private (#8737)
* consistent ignore keys + make private
* style
* - authorized_missing_keys => _keys_to_ignore_on_load_missing
  - authorized_unexpected_keys => _keys_to_ignore_on_load_unexpected
* move public doc of private attributes to private comment
This commit is contained in:
@@ -576,7 +576,7 @@ class RobertaModel(RobertaPreTrainedModel):
|
||||
|
||||
"""
|
||||
|
||||
authorized_missing_keys = [r"position_ids"]
|
||||
_keys_to_ignore_on_load_missing = [r"position_ids"]
|
||||
|
||||
# Copied from transformers.models.bert.modeling_bert.BertModel.__init__ with Bert->Roberta
|
||||
def __init__(self, config, add_pooling_layer=True):
|
||||
@@ -711,8 +711,8 @@ class RobertaModel(RobertaPreTrainedModel):
|
||||
"""RoBERTa Model with a `language modeling` head on top for CLM fine-tuning. """, ROBERTA_START_DOCSTRING
|
||||
)
|
||||
class RobertaForCausalLM(RobertaPreTrainedModel):
|
||||
authorized_missing_keys = [r"position_ids", r"predictions.decoder.bias"]
|
||||
authorized_unexpected_keys = [r"pooler"]
|
||||
_keys_to_ignore_on_load_missing = [r"position_ids", r"predictions.decoder.bias"]
|
||||
_keys_to_ignore_on_load_unexpected = [r"pooler"]
|
||||
|
||||
def __init__(self, config):
|
||||
super().__init__(config)
|
||||
@@ -829,8 +829,8 @@ class RobertaForCausalLM(RobertaPreTrainedModel):
|
||||
|
||||
@add_start_docstrings("""RoBERTa Model with a `language modeling` head on top. """, ROBERTA_START_DOCSTRING)
|
||||
class RobertaForMaskedLM(RobertaPreTrainedModel):
|
||||
authorized_missing_keys = [r"position_ids", r"predictions.decoder.bias"]
|
||||
authorized_unexpected_keys = [r"pooler"]
|
||||
_keys_to_ignore_on_load_missing = [r"position_ids", r"predictions.decoder.bias"]
|
||||
_keys_to_ignore_on_load_unexpected = [r"pooler"]
|
||||
|
||||
def __init__(self, config):
|
||||
super().__init__(config)
|
||||
@@ -948,7 +948,7 @@ class RobertaLMHead(nn.Module):
|
||||
ROBERTA_START_DOCSTRING,
|
||||
)
|
||||
class RobertaForSequenceClassification(RobertaPreTrainedModel):
|
||||
authorized_missing_keys = [r"position_ids"]
|
||||
_keys_to_ignore_on_load_missing = [r"position_ids"]
|
||||
|
||||
def __init__(self, config):
|
||||
super().__init__(config)
|
||||
@@ -1031,7 +1031,7 @@ class RobertaForSequenceClassification(RobertaPreTrainedModel):
|
||||
ROBERTA_START_DOCSTRING,
|
||||
)
|
||||
class RobertaForMultipleChoice(RobertaPreTrainedModel):
|
||||
authorized_missing_keys = [r"position_ids"]
|
||||
_keys_to_ignore_on_load_missing = [r"position_ids"]
|
||||
|
||||
def __init__(self, config):
|
||||
super().__init__(config)
|
||||
@@ -1123,8 +1123,8 @@ class RobertaForMultipleChoice(RobertaPreTrainedModel):
|
||||
ROBERTA_START_DOCSTRING,
|
||||
)
|
||||
class RobertaForTokenClassification(RobertaPreTrainedModel):
|
||||
authorized_unexpected_keys = [r"pooler"]
|
||||
authorized_missing_keys = [r"position_ids"]
|
||||
_keys_to_ignore_on_load_unexpected = [r"pooler"]
|
||||
_keys_to_ignore_on_load_missing = [r"position_ids"]
|
||||
|
||||
def __init__(self, config):
|
||||
super().__init__(config)
|
||||
@@ -1233,8 +1233,8 @@ class RobertaClassificationHead(nn.Module):
|
||||
ROBERTA_START_DOCSTRING,
|
||||
)
|
||||
class RobertaForQuestionAnswering(RobertaPreTrainedModel):
|
||||
authorized_unexpected_keys = [r"pooler"]
|
||||
authorized_missing_keys = [r"position_ids"]
|
||||
_keys_to_ignore_on_load_unexpected = [r"pooler"]
|
||||
_keys_to_ignore_on_load_missing = [r"position_ids"]
|
||||
|
||||
def __init__(self, config):
|
||||
super().__init__(config)
|
||||
|
||||
@@ -765,7 +765,7 @@ class TFRobertaLMHead(tf.keras.layers.Layer):
|
||||
@add_start_docstrings("""RoBERTa Model with a `language modeling` head on top. """, ROBERTA_START_DOCSTRING)
|
||||
class TFRobertaForMaskedLM(TFRobertaPreTrainedModel, TFMaskedLanguageModelingLoss):
|
||||
|
||||
authorized_missing_keys = [r"pooler"]
|
||||
_keys_to_ignore_on_load_missing = [r"pooler"]
|
||||
|
||||
def __init__(self, config, *inputs, **kwargs):
|
||||
super().__init__(config, *inputs, **kwargs)
|
||||
@@ -877,7 +877,7 @@ class TFRobertaClassificationHead(tf.keras.layers.Layer):
|
||||
)
|
||||
class TFRobertaForSequenceClassification(TFRobertaPreTrainedModel, TFSequenceClassificationLoss):
|
||||
|
||||
authorized_missing_keys = [r"pooler"]
|
||||
_keys_to_ignore_on_load_missing = [r"pooler"]
|
||||
|
||||
def __init__(self, config, *inputs, **kwargs):
|
||||
super().__init__(config, *inputs, **kwargs)
|
||||
@@ -1084,7 +1084,7 @@ class TFRobertaForMultipleChoice(TFRobertaPreTrainedModel, TFMultipleChoiceLoss)
|
||||
)
|
||||
class TFRobertaForTokenClassification(TFRobertaPreTrainedModel, TFTokenClassificationLoss):
|
||||
|
||||
authorized_missing_keys = [r"pooler"]
|
||||
_keys_to_ignore_on_load_missing = [r"pooler"]
|
||||
|
||||
def __init__(self, config, *inputs, **kwargs):
|
||||
super().__init__(config, *inputs, **kwargs)
|
||||
@@ -1171,7 +1171,7 @@ class TFRobertaForTokenClassification(TFRobertaPreTrainedModel, TFTokenClassific
|
||||
)
|
||||
class TFRobertaForQuestionAnswering(TFRobertaPreTrainedModel, TFQuestionAnsweringLoss):
|
||||
|
||||
authorized_missing_keys = [r"pooler"]
|
||||
_keys_to_ignore_on_load_missing = [r"pooler"]
|
||||
|
||||
def __init__(self, config, *inputs, **kwargs):
|
||||
super().__init__(config, *inputs, **kwargs)
|
||||
|
||||
Reference in New Issue
Block a user