From d064fb56476de2280b7d74b0ff9da06956a9d18a Mon Sep 17 00:00:00 2001
From: felixgwu
Date: Wed, 3 Mar 2021 12:05:21 -0500
Subject: [PATCH] Fix the bug in constructing the all_hidden_states of DeBERTa v2 (#10466)

* fix all_hidden_states

* use output_states instead of next_kv
---
 src/transformers/models/deberta_v2/modeling_deberta_v2.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/transformers/models/deberta_v2/modeling_deberta_v2.py b/src/transformers/models/deberta_v2/modeling_deberta_v2.py
index 29f495b481..4fd6131e45 100644
--- a/src/transformers/models/deberta_v2/modeling_deberta_v2.py
+++ b/src/transformers/models/deberta_v2/modeling_deberta_v2.py
@@ -450,10 +450,11 @@ class DebertaV2Encoder(nn.Module):
         else:
             next_kv = hidden_states
         rel_embeddings = self.get_rel_embedding()
+        output_states = next_kv
         for i, layer_module in enumerate(self.layer):
 
             if output_hidden_states:
-                all_hidden_states = all_hidden_states + (hidden_states,)
+                all_hidden_states = all_hidden_states + (output_states,)
 
             output_states = layer_module(
                 next_kv,