From ca422e3d7d8086baf233993af2f6f90f30729933 Mon Sep 17 00:00:00 2001
From: Patrick von Platen
Date: Thu, 21 Jan 2021 11:17:13 +0100
Subject: [PATCH] finish (#9721)

---
 src/transformers/models/t5/modeling_t5.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/transformers/models/t5/modeling_t5.py b/src/transformers/models/t5/modeling_t5.py
index a050b81fd0..f27ede05e1 100644
--- a/src/transformers/models/t5/modeling_t5.py
+++ b/src/transformers/models/t5/modeling_t5.py
@@ -934,9 +934,9 @@ class T5Stack(T5PreTrainedModel):
                     encoder_extended_attention_mask = encoder_extended_attention_mask.to(hidden_states.device)
                 if encoder_decoder_position_bias is not None:
                     encoder_decoder_position_bias = encoder_decoder_position_bias.to(hidden_states.device)
-                if head_mask is not None:
+                if not (isinstance(head_mask, list) and head_mask[0] is None):
                     head_mask = head_mask.to(hidden_states.device)
-                if encoder_head_mask is not None:
+                if not (isinstance(encoder_head_mask, list) and encoder_head_mask[0] is None):
                     encoder_head_mask = encoder_head_mask.to(hidden_states.device)
             if output_hidden_states:
                 all_hidden_states = all_hidden_states + (hidden_states,)