[Use cache] Align logic of use_cache with output_attentions and output_hidden_states (#5194)

* fix use cache * add bart use cache * fix bart * finish bart
2020-06-24 16:09:17 +02:00
parent 64c393ee74
commit c2a26ec8a6
13 changed files with 90 additions and 21 deletions
--- a/tests/test_modeling_t5.py
+++ b/tests/test_modeling_t5.py
@@ -193,7 +193,14 @@ class T5ModelTester:
        model.eval()

        # first forward pass
-        output, past_key_value_states = model(input_ids, use_cache=True)
+        outputs = model(input_ids, use_cache=True)
+        outputs_use_cache_conf = model(input_ids)
+        outputs_no_past = model(input_ids, use_cache=False)
+
+        self.parent.assertTrue(len(outputs) == len(outputs_use_cache_conf))
+        self.parent.assertTrue(len(outputs) == len(outputs_no_past) + 1)
+
+        output, past_key_value_states = outputs

        # create hypothetical next token and extend to next_input_ids
        next_tokens = ids_tensor((self.batch_size, 1), config.vocab_size)