diff --git a/examples/run_transfo_xl.py b/examples/run_transfo_xl.py
index 1218a1f547..3a0a70e68e 100644
--- a/examples/run_transfo_xl.py
+++ b/examples/run_transfo_xl.py
@@ -100,7 +100,10 @@ def main():
         total_len, total_loss = 0, 0.
         start_time = time.time()
         with torch.no_grad():
-            mems = tuple()
+            # mems starts as None and is replaced by the value the model returns after each batch.
+            mems = None
             for idx, (data, target, seq_len) in enumerate(eval_iter):
-                ret = model(data, target, *mems)
+                # Pass mems as one argument: `*mems` raises TypeError while mems is still None.
+                # NOTE(review): assumes model() accepts mems as a single optional argument - confirm.
+                ret = model(data, target, mems)
                 loss, mems = ret