From 6c1b23554f8bb5b5e1f6c80969acab764c755678 Mon Sep 17 00:00:00 2001 From: Lysandre Date: Mon, 3 Feb 2020 17:23:53 -0500 Subject: [PATCH] Sample instead of greedy decoding by default in generate --- src/transformers/modeling_utils.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/transformers/modeling_utils.py b/src/transformers/modeling_utils.py index 2e1215cb45..4178e8ca1e 100644 --- a/src/transformers/modeling_utils.py +++ b/src/transformers/modeling_utils.py @@ -586,7 +586,7 @@ class PreTrainedModel(nn.Module, ModuleUtilsMixin): self, input_ids=None, max_length=None, - do_sample=None, + do_sample=True, num_beams=None, temperature=None, top_k=None, @@ -617,7 +617,7 @@ class PreTrainedModel(nn.Module, ModuleUtilsMixin): The max length of the sequence to be generated. Between 1 and infinity. Default to 20. do_sample: (`optional`) bool - If set to `False` greedy decoding is used. Otherwise sampling is used. Default to greedy sampling. + If set to `False` greedy decoding is used. Otherwise sampling is used. Defaults to `True`. num_beams: (`optional`) int Number of beams for beam search. Must be between 1 and infinity. 1 means no beam search. Default to 1.