From 63e91f5fde64563bdf19276d3eca9b61fc8310c3 Mon Sep 17 00:00:00 2001
From: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
Date: Fri, 20 Nov 2020 09:27:25 -0500
Subject: [PATCH] Document adam betas TrainingArguments (#8688)

---
 src/transformers/training_args.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/src/transformers/training_args.py b/src/transformers/training_args.py
index d9650261ea..416037ac43 100644
--- a/src/transformers/training_args.py
+++ b/src/transformers/training_args.py
@@ -89,6 +89,10 @@ class TrainingArguments:
             The initial learning rate for Adam.
         weight_decay (:obj:`float`, `optional`, defaults to 0):
             The weight decay to apply (if not zero).
+        adam_beta1 (:obj:`float`, `optional`, defaults to 0.9):
+            The beta1 for the Adam optimizer.
+        adam_beta2 (:obj:`float`, `optional`, defaults to 0.999):
+            The beta2 for the Adam optimizer.
         adam_epsilon (:obj:`float`, `optional`, defaults to 1e-8):
             Epsilon for the Adam optimizer.
         max_grad_norm (:obj:`float`, `optional`, defaults to 1.0):