diff --git a/docs/source/en/optimizers.md b/docs/source/en/optimizers.md index 20bb956ad6..8c8a197dba 100644 --- a/docs/source/en/optimizers.md +++ b/docs/source/en/optimizers.md @@ -137,7 +137,6 @@ args = TrainingArguments( max_steps=1000, per_device_train_batch_size=4, optim="adalomo", - gradient_checkpointing=True, gradient_checkpointing=True, logging_strategy="steps", logging_steps=1, @@ -199,4 +198,4 @@ args = TrainingArguments( save_strategy="no", run_name="stable-adamw", ) -``` \ No newline at end of file +```