Add inverse sqrt learning rate scheduler (#21495)
* Added inverse sqrt lr scheduler
* Updated get_scheduler in src/transformers/optimization.py
* Updated src/transformers/__init__.py
* Added inverse sqrt lr scheduler test
* Updated docs/source/en/main_classes/optimizer_schedules.mdx
* Ran style and quality scripts
* Fix get_inverse_sqrt_schedule docstring
* Comment implementation URL
This commit is contained in:
committed by
GitHub
parent
b9af152efb
commit
a3034c7004
@@ -33,6 +33,7 @@ if is_torch_available():
|
||||
get_constant_schedule_with_warmup,
|
||||
get_cosine_schedule_with_warmup,
|
||||
get_cosine_with_hard_restarts_schedule_with_warmup,
|
||||
get_inverse_sqrt_schedule,
|
||||
get_linear_schedule_with_warmup,
|
||||
get_polynomial_decay_schedule_with_warmup,
|
||||
)
|
||||
@@ -145,6 +146,10 @@ class ScheduleInitTest(unittest.TestCase):
|
||||
{**common_kwargs, "power": 2.0, "lr_end": 1e-7},
|
||||
[0.0, 5.0, 10.0, 7.656, 5.625, 3.906, 2.5, 1.406, 0.625, 0.156],
|
||||
),
|
||||
get_inverse_sqrt_schedule: (
|
||||
{"num_warmup_steps": 2},
|
||||
[0.0, 5.0, 10.0, 8.165, 7.071, 6.325, 5.774, 5.345, 5.0, 4.714],
|
||||
),
|
||||
}
|
||||
|
||||
for scheduler_func, data in scheds.items():
|
||||
|
||||
Reference in New Issue
Block a user