From 8ebf7c6bd9bdda693a429a05a8d5496414492a03 Mon Sep 17 00:00:00 2001 From: jahatef Date: Tue, 31 Oct 2023 01:33:46 +0000 Subject: [PATCH] fix lion optimizer documentation --- megatron/neox_arguments/neox_args.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/megatron/neox_arguments/neox_args.py b/megatron/neox_arguments/neox_args.py index e1a58b6d9..8d0953da2 100644 --- a/megatron/neox_arguments/neox_args.py +++ b/megatron/neox_arguments/neox_args.py @@ -390,7 +390,7 @@ class NeoXArgsOptimizer(NeoXArgsTemplate): "adam", "onebitadam", "cpu_adam", "cpu_torch_adam", "sm3", "madgrad_wd", "sgd", "lion" ] = "adam" """ - Type of optimizer to use. Choose from ['adam', 'onebitadam', 'cpu_adam', 'cpu_torch_adam', 'sm3', 'madgrad_wd', 'sgd'] + Type of optimizer to use. Choose from ['adam', 'onebitadam', 'cpu_adam', 'cpu_torch_adam', 'sm3', 'madgrad_wd', 'sgd', 'lion'] NOTE: sgd will use MuSGD from Mup. Mup must be enabled for this optimizer. """