From cfeef6d9d2c4b6fd6e978d28f604ff8dbe5c4bd0 Mon Sep 17 00:00:00 2001
From: Kosti
Date: Tue, 20 Feb 2024 23:47:17 +0000
Subject: [PATCH] Typo: SGD->AdamW (#471)

---
 transformer_lm/main.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/transformer_lm/main.py b/transformer_lm/main.py
index e5ec37dd..044af58c 100644
--- a/transformer_lm/main.py
+++ b/transformer_lm/main.py
@@ -189,7 +189,7 @@ if __name__ == "__main__":
         "--num_iters", type=int, default=100000, help="Iterations to train for."
     )
     parser.add_argument(
-        "--learning_rate", type=float, default=3e-4, help="SGD learning rate."
+        "--learning_rate", type=float, default=3e-4, help="AdamW learning rate."
     )
     parser.add_argument(
         "--weight_decay", type=float, default=1e-5, help="Set the weight decay"