diff --git a/train_configs/llama3_405b.toml b/train_configs/llama3_405b.toml
index fb250642..b7f78dc2 100644
--- a/train_configs/llama3_405b.toml
+++ b/train_configs/llama3_405b.toml
@@ -23,7 +23,7 @@ tokenizer_path = "./torchtitan/datasets/tokenizer/original/tokenizer.model"
 
 [optimizer]
 name = "AdamW"
-lr = 0.8e-4
+lr = 8e-5
 
 [training]
 batch_size = 2