We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents 060780d + 3cd1a3a commit 65f9791Copy full SHA for 65f9791
train_configs/llama3_405b.toml
@@ -23,7 +23,7 @@ tokenizer_path = "./torchtitan/datasets/tokenizer/original/tokenizer.model"
23
24
[optimizer]
25
name = "AdamW"
26
-lr = 0.8e-4
+lr = 8e-5
27
28
[training]
29
batch_size = 2
0 commit comments