diff --git a/litgpt/config.py b/litgpt/config.py index 9ff7825589..e03fa8ae34 100644 --- a/litgpt/config.py +++ b/litgpt/config.py @@ -847,8 +847,8 @@ def norm_class(self) -> Type: name="Llama-3-8B{}", hf_config=dict(org="meta-llama", name="Meta-Llama-3-8B{}"), block_size=8192, - vocab_size=128256, - padding_multiple=64, + vocab_size=128000, + padded_vocab_size=128256, n_layer=32, n_head=32, n_query_groups=8, @@ -865,8 +865,8 @@ def norm_class(self) -> Type: name="Llama-3-70B{}", hf_config=dict(org="meta-llama", name="Meta-Llama-3-70B{}"), block_size=8192, - vocab_size=128256, - padding_multiple=64, + vocab_size=128000, + padded_vocab_size=128256, n_layer=80, n_head=64, n_embd=8192,