[NeMo-UX] Adding recipes (NVIDIA#9720) (NVIDIA#9851)
* Adding recipe proposal

* Adding more recipes

* Apply isort and black reformatting

* Remove api.py inside llm.gpt.model

* Adding resume to FineTuneRecipy

* Fix spelling error

* Fix spelling error

* Fix spelling error

* Apply isort and black reformatting

* Adding resume to PreTrainRecipe

* update recipe proposal to use sdk.Partial

* Apply isort and black reformatting

* update __init__

* update __init__

* fix return type

* Fix bug in factory

* rename recipe folder to 'models'

* Fixes

* Apply isort and black reformatting

* Bug fixes

* rename models --> configs

* Apply isort and black reformatting

* rename configs --> recipes

* Apply isort and black reformatting

* address comments

---------

Signed-off-by: ashors1 <[email protected]>
Signed-off-by: artbataev <[email protected]>
Signed-off-by: marcromeyn <[email protected]>
Signed-off-by: ashors1 <[email protected]>
Signed-off-by: Hemil Desai <[email protected]>
Signed-off-by: hemildesai <[email protected]>
Co-authored-by: Marc Romeyn <[email protected]>
Co-authored-by: artbataev <[email protected]>
Co-authored-by: marcromeyn <[email protected]>
Co-authored-by: ashors1 <[email protected]>
Co-authored-by: ashors1 <[email protected]>
Co-authored-by: Hemil Desai <[email protected]>
Co-authored-by: hemildesai <[email protected]>
Co-authored-by: Anna Shors <[email protected]>
Signed-off-by: Boxiang Wang <[email protected]>
9 people authored and BoxiangW committed Jul 30, 2024
1 parent 4a10842 commit dbf151a
Showing 13 changed files with 320 additions and 162 deletions.
35 changes: 1 addition & 34 deletions nemo/collections/llm/__init__.py
@@ -42,24 +42,7 @@
    gpt_data_step,
    gpt_forward_step,
)
from nemo.collections.llm.gpt.model.api import (
    code_gemma_2b,
    code_gemma_7b,
    code_llama_7b,
    code_llama_13b,
    code_llama_34b,
    code_llama_70b,
    gemma,
    gemma_2b,
    gemma_7b,
    llama2_7b,
    llama2_13b,
    llama2_70b,
    llama3_8b,
    llama3_70b,
    mistral,
    mixtral,
)
from nemo.collections.llm.recipes import * # noqa

__all__ = [
"MockDataModule",
@@ -103,21 +86,5 @@
"mock",
"squad",
"dolly",
"mistral",
"mixtral",
"llama2_7b",
"llama3_8b",
"llama2_13b",
"llama2_70b",
"llama3_70b",
"code_llama_7b",
"code_llama_13b",
"code_llama_34b",
"code_llama_70b",
"gemma",
"gemma_2b",
"gemma_7b",
"code_gemma_2b",
"code_gemma_7b",
"peft",
]
125 changes: 0 additions & 125 deletions nemo/collections/llm/gpt/model/api.py

This file was deleted.

13 changes: 13 additions & 0 deletions nemo/collections/llm/recipes/__init__.py
@@ -0,0 +1,13 @@
from nemo.collections.llm.recipes import llama2_7b, llama3_8b, llama3_8b_16k, llama3_8b_64k, mistral
from nemo.collections.llm.recipes.log.default import default_log
from nemo.collections.llm.recipes.optim import adam

__all__ = [
"llama3_8b",
"llama3_8b_16k",
"llama3_8b_64k",
"llama2_7b",
"mistral",
"adam",
"default_log",
]
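
With the wildcard import added to nemo/collections/llm/__init__.py above, these recipe modules become reachable as attributes of the llm collection. A minimal usage sketch, assuming the factory-decorated callables can be invoked directly to build their configured objects (this commit itself only registers them):

from nemo.collections import llm

# Hypothetical usage, not part of this commit: each recipe module exposes
# factory-registered callables such as model(), trainer(), and pretrain_recipe().
recipe = llm.llama3_8b.pretrain_recipe()    # assumed to return a Partial
trainer = llm.llama3_8b.trainer(devices=4)  # assumed to return an nl.Trainer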
61 changes: 61 additions & 0 deletions nemo/collections/llm/recipes/llama2_7b.py
@@ -0,0 +1,61 @@
import pytorch_lightning as pl

from nemo import lightning as nl
from nemo.collections.llm.api import finetune, pretrain
from nemo.collections.llm.gpt.data.api import squad
from nemo.collections.llm.gpt.model.llama import Llama2Config7B, LlamaModel
from nemo.collections.llm.peft.api import gpt_lora
from nemo.collections.llm.recipes.log.default import default_log
from nemo.collections.llm.recipes.optim.adam import adam_with_cosine_annealing
from nemo.collections.llm.utils import Partial, factory

NAME = "llama2_7b"


@factory(name=NAME)
def model() -> pl.LightningModule:
    return LlamaModel(Llama2Config7B())


@factory(name=NAME)
def trainer(devices=8) -> nl.Trainer:
    strategy = nl.MegatronStrategy(tensor_model_parallel_size=2)

    return nl.Trainer(
        devices=devices,
        max_steps=100,
        accelerator="gpu",
        strategy=strategy,
        plugins=nl.MegatronMixedPrecision(precision="bf16-mixed"),
    )


@factory(name=NAME + "_hf")
def hf_resume() -> nl.AutoResume:
    return nl.AutoResume(import_path="hf://meta-llama/Llama-2-7b-hf")


@factory(name=NAME, for_task="llm.pretrain")
def pretrain_recipe() -> Partial:
    return Partial(
        pretrain,
        model=model,
        trainer=trainer,
        data=squad,
        log=default_log,
        optim=adam_with_cosine_annealing,
    )


@factory(name=NAME, for_task="llm.finetune")
def finetune_recipe() -> Partial:
    return Partial(
        finetune,
        model=model,
        trainer=trainer,
        data=squad,
        log=default_log,
        optim=adam_with_cosine_annealing,
        peft=gpt_lora,
        resume=hf_resume,
    )
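
Each recipe module follows the same pattern: model, trainer, and an optional hf_resume factory are registered under a shared NAME, and pretrain_recipe/finetune_recipe bundle them into a Partial for the matching llm task. A rough sketch of what finetune_recipe wires together, assuming the factory-decorated callables can also be called directly outside the Partial machinery (an assumption, not something this diff exercises):

from nemo.collections.llm.api import finetune
from nemo.collections.llm.gpt.data.api import squad
from nemo.collections.llm.peft.api import gpt_lora
from nemo.collections.llm.recipes import llama2_7b
from nemo.collections.llm.recipes.log.default import default_log
from nemo.collections.llm.recipes.optim.adam import adam_with_cosine_annealing

# Keyword arguments mirroring the Partial built by finetune_recipe above.
finetune(
    model=llama2_7b.model(),
    trainer=llama2_7b.trainer(devices=8),
    data=squad(),
    log=default_log(),
    optim=adam_with_cosine_annealing(),
    peft=gpt_lora(),
    resume=llama2_7b.hf_resume(),
)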
61 changes: 61 additions & 0 deletions nemo/collections/llm/recipes/llama3_8b.py
@@ -0,0 +1,61 @@
import pytorch_lightning as pl

from nemo import lightning as nl
from nemo.collections.llm.api import finetune, pretrain
from nemo.collections.llm.gpt.data.api import squad
from nemo.collections.llm.gpt.model.llama import Llama3Config8B, LlamaModel
from nemo.collections.llm.peft.api import gpt_lora
from nemo.collections.llm.recipes.log.default import default_log
from nemo.collections.llm.recipes.optim.adam import adam_with_cosine_annealing
from nemo.collections.llm.utils import Partial, factory

NAME = "llama3_8b"


@factory(name=NAME)
def model() -> pl.LightningModule:
    return LlamaModel(Llama3Config8B(seq_length=16384))


@factory(name=NAME)
def trainer(devices=8) -> nl.Trainer:
    strategy = nl.MegatronStrategy(tensor_model_parallel_size=2)

    return nl.Trainer(
        devices=devices,
        max_steps=100,
        accelerator="gpu",
        strategy=strategy,
        plugins=nl.MegatronMixedPrecision(precision="bf16-mixed"),
    )


@factory(name=NAME + "_hf")
def hf_resume() -> nl.AutoResume:
    return nl.AutoResume(import_path="hf://meta-llama/Meta-Llama-3-8B")


@factory(name=NAME, for_task="llm.pretrain")
def pretrain_recipe() -> Partial:
    return Partial(
        pretrain,
        model=model,
        trainer=trainer,
        data=squad,
        log=default_log,
        optim=adam_with_cosine_annealing,
    )


@factory(name=NAME, for_task="llm.finetune")
def finetune_recipe() -> Partial:
    return Partial(
        finetune,
        model=model,
        trainer=trainer,
        data=squad,
        log=default_log,
        optim=adam_with_cosine_annealing,
        peft=gpt_lora,
        resume=hf_resume,
    )
45 changes: 45 additions & 0 deletions nemo/collections/llm/recipes/llama3_8b_16k.py
@@ -0,0 +1,45 @@
import pytorch_lightning as pl

from nemo import lightning as nl
from nemo.collections.llm.api import pretrain
from nemo.collections.llm.gpt.data.api import squad
from nemo.collections.llm.gpt.model.llama import Llama3Config8B, LlamaModel
from nemo.collections.llm.recipes.log.default import default_log
from nemo.collections.llm.recipes.optim.adam import adam_with_cosine_annealing
from nemo.collections.llm.utils import Partial, factory

NAME = "llama3_8b_16k"


@factory(name=NAME)
def model() -> pl.LightningModule:
    return LlamaModel(Llama3Config8B(seq_length=16384))


@factory(name=NAME)
def trainer(devices=8) -> nl.Trainer:
    strategy = nl.MegatronStrategy(
        tensor_model_parallel_size=4,
        context_parallel_size=2,
        sequence_parallel=True,
    )

    return nl.Trainer(
        devices=devices,
        max_steps=100,
        accelerator="gpu",
        strategy=strategy,
        plugins=nl.MegatronMixedPrecision(precision="bf16-mixed"),
    )


@factory(name=NAME, for_task="llm.pretrain")
def pretrain_recipe() -> Partial:
    return Partial(
        pretrain,
        model=model,
        trainer=trainer,
        data=squad,
        log=default_log,
        optim=adam_with_cosine_annealing,
    )
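
In the 16k-sequence recipe the parallelism settings multiply out to the default device count: tensor_model_parallel_size (4) × context_parallel_size (2) = 8 GPUs, matching trainer(devices=8), so the recipe fits a single 8-GPU node at these settings. A small consistency check, assuming the usual Megatron convention that the product of the model-parallel degrees must divide the device count:

# Hypothetical sanity check, not part of the commit.
tensor_parallel = 4
context_parallel = 2
devices = 8
assert devices % (tensor_parallel * context_parallel) == 0  # 8 % 8 == 0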
