Skip to content

Commit b81d118

Browse files
authored
Merge pull request #28 from AI-Hypercomputer/nemo-a4x-recipes
Fix comments to reflect the right llama model
2 parents 2b09a91 + 4171130 commit b81d118

File tree

1 file changed: 3 additions (+3) and 3 deletions (-3).

training/a4x/llama3-1-70b/nemo-pretraining-gke/16node-FP8CS-GBS2048/recipe/llama3-1-70b-fp8cs-gbs2048-gpus64.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
"""Nemo2 pretraining recipe for Llama 3.1 8B model."""
1+
"""Nemo2 pretraining recipe for Llama 3.1 70B model."""
22

33
from nemo.collections import llm
44
from nemo.collections.llm.recipes import llama31_70b
@@ -17,7 +17,7 @@ def recipe(
1717
profile_end_step: int = 0,
1818
profile_ranks: str = "0",
1919
) -> run.Partial:
20-
"""Returns a Nemo2 training recipe for Llama 3.1 8B model.
20+
"""Returns a Nemo2 training recipe for Llama 3.1 70B model.
2121
2222
Args:
2323
profile_enabled: Whether to enable Nsys profiling.
@@ -102,7 +102,7 @@ def recipe(
102102
pretrain.trainer.callbacks.append(
103103
run.Config(
104104
FLOPsMeasurementCallback,
105-
model_name="llama31-8b",
105+
model_name="llama31-70b",
106106
model_config=pretrain.model.config,
107107
data_config=pretrain.data,
108108
)

0 commit comments

Comments (0)