Skip to content

Commit

Permalink
add missing model definitions
Browse files Browse the repository at this point in the history
  • Loading branch information
samos123 committed Nov 18, 2024
1 parent d1b5014 commit 497f90e
Showing 1 changed file with 4 additions and 1 deletion.
5 changes: 4 additions & 1 deletion axlearn/experiments/text/gpt/fuji.py
Original file line number Diff line number Diff line change
Expand Up @@ -54,7 +54,7 @@
from axlearn.experiments.text.gpt.common import scaled_hidden_dim
from axlearn.experiments.trainer_config_utils import TrainerConfigFn

MODEL_SIZES = ("test", "1B", "3B", "7B", "8B", "70B")
MODEL_SIZES = ("test", "1B", "3B", "7B", "8B", "70B", "405B")


class Version(enum.Enum):
Expand Down Expand Up @@ -92,18 +92,21 @@ class Version(enum.Enum):
"test": 1 * (1024**4), # 1T tokens
"7B": 1 * (1024**4), # 1T tokens
"70B": int(1.4 * (1024**4)), # 1.4T tokens
"405B": int(1.4 * (1024**4)), # 1.4T tokens
},
Version.V2: {
"test": 2 * (1024**4), # 2T tokens
"7B": 2 * (1024**4), # 2T tokens
"70B": 2 * (1024**4), # 2T tokens
"405B": 2 * (1024**4), # 2T tokens
},
Version.V3: {
"test": 15 * (1024**4), # 15T tokens
"1B": 15 * (1024**4), # 15T tokens
"3B": 15 * (1024**4), # 15T tokens
"8B": 15 * (1024**4), # 15T tokens
"70B": 15 * (1024**4), # 15T tokens
"405B": 15 * (1024**4), # 15T tokens
},
}

Expand Down

0 comments on commit 497f90e

Please sign in to comment.