Skip to content

Commit

Permalink
adjust hidden size, NCCL log level
Browse files (browse the repository at this point in the history)
  • Loading branch information
epwalsh committed Dec 3, 2024
1 parent 3dfdedf commit 355f61a
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 0 deletions.
3 changes: 3 additions & 0 deletions src/olmo_core/internal/common.py
Original file line number | Diff line number | Diff line change
@@ -6,6 +6,7 @@
from olmo_core.io import is_url
from olmo_core.launch.beaker import (
BeakerEnvSecret,
BeakerEnvVar,
BeakerLaunchConfig,
BeakerWekaBucket,
OLMoCoreBeakerImage,
@@ -61,6 +62,7 @@ def build_launch_config(
task_name: str = "train",
workspace: str = "ai2/OLMo-core",
budget: str = "ai2/oe-training",
nccl_debug: bool = False,
) -> BeakerLaunchConfig:
weka_buckets: List[BeakerWekaBucket] = []
if root_dir.startswith("/weka/"):
@@ -81,6 +83,7 @@ def build_launch_config(
num_gpus=8,
shared_filesystem=not is_url(root_dir),
allow_dirty=False,
env_vars=[BeakerEnvVar(name="NCCL_DEBUG", value="INFO" if nccl_debug else "WARN")],
env_secrets=[
BeakerEnvSecret(name="BEAKER_TOKEN", secret=f"{beaker_user}_BEAKER_TOKEN"),
BeakerEnvSecret(name="WANDB_API_KEY", secret=f"{beaker_user}_WANDB_API_KEY"),
Expand Down
1 change: 1 addition & 0 deletions src/olmo_core/nn/transformer/config.py
Original file line number | Diff line number | Diff line change
@@ -460,6 +460,7 @@ def olmo2_26B(cls, vocab_size: int, **kwargs) -> "TransformerConfig":
block_name=kwargs.pop("block_name", TransformerBlockType.reordered_norm),
qk_norm=kwargs.pop("qk_norm", True),
rope_theta=kwargs.pop("rope_theta", 500_000),
hidden_size_multiple_of=kwargs.pop("hidden_size_multiple_of", 1024),
layer_norm_eps=1e-6,
**kwargs,
)
Expand Down

0 comments on commit 355f61a

Please sign in to comment.