Skip to content

Commit

Permalink
fix
Browse files Browse the repository at this point in the history
  • Loading branch information
ahmeda14960 committed Feb 16, 2024
1 parent 4136e66 commit eea0fa0
Show file tree
Hide file tree
Showing 2 changed files with 16 additions and 6 deletions.
4 changes: 2 additions & 2 deletions config/gpt2_med.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,8 +11,8 @@ model:
gradient_checkpointing: true
scale_attn_by_inverse_layer_idx: true

- # initialize_from_hf: "gpt2-medium"
- # use_hf_model_config: true
+ initialize_from_hf: "gpt2-medium"
+ use_hf_model_config: true

trainer:
wandb:
Expand Down
18 changes: 14 additions & 4 deletions config/gpt2_medium.yaml
Original file line number Diff line number Diff line change
@@ -1,4 +1,7 @@
- data: !include data/openwebtext_source.yaml
+ data:
+ id: dlwh/wikitext_103_detokenized
+ tokenizer: "EleutherAI/gpt-neox-20b"
+ cache_dir: "gs://levanter-data/tokenized/wiki-fast/"
model:
type: gpt2
hidden_dim: 1024
Expand All @@ -7,15 +10,22 @@ model:
seq_len: 1024
gradient_checkpointing: true
scale_attn_by_inverse_layer_idx: true

initialize_from_hf: "gpt2-medium"
use_hf_model_config: true

trainer:
wandb:
- project: "levanter"
+ project: "locked"
tags: [ "openwebtext", "gpt2"]

mp: p=f32,c=bfloat16
model_axis_size: 1
- per_device_parallelism: 16
+ per_device_parallelism: -1
train_batch_size: 32
num_train_steps: 2000000
optimizer:
- learning_rate: 3E-4
+ learning_rate: 1E-6
weight_decay: 0.1
warmup: 0.01
min_lr_ratio: 0.1

0 comments on commit eea0fa0

Please sign in to comment.