Skip to content

Commit

Permalink
best 150m adam hparams
Browse files Browse the repository at this point in the history
  • Loading branch information
Jackmin801 committed Jan 18, 2025
1 parent 1c1c6a2 commit 1f53b72
Showing 1 changed file with 22 additions and 0 deletions.
22 changes: 22 additions & 0 deletions configs/150M/H100-fast.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,22 @@
# Run identity for the 150M model configuration.
# NOTE(review): `project` carries a "debug_" prefix — presumably the
# experiment-tracking project name; confirm it is intended for tuned runs.
name_model = "150M"
project = "debug_150m_zero_band"
# Model architecture family selector.
type_model = "llama2"

# Hardware-dependent training settings.
[train]
# Micro-batch size; tune to fit the memory of the target accelerator.
micro_bs = 64 # change this based on the GPU
# NOTE(review): presumably the FSDP-style option that frees gathered
# parameters after the forward pass (less memory, more communication) —
# confirm against the trainer.
reshard_after_forward = true

# Optimization schedule.
[optim]
# NOTE(review): presumably the global batch size per optimizer step, split
# into micro-batches of [train].micro_bs — confirm units (sequences vs. tokens).
batch_size = 512
# Warmup covers 278 of the 8192 total steps (about 3.4% of the run).
warmup_steps = 278
total_steps = 8192

# Optimizer hyperparameters for the 150M model.
# NOTE(review): the un-rounded values look like the output of an automated
# hyperparameter search — TODO record which sweep produced them.
[optim.optim]
lr = 0.003551730141097694
# NOTE(review): betas2 is lower than betas1 here, which is unusual for
# Adam-style optimizers — presumably intentional from tuning; confirm.
betas1 = 0.9454835470717078
betas2 = 0.9190488086654895
weight_decay = 0.24530252977858977

# Input data settings.
[data]
# NOTE(review): presumably the number of tokens per training sequence — confirm.
seq_length = 1024
# Relative path to the dataset.
# NOTE(review): presumably resolved against the launch working directory; the
# key name suggests a dataset name may also be accepted — confirm.
dataset_name_or_paths = "datasets/fineweb-edu"

0 comments on commit 1f53b72

Please sign in to comment.