Skip to content

Commit

Permalink
Merged.
Browse files Browse the repository at this point in the history
  • Loading branch information
apaz-cli committed Jan 18, 2025
2 parents 0e87e1d + f6e238a commit 22e14e9
Show file tree
Hide file tree
Showing 3 changed files with 35 additions and 5 deletions.
22 changes: 22 additions & 0 deletions configs/150M/H100-fast.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,22 @@
# Run configuration: root-level model/project identifiers, followed by the
# [train], [optim], [optim.optim] and [data] tables.
name_model = "150M"
project = "debug_150m_zero_band"
type_model = "llama2"

[train]
micro_bs = 64 # change this based on the GPU
# NOTE(review): presumably forwarded to the FSDP option of the same name —
# confirm against the trainer.
reshard_after_forward = true

[optim]
# 512 = 8 x train.micro_bs; how the two relate (e.g. gradient accumulation
# and/or number of ranks) is decided by the trainer — TODO confirm.
batch_size = 512
# 278 of the 8192 total steps (about 3.4%).
warmup_steps = 278
total_steps = 8192

# Optimizer hyperparameters, nested one level below [optim].
# NOTE(review): the full-precision float values look like the output of an
# automated search rather than hand-picked numbers — confirm their origin
# before rounding or editing them.
[optim.optim]
lr = 0.003551730141097694
betas1 = 0.9454835470717078
betas2 = 0.9190488086654895
weight_decay = 0.24530252977858977

[data]
# NOTE(review): presumably measured in tokens — confirm.
seq_length = 1024
# Relative path; what it resolves against is not specified in this file —
# verify against the data loader.
dataset_name_or_paths = "datasets/fineweb-edu"
2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,7 @@ dependencies = [
"ninja",
"zstandard",
"pyarrow",
-"toposolve",
+"toposolve>=0.1.17",
"psutil",
"torch-shampoo @ git+https://github.com/facebookresearch/optimizers.git@main",
"liger-kernel",
Expand Down
16 changes: 12 additions & 4 deletions uv.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

0 comments on commit 22e14e9

Please sign in to comment.