diff --git a/configs/150M/3090.toml b/configs/150M/3090.toml index 5179e298..f3c11a49 100644 --- a/configs/150M/3090.toml +++ b/configs/150M/3090.toml @@ -11,3 +11,9 @@ batch_size = 512 warmup_steps = 1000 total_steps = 88_000 lr = 4e-4 + + +[data] +dataset_name_or_paths = "/data/datasets/fineweb-edu,/data/datasets/StackV1-popular" +dataset_ratio = "80:20" +num_workers = 2 \ No newline at end of file