Skip to content

Commit

Permalink
fix chunk_num_per_shard #1
Browse files: browse the repository at this point in the history
  • Loading branch information
t1101675 committed Nov 7, 2024
1 parent e680467 commit 6d914e8
Showing 1 changed file with 1 addition and 0 deletions.
1 change: 1 addition & 0 deletions data_utils/indexed_dataset.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -141,6 +141,7 @@ def __init__(self,
self.output_path = output_path
self.bin_file = os.path.join(self.output_path, f"{self.split}_{self.ofid}.bin")
self.idx_file = os.path.join(self.output_path, f"{self.split}_{self.ofid}.idx")
self.chunk_num_per_shard = chunk_num_per_shard
self.tmp_output_path = tmp_output_path
if self.tmp_output_path is not None:
self.tmp_bin_file = os.path.join(self.tmp_output_path, f"{self.split}_{self.ofid}.bin")
Expand Down

0 comments on commit 6d914e8

Please sign in to comment.