Skip to content
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions src/datasets/arrow_dataset.py
Original file line number Diff line number Diff line change
Expand Up @@ -2941,7 +2941,7 @@ def init_buffer_and_writer():
pbar_unit = "ex" if not batched else "ba"
pbar_desc = (desc + " " if desc is not None else "") + "#" + str(rank) if rank is not None else desc
pbar = logging.tqdm(
- pbar_iterable,
+ zip(range(0, num_rows, batch_size), pbar_iterable),
total=pbar_total,
disable=disable_tqdm,
position=rank,
Expand All @@ -2960,7 +2960,7 @@ def init_buffer_and_writer():
else:
writer.write(example)
else:
- for i, batch in zip(range(0, num_rows, batch_size), pbar):
+ for i, batch in pbar:
indices = list(
range(*(slice(i, i + batch_size).indices(input_dataset.num_rows)))
) # Something simpler?
Expand Down