Skip to content

Commit

Permalink
set world-size=1
Browse files: browse the repository at this point in the history
  • Loading branch information
eitanturok committed Oct 7, 2024
1 parent f87c9da commit bb42db4
Showing 1 changed file with 3 additions and 0 deletions.
3 changes: 3 additions & 0 deletions scripts/data_prep/convert_dataset_hf.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -2,6 +2,7 @@
# SPDX-License-Identifier: Apache-2.0

"""Streaming dataset conversion scripts for C4 and The Pile."""
import os
from argparse import ArgumentParser, Namespace

from llmfoundry.command_utils import convert_dataset_hf_from_args
Expand Down Expand Up @@ -48,6 +49,8 @@ def parse_args() -> Namespace:

if __name__ == '__main__':
args = parse_args()
# to fix https://github.com/mosaicml/llm-foundry/issues/1575
os.environ['WORLD_SIZE'] = '1'
convert_dataset_hf_from_args(
dataset=args.dataset,
data_subset=args.data_subset,
Expand Down

0 comments on commit bb42db4

Please sign in to comment.