Skip to content

Commit

Permalink
Add default processes in text to mds conversion (#608)
Browse files: browse the repository at this point in the history
  • Loading branch information
irenedea committed Sep 18, 2023
1 parent e7c4567 commit 10b221f
Showing 1 changed file with 2 additions and 1 deletion.
3 changes: 2 additions & 1 deletion scripts/data_prep/convert_text_to_mds.py
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@
from glob import glob
from typing import Iterable, List, Tuple, cast

+import psutil
from composer.utils import (ObjectStore, maybe_create_object_store_from_uri,
parse_uri)
from streaming import MDSWriter
Expand Down Expand Up @@ -87,7 +88,7 @@ def parse_args() -> Namespace:
'--processes',
type=int,
required=False,
-default=1,
+default=min(max(psutil.cpu_count() - 2, 1), 32),
help=
'The number of processes to use to download and convert the dataset',
)
Expand Down

0 comments on commit 10b221f

Please sign in to comment.