diff --git a/setup.py b/setup.py
index 642ba0a845..edc3dfdcc5 100644
--- a/setup.py
+++ b/setup.py
@@ -57,7 +57,7 @@
     'transformers>=v4.51.0,<4.52',
     'mosaicml-streaming>=0.12.0,<0.13',
     'torch>=2.7.0,<2.7.1',
-    'datasets>=3.3.2,<3.7',
+    'datasets>=3.3.2,<4.2',
     'fsspec==2023.6.0', # newer version results in a bug in datasets that duplicates data
     'sentencepiece==0.2.0',
     'einops==0.8.1',