diff --git a/pyproject.toml b/pyproject.toml
index 24fd66dbbb..1b78651a0b 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,5 +1,5 @@
 [build-system]
-requires = ["setuptools==80.9.0", "setuptools-scm==9.2.0"]
+requires = ["setuptools==82.0.1", "setuptools-scm==10.1.1"]
 build-backend = "setuptools.build_meta"
 
 [project]
@@ -78,14 +78,14 @@ huggingfacenotorch = [
     "tyro",
     "protobuf",
     "sentencepiece>=0.2.0",
-    "datasets>=3.4.1,!=4.0.*,!=4.1.0,<4.4.0",
+    "datasets>=3.4.1,!=4.0.*,!=4.1.0,<5.1",
     "accelerate>=0.34.1",
     "peft>=0.18.0,!=0.11.0",
     "huggingface_hub>=0.34.0",
     "hf_transfer",
     "diffusers",
-    "transformers>=4.51.3,!=4.52.0,!=4.52.1,!=4.52.2,!=4.52.3,!=4.53.0,!=4.54.0,!=4.55.0,!=4.55.1,!=4.57.0,!=4.57.4,!=4.57.5,!=5.0.0,!=5.1.0,<=5.5.0",
-    "trl>=0.18.2,!=0.19.0,<=0.24.0",
+    "transformers>=4.51.3,!=4.52.0,!=4.52.1,!=4.52.2,!=4.52.3,!=4.53.0,!=4.54.0,!=4.55.0,!=4.55.1,!=4.57.0,!=4.57.4,!=4.57.5,!=5.0.0,!=5.1.0,<=5.12.1",
+    "trl>=0.18.2,!=0.19.0,<=1.6.0",
     "sentence-transformers",
 ]
 huggingface = [
@@ -583,8 +583,8 @@ colab-new = [
     "unsloth_zoo>=2026.6.1",
     "packaging",
     "tyro",
-    "transformers>=4.51.3,!=4.52.0,!=4.52.1,!=4.52.2,!=4.52.3,!=4.53.0,!=4.54.0,!=4.55.0,!=4.55.1,!=4.57.0,!=4.57.4,!=4.57.5,!=5.0.0,!=5.1.0,<=5.5.0",
-    "datasets>=3.4.1,!=4.0.*,!=4.1.0,<4.4.0",
+    "transformers>=4.51.3,!=4.52.0,!=4.52.1,!=4.52.2,!=4.52.3,!=4.53.0,!=4.54.0,!=4.55.0,!=4.55.1,!=4.57.0,!=4.57.4,!=4.57.5,!=5.0.0,!=5.1.0,<=5.12.1",
+    "datasets>=3.4.1,!=4.0.*,!=4.1.0,<5.1",
     "sentencepiece>=0.2.0",
     "tqdm",
     "psutil",
@@ -599,7 +599,7 @@ colab-new = [
 ]
 colab-no-deps = [
     "accelerate>=0.34.1",
-    "trl>=0.18.2,!=0.19.0,<=0.24.0",
+    "trl>=0.18.2,!=0.19.0,<=1.6.0",
     "peft>=0.18.0",
     "xformers ; ('linux' in sys_platform or sys_platform == 'win32') and (platform_machine == 'AMD64' or platform_machine == 'x86_64')",
     "bitsandbytes>=0.45.5,!=0.46.0,!=0.48.0",