AniketAsla committed on
Commit
16966ba
·
verified ·
1 Parent(s): 37ec93d

deploy: update train/requirements.txt

Browse files
Files changed (1) hide show
  1. train/requirements.txt +49 -49
train/requirements.txt CHANGED
@@ -1,49 +1,49 @@
1
- # Training deps for DebateFloor GRPO on HF Jobs.
2
- # Tested image: pytorch/pytorch:2.4.0-cuda12.1-cudnn9-runtime
3
- # (PyTorch 2.4.0, torchvision 0.19.0, CUDA 12.1, Python 3.11)
4
-
5
- # Core RL trainer.
6
- # - GRPO was added in trl 0.13 (Jan 2025) and the GRPOConfig API used in
7
- # train/train_minimal.py (processing_class, reward_funcs, num_generations,
8
- # max_completion_length, max_prompt_length) stabilized in 0.15.
9
- # - Cap below 0.20 to keep transformers requirement at 4.48 (avoids needing
10
- # torch>=2.5 which the base image doesn't have).
11
- trl>=0.15.0,<0.18.0
12
-
13
- # transformers must be < 4.48 — that's the version where loss_deformable_detr.py
14
- # was added, which unconditionally imports image_transforms -> torchvision at
15
- # module load time. Even purging torchvision can't avoid this if transformers
16
- # tries to import it during _LazyModule resolution.
17
- # trl 0.15.2 accepts transformers >= 4.46, so 4.46 / 4.47 are both valid.
18
- transformers>=4.46.0,<4.48.0
19
-
20
- # Note: torchvision is INTENTIONALLY not pinned. The HF Jobs base image ships
21
- # torch 2.11.0+cu130 (not 2.4.0 as the tag suggests), and ABI-matching
22
- # torchvision wheels for cu130 are not always available. Since DebateFloor is
23
- # text-only and never uses image transforms, jobs_run.py uninstalls torchvision
24
- # entirely after pip install — transformers will then skip the broken
25
- # `image_utils → torchvision::nms` import path.
26
-
27
- # Model + LoRA.
28
- peft>=0.13.0
29
- accelerate>=1.0.0,<2.0.0
30
- datasets>=2.19.0
31
-
32
- # bitsandbytes prebuilt wheel for CUDA 12.x.
33
- bitsandbytes>=0.43.0
34
-
35
- # Logging / IO
36
- wandb>=0.17.0
37
- requests>=2.32.0
38
- matplotlib>=3.8.0
39
-
40
- # Env server (uvicorn + FastAPI come from root requirements.txt; we just need
41
- # the openenv-core import path because train_minimal.py loads
42
- # server.calibration_grader + server.claim_generator).
43
- uvicorn>=0.30.0
44
- openenv-core>=0.2.3
45
-
46
- # Unsloth 4-bit QLoRA (MR-3 hackathon constraint).
47
- # unsloth-zoo is the runtime backend; pinning a recent stable version known to
48
- # work with torch 2.4.
49
- unsloth>=2024.10
 
1
+ # Training deps for DebateFloor GRPO on HF Jobs.
2
+ # Tested image: pytorch/pytorch:2.4.0-cuda12.1-cudnn9-runtime
3
+ # (PyTorch 2.4.0, torchvision 0.19.0, CUDA 12.1, Python 3.11)
4
+
5
+ # Core RL trainer.
6
+ # - GRPO was added in trl 0.13 (Jan 2025) and the GRPOConfig API used in
7
+ # train/train_minimal.py (processing_class, reward_funcs, num_generations,
8
+ # max_completion_length, max_prompt_length) stabilized in 0.15.
9
+ # - Cap below 0.18 to keep transformers requirement at 4.48 (avoids needing
10
+ # torch>=2.5 which the base image doesn't have).
11
+ trl>=0.15.0,<0.18.0
12
+
13
+ # transformers must be < 4.48 — that's the version where loss_deformable_detr.py
14
+ # was added, which unconditionally imports image_transforms -> torchvision at
15
+ # module load time. Even purging torchvision can't avoid this if transformers
16
+ # tries to import it during _LazyModule resolution.
17
+ # trl 0.15.2 accepts transformers >= 4.46, so 4.46 / 4.47 are both valid.
18
+ transformers>=4.46.0,<4.48.0
19
+
20
+ # Note: torchvision is INTENTIONALLY not pinned. The HF Jobs base image ships
21
+ # torch 2.11.0+cu130 (not 2.4.0 as the tag suggests), and ABI-matching
22
+ # torchvision wheels for cu130 are not always available. Since DebateFloor is
23
+ # text-only and never uses image transforms, jobs_run.py uninstalls torchvision
24
+ # entirely after pip install — transformers will then skip the broken
25
+ # `image_utils → torchvision::nms` import path.
26
+
27
+ # Model + LoRA.
28
+ peft>=0.13.0
29
+ accelerate>=1.0.0,<2.0.0
30
+ datasets>=2.19.0
31
+
32
+ # bitsandbytes prebuilt wheel for CUDA 12.x.
33
+ bitsandbytes>=0.43.0
34
+
35
+ # Logging / IO
36
+ wandb>=0.17.0
37
+ requests>=2.32.0
38
+ matplotlib>=3.8.0
39
+
40
+ # Env server (uvicorn + FastAPI come from root requirements.txt; we just need
41
+ # the openenv-core import path because train_minimal.py loads
42
+ # server.calibration_grader + server.claim_generator).
43
+ uvicorn>=0.30.0
44
+ openenv-core>=0.2.3
45
+
46
+ # Unsloth 4-bit QLoRA (MR-3 hackathon constraint).
47
+ # unsloth-zoo is the runtime backend; the lower bound below is a recent stable
48
+ # version known to work with torch 2.4.
49
+ unsloth>=2024.10