# pyproject.toml — prime-rl (forked from PrimeIntellect-ai/prime-rl)
# Core package metadata (PEP 621).
[project]
name = "prime-rl"
version = "0.1.0"
description = ""
readme = "README.md"
# Compatible-release specifier: any 3.12.x interpreter, but not 3.13+.
requires-python = "~=3.12.0"
# Runtime dependencies, one PEP 508 requirement per line, sorted by name.
dependencies = [
    "beartype>=0.21.0",
    "cydifflib>=1.2.0",
    "datasets>=3.6.0",
    "google-cloud-storage>=3.1.1", # TODO: Delete after refactor
    "jaxtyping>=0.3.2",
    "liger-kernel>=0.5.10",
    "loguru>=0.7.3",
    "lovely-tensors>=0.1.18",
    "math-verify>=0.8.0",
    "muon_fsdp2>=0.3.0",
    "nltk>=3.9.1",
    "numpy>=2.2.6",
    "openai>=1.90.0",
    # pydantic-settings 2.x is built on pydantic v2, so a 1.x floor could never
    # be selected by the resolver; declare the v2 floor explicitly.
    "pydantic>=2.7.0",
    "pydantic-settings>=2.10.1",
    "pylatexenc>=2.10",
    "pynvml>=12.0.0",
    "rich>=14.0.0",
    "textarena>=0.6.16",
    "tomli>=2.2.1",
    # NOTE(review): the only requirement without a lower bound — confirm intended.
    "tomli-w",
    "torch>=2.7.0",
    "torchdata>=0.11.0",
    "transformers>=4.53.0",
    "uvloop>=0.21.0",
    "verifiers>=0.1.3",
    # Exact pin, unlike the other requirements which only set a lower bound.
    "vllm==0.10.0",
    "wandb>=0.20.1",
]
# Console commands installed with the package; each value is the
# "module.path:callable" that the command invokes.
[project.scripts]
eval = "prime_rl.eval.eval:main"
inference = "prime_rl.inference.server:main"
orchestrator = "prime_rl.orchestrator.orchestrator:main"
rl = "prime_rl.rl:main"
sft = "prime_rl.trainer.sft.train:main"
trainer = "prime_rl.trainer.rl.train:main"
# Build backend declaration (PEP 517/518): the package is built with hatchling.
[build-system]
requires = ["hatchling"]
build-backend = "hatchling.build"
# Optional extras, installable as `prime-rl[<extra>]`.
[project.optional-dependencies]
flash-attn = ["flash-attn>=2.8.0"]
# The lower bound here is a release candidate (see `prerelease` under [tool.uv]).
flash-infer = ["flashinfer-python>=0.2.8rc1"]
# Every package in this extra is pinned to the "primeintellect" index in
# [tool.uv.sources].
vf = [
    "alphabet-sort>=0.1.5",
    "ascii-tree>=0.1.6",
    "pydantic-adherence>=0.1.3",
    "reverse-text>=0.1.4",
    "unscramble>=0.1.3",
    "skywork-math>=0.1.6",
    "deepscaler-math>=0.1.4",
    "acereason-math>=0.1.4",
    "hendrycks-math>=0.1.4",
    "intellect-math>=0.1.4",
    "aime2024>=0.1.9",
    "aime2025>=0.1.9",
    "math500>=0.1.9",
]
# uv resolver/installer settings.
[tool.uv]
# flash-attn is built without build isolation, i.e. against the packages
# already present in the environment.
no-build-isolation-package = ["flash-attn"]
# Lets the resolver pick pre-release versions. Presumably needed because the
# flash-infer extra's lower bound is an rc (0.2.8rc1) — TODO confirm.
prerelease = "allow"
# Per-package index pinning. Index names refer to the [[tool.uv.index]]
# entries declared in this file.
[tool.uv.sources]
# torch is taken from the "pytorch-cu128" index.
torch = [{ index = "pytorch-cu128" }]
# The packages below are the members of the `vf` extra; all are taken from
# the "primeintellect" index.
alphabet-sort = { index = "primeintellect" }
ascii-tree = { index = "primeintellect" }
pydantic-adherence = { index = "primeintellect" }
reverse-text = { index = "primeintellect" }
unscramble = { index = "primeintellect" }
skywork-math = { index = "primeintellect" }
deepscaler-math = { index = "primeintellect" }
acereason-math = { index = "primeintellect" }
hendrycks-math = { index = "primeintellect" }
intellect-math = { index = "primeintellect" }
aime2024 = { index = "primeintellect" }
aime2025 = { index = "primeintellect" }
math500 = { index = "primeintellect" }
# Additional package indexes referenced from [tool.uv.sources].
[[tool.uv.index]]
name = "pytorch-cu128"
# NOTE(review): the URL points at the `/whl/test/` path rather than `/whl/`;
# this looks like PyTorch's pre-release channel — confirm it is still required.
url = "https://download.pytorch.org/whl/test/cu128"
# explicit: only packages that name this index in [tool.uv.sources] use it.
explicit = true
[[tool.uv.index]]
name = "primeintellect"
url = "https://hub.primeintellect.ai/primeintellect/simple"
# NOTE(review): unlike "pytorch-cu128", this index is not marked
# `explicit = true`, so uv may consult it for packages that are not pinned to
# it in [tool.uv.sources] — confirm this is intended.
# Development-only dependency groups (PEP 735); not part of the published
# package metadata.
[dependency-groups]
dev = [
    "ipykernel>=6.29.5",
    "ipywidgets>=8.1.7",
    "pre-commit>=4.2.0",
    "pytest>=8.4.1",
    "ruff>=0.12.1",
]
# Ruff configuration: parent table first, then its lint sub-table.
[tool.ruff]
line-length = 120
[tool.ruff.lint]
# Enabled rule families: "F" and "I".
select = ["F", "I"]
ignore = ["F722", "F821"] # Need to ignore for jaxtyping (https://docs.kidger.site/jaxtyping/faq/)
# pytest configuration.
[tool.pytest.ini_options]
# With --strict-markers, using a marker that is not registered below is an error.
addopts = "--strict-markers"
# Registered custom markers, in "name: description" form.
markers = [
    "slow: marks tests as slow (deselect with '-m \"not slow\"')",
    "gpu: marks tests as gpu (deselect with '-m \"not gpu\"')",
]