-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathpyproject.toml
More file actions
63 lines (55 loc) · 1.34 KB
/
pyproject.toml
File metadata and controls
63 lines (55 loc) · 1.34 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
# Core package metadata (PEP 621).
[project]
name = "verifiable-rl-coder"
version = "0.1.0"
description = "RL post-training for small coding LLMs with verifiable execution rewards"
readme = "README.md"
license = { file = "LICENSE" }
# Accepts Python 3.11.x and 3.12.x only; 3.13 and later are excluded.
requires-python = ">=3.11,<3.13"
authors = [
    { name = "Devesh Maheshwari", email = "deveshmaheshwari100@gmail.com" },
]
# Base runtime requirements, installed for every environment.
# Development tools and the GPU / training stack are kept out of this list
# and live in the optional extras instead.
dependencies = [
    "torch>=2.3",
    "transformers>=4.46",
    "datasets>=3.0",
    "evalplus>=0.3.1",
    "docker>=7.1",
    "numpy>=1.26",
    "pyyaml>=6.0",
    "tqdm>=4.66",
]
# Optional extras. Several can be combined in one install, e.g.:
#   pip install -e ".[dev,gpu]"
[project.optional-dependencies]
# Linting, type checking, and test tooling.
dev = [
    "ruff>=0.7",
    "pyright>=1.1.385",
    "pytest>=8.3",
    "pytest-timeout>=2.3",
]
# GPU / training stack. Linux only, because vLLM doesn't ship mac wheels.
gpu = [
    "vllm>=0.6.3",
    "accelerate>=1.0",
    # SFT / RL training stack for weeks 3–4
    "peft>=0.13",
    "trl>=0.12",
    "wandb>=0.18",
]
# Build backend declaration (PEP 517 / PEP 518).
# "wheel" is deliberately not listed in `requires`: the setuptools backend
# asks for it on its own when a wheel build needs it, and listing it here
# would also force it to be installed for sdist-only builds.
[build-system]
requires = ["setuptools>=68"]
build-backend = "setuptools.build_meta"
# Package discovery for setuptools: search for packages under src/ only.
[tool.setuptools.packages.find]
where = ["src"]
# Ruff settings that apply to the whole tool.
[tool.ruff]
line-length = 130
# Same floor as `requires-python` (>=3.11) in [project].
target-version = "py311"
# Directories Ruff uses to recognise first-party imports.
src = ["src", "tests", "scripts"]
# Rule families enabled for linting, one per line.
[tool.ruff.lint]
select = [
    "E",    # pycodestyle errors
    "F",    # Pyflakes
    "I",    # isort (import ordering)
    "B",    # flake8-bugbear
    "UP",   # pyupgrade
    "N",    # pep8-naming
    "SIM",  # flake8-simplify
]
# Rules switched off for specific path globs.
[tool.ruff.lint.per-file-ignores]
# B018: useless expression.
"tests/*" = ["B018"]
# E402: module-level import not at top of file.
"scripts/*" = ["E402"]
# pytest defaults applied to every run.
[tool.pytest.ini_options]
testpaths = ["tests"]
# -q: quieter output. --strict-markers: unregistered markers raise an error.
addopts = "-q --strict-markers"
# Per-test time limit in seconds. This option is provided by the
# pytest-timeout plugin, which is listed in the `dev` extra.
timeout = 60