Skip to content

Commit 2418a78

Browse files
[release] bump to v0.2.2 (#1345)
Co-authored-by: lilei <799812479@qq.com>
1 parent d1bf498 commit 2418a78

File tree

6 files changed

33 additions and 15 deletions.

6 files changed

33 additions and 15 deletions.

.github/workflows/pr-test.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -48,7 +48,7 @@ jobs:
4848
strategy:
4949
fail-fast: false
5050
matrix:
51-
info: [{"num_gpus": 4, "test_file": "test_qwen2.5_0.5B_gsm8k_async_short.py"}, {"num_gpus": 4, "test_file": "test_qwen2.5_0.5B_gsm8k_short.py"}, {"num_gpus": 2, "test_file": "test_qwen3_0.6B_fsdp_colocated_2xGPU.py"}]
51+
info: [{"num_gpus": 4, "test_file": "test_qwen2.5_0.5B_gsm8k_async_short.py"}, {"num_gpus": 4, "test_file": "test_qwen2.5_0.5B_gsm8k_short.py"}]
5252
defaults:
5353
run:
5454
working-directory: ${{ github.workspace }}
@@ -95,7 +95,7 @@ jobs:
9595
strategy:
9696
fail-fast: false
9797
matrix:
98-
info: [{"num_gpus": 2, "test_file": "test_qwen3_4B_fsdp_true_on_policy.py"}, {"num_gpus": 8, "test_file": "test_qwen3_vl_4B_fsdp.py"}, {"num_gpus": 2, "test_file": "test_qwen3_0.6B_fsdp_distributed.py"}, {"num_gpus": 4, "test_file": "test_qwen3_0.6B_megatron_fsdp_align.py"}]
98+
info: [{"num_gpus": 4, "test_file": "test_qwen3_4B_fsdp_true_on_policy.py --colocated"}, {"num_gpus": 8, "test_file": "test_qwen3_vl_4B_fsdp.py"}, {"num_gpus": 2, "test_file": "test_qwen3_0.6B_fsdp_distributed.py"}, {"num_gpus": 4, "test_file": "test_qwen3_0.6B_megatron_fsdp_align.py"}]
9999
defaults:
100100
run:
101101
working-directory: ${{ github.workspace }}
@@ -283,7 +283,7 @@ jobs:
283283
strategy:
284284
fail-fast: false
285285
matrix:
286-
info: [{"num_gpus": 2, "test_file": "test_qwen2.5_0.5B_gsm8k.py"}, {"num_gpus": 2, "test_file": "test_qwen2.5_0.5B_gsm8k_async.py"}]
286+
info: [{"num_gpus": 2, "test_file": "test_qwen2.5_0.5B_gsm8k.py"}, {"num_gpus": 2, "test_file": "test_qwen2.5_0.5B_gsm8k_async.py"}, {"num_gpus": 2, "test_file": "test_qwen3_0.6B_fsdp_colocated_2xGPU.py"}, {"num_gpus": 2, "test_file": "test_qwen3_0.6B_fsdp_distributed.py"}]
287287
defaults:
288288
run:
289289
working-directory: ${{ github.workspace }}

.github/workflows/pr-test.yml.j2

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,13 +4,12 @@
44
'tests': [
55
{'test_file': 'test_qwen2.5_0.5B_gsm8k_async_short.py', 'num_gpus': 4},
66
{'test_file': 'test_qwen2.5_0.5B_gsm8k_short.py', 'num_gpus': 4},
7-
{'test_file': 'test_qwen3_0.6B_fsdp_colocated_2xGPU.py', 'num_gpus': 2},
87
],
98
},
109
'e2e-test-fsdp': {
1110
'label': 'run-ci-fsdp',
1211
'tests': [
13-
{'test_file': 'test_qwen3_4B_fsdp_true_on_policy.py', 'num_gpus': 2},
12+
{'test_file': 'test_qwen3_4B_fsdp_true_on_policy.py --colocated', 'num_gpus': 4},
1413
{'test_file': 'test_qwen3_vl_4B_fsdp.py', 'num_gpus': 8},
1514
{'test_file': 'test_qwen3_0.6B_fsdp_distributed.py', 'num_gpus': 2},
1615
{'test_file': 'test_qwen3_0.6B_megatron_fsdp_align.py', 'num_gpus': 4},
@@ -48,6 +47,8 @@
4847
'tests': [
4948
{'test_file': 'test_qwen2.5_0.5B_gsm8k.py', 'num_gpus': 2},
5049
{'test_file': 'test_qwen2.5_0.5B_gsm8k_async.py', 'num_gpus': 2},
50+
{'test_file': 'test_qwen3_0.6B_fsdp_colocated_2xGPU.py', 'num_gpus': 2},
51+
{'test_file': 'test_qwen3_0.6B_fsdp_distributed.py', 'num_gpus': 2},
5152
],
5253
},
5354
'e2e-test-image': {

build_conda.sh

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -74,6 +74,7 @@ fi
7474

7575
# https://github.com/pytorch/pytorch/issues/168167
7676
pip install nvidia-cudnn-cu12==9.16.0.29
77+
pip install "numpy<2"
7778

7879
# apply patch
7980
cd $BASE_DIR/sglang

setup.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@ def get_tag(self):
3232
setup(
3333
author="slime Team",
3434
name="slime",
35-
version="0.2.1",
35+
version="0.2.2",
3636
packages=find_packages(include=["slime*", "slime_plugins*"]),
3737
include_package_data=True,
3838
install_requires=_fetch_requirements("requirements.txt"),

tests/test_qwen3_4B_fsdp_true_on_policy.py

Lines changed: 15 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,15 @@
11
import os
2+
from argparse import ArgumentParser
23
import slime.utils.external_utils.command_utils as U
34

45
ENABLE_EVAL = bool(int(os.environ.get("SLIME_TEST_ENABLE_EVAL", "1")))
5-
NUM_GPUS = 2
6+
NUM_GPUS = 4
67

78
MODEL_NAME = "Qwen3-4B"
89

10+
parser = ArgumentParser()
11+
parser.add_argument("--colocated", action="store_true", help="Whether to run with colocate.")
12+
913

1014
def prepare():
1115
U.exec_command("mkdir -p /root/models /root/datasets")
@@ -14,7 +18,7 @@ def prepare():
1418
U.hf_download_dataset("zhuzilin/aime-2024")
1519

1620

17-
def execute():
21+
def execute(args):
1822
ckpt_args = f"--hf-checkpoint /root/models/{MODEL_NAME} "
1923

2024
rollout_args = (
@@ -29,7 +33,7 @@ def execute():
2933
"--n-samples-per-prompt 8 "
3034
"--rollout-max-response-len 4096 "
3135
"--rollout-temperature 1 "
32-
"--global-batch-size 32 "
36+
"--global-batch-size 64 "
3337
)
3438

3539
eval_args = (
@@ -75,7 +79,12 @@ def execute():
7579

7680
ci_args = "--ci-test "
7781

78-
misc_args = "--actor-num-nodes 1 " f"--actor-num-gpus-per-node {NUM_GPUS} " "--colocate "
82+
if args.colocated:
83+
misc_args = f"--actor-num-nodes 1 --actor-num-gpus-per-node {NUM_GPUS} --colocate "
84+
else:
85+
misc_args = (
86+
f"--actor-num-nodes 1 --actor-num-gpus-per-node {NUM_GPUS // 2} --rollout-num-gpus {NUM_GPUS // 2} "
87+
)
7988

8089
train_args = (
8190
f"{ckpt_args} "
@@ -106,7 +115,8 @@ def execute():
106115

107116

108117
if __name__ == "__main__":
118+
args = parser.parse_args()
109119
prepare()
110120
for proxy_var in ("http_proxy", "https_proxy", "HTTP_PROXY", "HTTPS_PROXY"):
111121
os.environ.pop(proxy_var, None)
112-
execute()
122+
execute(args)

tests/test_qwen3_vl_4B_fsdp.py

Lines changed: 10 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -68,8 +68,13 @@ def execute():
6868
"--sglang-mem-fraction-static 0.6 "
6969
"--sglang-decode-log-interval 1000 "
7070
"--sglang-enable-metrics "
71+
# "--sglang-enable-deterministic-inference "
72+
# "--sglang-rl-on-policy-target fsdp "
7173
"--sglang-attention-backend fa3 "
7274
"--attn-implementation flash_attention_3 "
75+
"--sglang-cuda-graph-bs 1 2 4 8 16 24 32 40 48 56 64 "
76+
# "--deterministic-mode "
77+
# "--true-on-policy-mode "
7378
)
7479

7580
ci_args = "--ci-test "
@@ -91,6 +96,9 @@ def execute():
9196
)
9297

9398
extra_env_vars = {
99+
# "NCCL_ALGO": "allreduce:tree",
100+
# "NVTE_ALLOW_NONDETERMINISTIC_ALGO": "0",
101+
# "CUBLAS_WORKSPACE_CONFIG": ":4096:8",
94102
"CUDA_DEVICE_MAX_CONNECTIONS": "1",
95103
}
96104

@@ -104,8 +112,6 @@ def execute():
104112

105113
if __name__ == "__main__":
106114
prepare()
107-
os.environ.pop("http_proxy", None)
108-
os.environ.pop("https_proxy", None)
109-
os.environ.pop("HTTP_PROXY", None)
110-
os.environ.pop("HTTPS_PROXY", None)
115+
for proxy_var in ("http_proxy", "https_proxy", "HTTP_PROXY", "HTTPS_PROXY"):
116+
os.environ.pop(proxy_var, None)
111117
execute()

0 commit comments

Comments
 (0)