Skip to content

Commit 2d255a4

Browse files
authored
Merge branch 'main' into zhuzilin/sglang-config-v2
2 parents 5aaf4f3 + 88208ce commit 2d255a4

32 files changed

+590
-1158
lines changed

.github/workflows/bot-slash-lint.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@ jobs:
2323
steps:
2424
- name: React to command comment (ack)
2525
if: always()
26-
uses: actions/github-script@v7
26+
uses: actions/github-script@v8
2727
with:
2828
script: |
2929
const commentId = context.payload.comment.id;
@@ -36,14 +36,14 @@ jobs:
3636
});
3737
3838
- name: Check out Git repository
39-
uses: actions/checkout@v4
39+
uses: actions/checkout@v6
4040
with:
4141
repository: ${{ github.repository }}
4242
ref: refs/pull/${{ github.event.issue.number }}/head
4343
token: ${{ secrets.GITHUB_TOKEN }}
4444

4545
- name: Set up Python
46-
uses: actions/setup-python@v5
46+
uses: actions/setup-python@v6
4747
with:
4848
python-version: '3.10'
4949

@@ -80,7 +80,7 @@ jobs:
8080
runs-on: ubuntu-latest
8181
steps:
8282
- name: Remove initial ack reaction
83-
uses: actions/github-script@v7
83+
uses: actions/github-script@v8
8484
with:
8585
script: |
8686
const commentId = context.payload.comment.id;

.github/workflows/conda-ci.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@ jobs:
2222

2323
steps:
2424
- name: Checkout repository
25-
uses: actions/checkout@v4
25+
uses: actions/checkout@v6
2626

2727
- name: Construct Conda
2828
run: |

.github/workflows/pr-test.yml

Lines changed: 9 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -62,7 +62,7 @@ jobs:
6262

6363
steps:
6464
- name: Checkout repository
65-
uses: actions/checkout@v4
65+
uses: actions/checkout@v6
6666

6767
- name: Install
6868
shell: bash
@@ -109,7 +109,7 @@ jobs:
109109

110110
steps:
111111
- name: Checkout repository
112-
uses: actions/checkout@v4
112+
uses: actions/checkout@v6
113113

114114
- name: Install
115115
shell: bash
@@ -142,7 +142,7 @@ jobs:
142142
strategy:
143143
fail-fast: false
144144
matrix:
145-
info: [{"num_gpus": 8, "test_file": "test_quick_start_glm4_9B.py"}, {"num_gpus": 8, "test_file": "test_qwen3_30B_A3B.py", "use_deepep": "1", "use_fp8_rollout": "1"}, {"enable_eval": "0", "num_gpus": 8, "test_file": "test_qwen3_30B_A3B_r3.py", "use_deepep": "1", "use_fp8_rollout": "1"}, {"enable_eval": "0", "num_gpus": 8, "test_file": "test_qwen3_30B_A3B_r3.py"}, {"num_gpus": 8, "test_file": "test_qwen3_4B_ppo.py"}, {"num_gpus": 8, "test_file": "test_moonlight_16B_A3B.py"}, {"enable_eval": "0", "num_gpus": 8, "test_file": "test_moonlight_16B_A3B_r3.py"}, {"num_gpus": 8, "test_file": "test_mimo_7B_mtp_only_grad.py"}, {"num_gpus": 8, "test_file": "test_qwen2.5_0.5B_debug_rollout_then_train.py"}, {"num_gpus": 8, "test_file": "test_qwen2.5_0.5B_opd_sglang.py"}]
145+
info: [{"num_gpus": 8, "test_file": "test_quick_start_glm4_9B.py"}, {"num_gpus": 8, "test_file": "test_qwen3_30B_A3B.py", "use_deepep": "1", "use_fp8_rollout": "1"}, {"enable_eval": "0", "num_gpus": 8, "test_file": "test_qwen3_30B_A3B_r3.py", "use_deepep": "1", "use_fp8_rollout": "1"}, {"enable_eval": "0", "num_gpus": 8, "test_file": "test_qwen3_30B_A3B_r3.py"}, {"num_gpus": 8, "test_file": "test_qwen3_4B_ppo.py"}, {"num_gpus": 8, "test_file": "test_qwen3_4B_ppo_train_critic_only.py"}, {"num_gpus": 8, "test_file": "test_moonlight_16B_A3B.py"}, {"enable_eval": "0", "num_gpus": 8, "test_file": "test_moonlight_16B_A3B_r3.py"}, {"num_gpus": 8, "test_file": "test_mimo_7B_mtp_only_grad.py"}, {"num_gpus": 8, "test_file": "test_qwen2.5_0.5B_debug_rollout_then_train.py"}, {"num_gpus": 8, "test_file": "test_qwen2.5_0.5B_opd_sglang.py"}]
146146
defaults:
147147
run:
148148
working-directory: ${{ github.workspace }}
@@ -156,7 +156,7 @@ jobs:
156156

157157
steps:
158158
- name: Checkout repository
159-
uses: actions/checkout@v4
159+
uses: actions/checkout@v6
160160

161161
- name: Install
162162
shell: bash
@@ -203,7 +203,7 @@ jobs:
203203

204204
steps:
205205
- name: Checkout repository
206-
uses: actions/checkout@v4
206+
uses: actions/checkout@v6
207207

208208
- name: Install
209209
shell: bash
@@ -250,7 +250,7 @@ jobs:
250250

251251
steps:
252252
- name: Checkout repository
253-
uses: actions/checkout@v4
253+
uses: actions/checkout@v6
254254

255255
- name: Install
256256
shell: bash
@@ -283,7 +283,7 @@ jobs:
283283
strategy:
284284
fail-fast: false
285285
matrix:
286-
info: [{"num_gpus": 4, "test_file": "test_qwen2.5_0.5B_gsm8k_async_short.py"}, {"num_gpus": 4, "test_file": "test_qwen2.5_0.5B_gsm8k_short.py"}, {"num_gpus": 2, "test_file": "test_qwen3_4B_fsdp_true_on_policy.py"}, {"num_gpus": 8, "test_file": "test_qwen3_vl_4B_fsdp.py"}, {"num_gpus": 8, "test_file": "test_quick_start_glm4_9B.py"}, {"num_gpus": 8, "test_file": "test_qwen3_30B_A3B.py"}, {"num_gpus": 8, "test_file": "test_qwen3_4B_ppo.py"}, {"num_gpus": 8, "test_file": "test_moonlight_16B_A3B.py"}, {"num_gpus": 8, "test_file": "test_mimo_7B_mtp_only_grad.py"}, {"num_gpus": 8, "test_file": "test_qwen3_0.6B_parallel_check.py"}, {"num_gpus": 4, "test_file": "test_qwen3_0.6B_megatron_fsdp_align.py"}, {"num_gpus": 8, "test_file": "test_qwen3_4B_ckpt.py"}, {"num_gpus": 8, "test_file": "test_qwen3_4B_ckpt.py --async-save"}, {"num_gpus": 2, "test_file": "test_qwen2.5_0.5B_gsm8k.py"}, {"num_gpus": 2, "test_file": "test_qwen2.5_0.5B_gsm8k_async.py"}, {"num_gpus": 8, "test_file": "test_qwen2.5_0.5B_debug_rollout_then_train.py"}, {"num_gpus": 8, "test_file": "test_qwen2.5_0.5B_opd_sglang.py"}]
286+
info: [{"num_gpus": 4, "test_file": "test_qwen2.5_0.5B_gsm8k_async_short.py"}, {"num_gpus": 4, "test_file": "test_qwen2.5_0.5B_gsm8k_short.py"}, {"num_gpus": 2, "test_file": "test_qwen3_4B_fsdp_true_on_policy.py"}, {"num_gpus": 8, "test_file": "test_qwen3_vl_4B_fsdp.py"}, {"num_gpus": 8, "test_file": "test_quick_start_glm4_9B.py"}, {"num_gpus": 8, "test_file": "test_qwen3_30B_A3B.py"}, {"num_gpus": 8, "test_file": "test_qwen3_4B_ppo.py"}, {"num_gpus": 8, "test_file": "test_moonlight_16B_A3B.py"}, {"num_gpus": 8, "test_file": "test_mimo_7B_mtp_only_grad.py"}, {"num_gpus": 8, "test_file": "test_qwen3_0.6B_parallel_check.py"}, {"num_gpus": 4, "test_file": "test_qwen3_0.6B_megatron_fsdp_align.py"}, {"num_gpus": 8, "test_file": "test_qwen3_4B_ckpt.py"}, {"num_gpus": 8, "test_file": "test_qwen3_4B_ckpt.py --async-save"}, {"num_gpus": 8, "test_file": "test_qwen2.5_0.5B_debug_rollout_then_train.py"}, {"num_gpus": 8, "test_file": "test_qwen2.5_0.5B_opd_sglang.py"}]
287287
defaults:
288288
run:
289289
working-directory: ${{ github.workspace }}
@@ -297,7 +297,7 @@ jobs:
297297

298298
steps:
299299
- name: Checkout repository
300-
uses: actions/checkout@v4
300+
uses: actions/checkout@v6
301301

302302
- name: Install
303303
shell: bash
@@ -395,7 +395,7 @@ jobs:
395395

396396
steps:
397397
- name: Checkout repository
398-
uses: actions/checkout@v4
398+
uses: actions/checkout@v6
399399

400400
- name: Install
401401
shell: bash

.github/workflows/pr-test.yml.j2

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,7 @@
2424
{'test_file': 'test_qwen3_30B_A3B_r3.py', 'num_gpus': 8, 'use_deepep': '1', 'use_fp8_rollout': '1', 'enable_eval': '0'},
2525
{'test_file': 'test_qwen3_30B_A3B_r3.py', 'num_gpus': 8, 'enable_eval': '0'},
2626
{'test_file': 'test_qwen3_4B_ppo.py', 'num_gpus': 8},
27+
{'test_file': 'test_qwen3_4B_ppo_train_critic_only.py', 'num_gpus': 8},
2728
{'test_file': 'test_moonlight_16B_A3B.py', 'num_gpus': 8},
2829
{'test_file': 'test_moonlight_16B_A3B_r3.py', 'num_gpus': 8, 'enable_eval': '0'},
2930
{'test_file': 'test_mimo_7B_mtp_only_grad.py', 'num_gpus': 8},
@@ -63,8 +64,6 @@
6364
{'test_file': 'test_qwen3_0.6B_megatron_fsdp_align.py', 'num_gpus': 4},
6465
{'test_file': 'test_qwen3_4B_ckpt.py', 'num_gpus': 8},
6566
{'test_file': 'test_qwen3_4B_ckpt.py --async-save', 'num_gpus': 8},
66-
{'test_file': 'test_qwen2.5_0.5B_gsm8k.py', 'num_gpus': 2},
67-
{'test_file': 'test_qwen2.5_0.5B_gsm8k_async.py', 'num_gpus': 2},
6867
{'test_file': 'test_qwen2.5_0.5B_debug_rollout_then_train.py', 'num_gpus': 8},
6968
{'test_file': 'test_qwen2.5_0.5B_opd_sglang.py', 'num_gpus': 8},
7069
],

.github/workflows/pre-commit.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -15,12 +15,12 @@ jobs:
1515
runs-on: ubuntu-latest
1616
steps:
1717
- name: Checkout repository
18-
uses: actions/checkout@v4
18+
uses: actions/checkout@v6
1919
with:
2020
fetch-depth: 0
2121

2222
- name: Set up Python
23-
uses: actions/setup-python@v5
23+
uses: actions/setup-python@v6
2424
with:
2525
python-version: '3.10'
2626
cache: 'pip'
@@ -29,7 +29,7 @@ jobs:
2929
run: pip install --upgrade pip pre-commit
3030

3131
- name: Cache pre-commit environments
32-
uses: actions/cache@v4
32+
uses: actions/cache@v5
3333
with:
3434
path: ~/.cache/pre-commit
3535
key: pre-commit-${{ runner.os }}-${{ hashFiles('.pre-commit-config.yaml') }}

.github/workflows/release-docs.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -22,10 +22,10 @@ jobs:
2222
contents: write
2323
steps:
2424
- name: Checkout code
25-
uses: actions/checkout@v4
25+
uses: actions/checkout@v6
2626

2727
- name: Setup Python
28-
uses: actions/setup-python@v5
28+
uses: actions/setup-python@v6
2929
with:
3030
python-version: '3.13'
3131

docker/Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
ARG SGLANG_IMAGE_TAG=nightly-dev-20260107-dce8b060
1+
ARG SGLANG_IMAGE_TAG=v0.5.9
22
FROM slimerl/sglang:${SGLANG_IMAGE_TAG} AS sglang
33

44
# ======================================== Arguments =============================================

0 commit comments

Comments
 (0)