Skip to content

Commit 4240ea7

Browse files
authored
Merge branch 'verl-project:main' into main
2 parents 01d4918 + 5e2f2b2 commit 4240ea7

File tree

8 files changed

+28 additions, -38 deletions (lines changed)

8 files changed

+28 additions, -38 deletions (lines changed)

.github/workflows/e2e_ascend.yml

Lines changed: 4 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -67,21 +67,16 @@ jobs:
6767
llm_rl_job:
6868
if: github.repository_owner == 'verl-project'
6969
name: E2E Ascend testing for RL training scenarios of LLM models
70-
runs-on: linux-aarch64-a2-8
70+
runs-on: linux-aarch64-a2b3-8
7171
timeout-minutes: 120
7272
container:
73-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
73+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
7474
options: >-
7575
--shm-size 16g
7676
env:
7777
HF_ENDPOINT: "https://hf-mirror.com"
7878
HF_HUB_ENABLE_HF_TRANSFER: "0" # This is more stable
7979
steps:
80-
- name: Config third-party dependency download cache
81-
run: |
82-
sed -Ei 's@(ports|archive).ubuntu.com@cache-service.nginx-pypi-cache.svc.cluster.local:8081@g' /etc/apt/sources.list
83-
pip config set global.index-url http://cache-service.nginx-pypi-cache.svc.cluster.local/pypi/simple
84-
pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
8580
- name: Check npu and CANN info
8681
run: |
8782
cat /usr/local/Ascend/ascend-toolkit/latest/"$(uname -i)"-linux/ascend_toolkit_install.info
@@ -132,21 +127,16 @@ jobs:
132127
vlm_rl_job:
133128
if: github.repository_owner == 'verl-project'
134129
name: E2E Ascend testing for RL training scenarios of VLM models
135-
runs-on: linux-aarch64-a2-8
130+
runs-on: linux-aarch64-a2b3-8
136131
timeout-minutes: 120
137132
container:
138-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
133+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
139134
options: >-
140135
--shm-size 16g
141136
env:
142137
HF_ENDPOINT: "https://hf-mirror.com"
143138
HF_HUB_ENABLE_HF_TRANSFER: "0" # This is more stable
144139
steps:
145-
- name: Config third-party dependency download cache
146-
run: |
147-
sed -Ei 's@(ports|archive).ubuntu.com@cache-service.nginx-pypi-cache.svc.cluster.local:8081@g' /etc/apt/sources.list
148-
pip config set global.index-url http://cache-service.nginx-pypi-cache.svc.cluster.local/pypi/simple
149-
pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
150140
- name: Check npu and CANN info
151141
run: |
152142
cat /usr/local/Ascend/ascend-toolkit/latest/"$(uname -i)"-linux/ascend_toolkit_install.info

.github/workflows/e2e_one_step_off_policy_ascend.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -83,10 +83,10 @@ jobs:
8383
# Test FSDP2 strategy
8484
e2e_one_step_off_policy_fsdp2_ascend:
8585
if: github.repository_owner == 'verl-project'
86-
runs-on: linux-aarch64-a2-8
86+
runs-on: linux-aarch64-a2b3-8
8787
timeout-minutes: 60 # Increase this timeout value as needed
8888
container:
89-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
89+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
9090
options: >-
9191
--shm-size 16g
9292
env:
@@ -127,10 +127,10 @@ jobs:
127127
# Test Megatron strategy
128128
e2e_one_step_off_policy_megatron_ascend:
129129
if: github.repository_owner == 'verl-project'
130-
runs-on: linux-aarch64-a2-8
130+
runs-on: linux-aarch64-a2b3-8
131131
timeout-minutes: 60 # Increase this timeout value as needed
132132
container:
133-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
133+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
134134
options: >-
135135
--shm-size 16g
136136
env:

.github/workflows/e2e_ppo_trainer_megatron_vllm_2_ascend.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -89,10 +89,10 @@ permissions:
8989
jobs:
9090
e2e_ppo_trainer_fsdp_vllm_ascend:
9191
if: github.repository_owner == 'verl-project'
92-
runs-on: linux-aarch64-a2-8
92+
runs-on: linux-aarch64-a2b3-8
9393
timeout-minutes: 90 # Increase this timeout value as needed
9494
container:
95-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
95+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
9696
options: >-
9797
--shm-size 16g
9898
env:
@@ -166,10 +166,10 @@ jobs:
166166
167167
e2e_ppo_trainer_fsdp-qwen2_5vl-3b_ascend:
168168
if: github.repository_owner == 'verl-project'
169-
runs-on: linux-aarch64-a2-8
169+
runs-on: linux-aarch64-a2b3-8
170170
timeout-minutes: 60 # Increase this timeout value as needed
171171
container:
172-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
172+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
173173
options: >-
174174
--shm-size 16g
175175
env:

.github/workflows/e2e_sft_llm_ascend.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -71,10 +71,10 @@ permissions:
7171
jobs:
7272
e2e_sft_llm_ascend:
7373
if: github.repository_owner == 'verl-project'
74-
runs-on: linux-aarch64-a2-8
74+
runs-on: linux-aarch64-a2b3-8
7575
timeout-minutes: 90 # Increase this timeout value as needed
7676
container:
77-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
77+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
7878
options: >-
7979
--shm-size 16g
8080
env:

.github/workflows/model_ascend.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -63,10 +63,10 @@ permissions:
6363
jobs:
6464
model_rmpad_ascend:
6565
if: github.repository_owner == 'verl-project'
66-
runs-on: linux-aarch64-a2-8
66+
runs-on: linux-aarch64-a2b3-8
6767
timeout-minutes: 60 # Increase this timeout value as needed
6868
container:
69-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
69+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
7070
options: >-
7171
--shm-size 16g
7272
env:
@@ -112,10 +112,10 @@ jobs:
112112
# NOTE: List as an independent job to make rerun easier.
113113
model_rmpad_fsdp2_unstable_ascend:
114114
if: github.repository_owner == 'verl-project'
115-
runs-on: linux-aarch64-a2-8
115+
runs-on: linux-aarch64-a2b3-8
116116
timeout-minutes: 60
117117
container:
118-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
118+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
119119
options: >-
120120
--shm-size 16g
121121
env:

.github/workflows/nightly_ascend.yml

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -47,10 +47,10 @@ jobs:
4747
# Test ppo qwen3-8b fsdp+vllm
4848
nightlyCI_ppo-qwen3-8b-fsdp-vllm_ascend:
4949
if: github.repository_owner == 'verl-project'
50-
runs-on: linux-aarch64-a2-8
50+
runs-on: linux-aarch64-a2b3-8
5151
timeout-minutes: 180 # Increase this timeout value as needed
5252
container:
53-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
53+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
5454
options: >-
5555
--shm-size 16g
5656
env:
@@ -90,10 +90,10 @@ jobs:
9090
# Test grpo qwen25-7b-Instruct fsdp+vllm
9191
nightlyCI_grpo-qwen25-7b-Instruct-fsdp-vllm_ascend:
9292
if: github.repository_owner == 'verl-project'
93-
runs-on: linux-aarch64-a2-8
93+
runs-on: linux-aarch64-a2b3-8
9494
timeout-minutes: 180 # Increase this timeout value as needed
9595
container:
96-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
96+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
9797
options: >-
9898
--shm-size 16g
9999
env:
@@ -133,10 +133,10 @@ jobs:
133133
# Test grpo qwen25-vl-3b-Instruct fsdp+vllm
134134
nightlyCI_grpo-qwen25-vl-3b-Instruct-fsdp-vllm_ascend:
135135
if: github.repository_owner == 'verl-project'
136-
runs-on: linux-aarch64-a2-8
136+
runs-on: linux-aarch64-a2b3-8
137137
timeout-minutes: 180 # Increase this timeout value as needed
138138
container:
139-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
139+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
140140
options: >-
141141
--shm-size 16g
142142
env:

.github/workflows/npu_unit_tests.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -73,10 +73,10 @@ permissions:
7373
jobs:
7474
npu_unit_tests:
7575
if: github.repository_owner == 'verl-project'
76-
runs-on: linux-aarch64-a2-8
76+
runs-on: linux-aarch64-a2b3-8
7777
timeout-minutes: 60 # Increase this timeout value as needed
7878
container:
79-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
79+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
8080
options: >-
8181
--shm-size 16g
8282
env:

.github/workflows/reward_model_vllm_ascend.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -61,10 +61,10 @@ permissions:
6161
jobs:
6262
reward_model_vllm_ascend:
6363
if: github.repository_owner == 'verl-project'
64-
runs-on: linux-aarch64-a2-8
64+
runs-on: linux-aarch64-a2b3-8
6565
timeout-minutes: 60 # Increase this timeout value as needed
6666
container:
67-
image: swr.ap-southeast-1.myhuaweicloud.com/base_image/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
67+
image: swr.cn-southwest-2.myhuaweicloud.com/modelfoundry/ascend-ci/verl/verl:verl-8.5.0-910b-ubuntu22.04-py3.11-latest
6868
options: >-
6969
--shm-size 16g
7070
env:

0 commit comments

Comments
 (0)