|
12 | 12 | # See the License for the specific language governing permissions and |
13 | 13 | # limitations under the License. |
14 | 14 |
|
15 | | -name: test-gang-scheduling-runai |
| 15 | +name: test-gang-scheduling-lw |
16 | 16 | tasks: |
17 | | -- id: register-trainingworkload |
18 | | - type: RegisterObj |
19 | | - params: |
20 | | - template: "resources/benchmarks/templates/runai/trainingworkload.yaml" |
21 | | - nameFormat: "twl{{._ENUM_}}" |
22 | | - podNameFormat: "{{._NAME_}}-0-0" |
23 | | - podCount: 1 |
24 | | -- id: register-distributedworkload |
25 | | - type: RegisterObj |
26 | | - params: |
27 | | - template: "resources/benchmarks/templates/runai/distributedworkload.yaml" |
28 | | - nameFormat: "dwl{{._ENUM_}}" |
29 | | - podNameFormat: "{{._NAME_}}-(launcher-[a-z0-9]+|worker-[0-9]+)" |
30 | | - podCount: "{{.workers}} + 1" |
31 | | -# |
32 | | -### Benchmark test |
33 | | -# |
34 | 17 | - id: job1 |
35 | 18 | type: SubmitObj |
36 | 19 | params: |
37 | | - refTaskId: register-distributedworkload |
| 20 | + refTaskId: register-lw |
38 | 21 | count: 1 |
39 | 22 | params: |
40 | 23 | workers: 31 |
41 | 24 | ttl: 2m |
42 | 25 | - id: job2 |
43 | 26 | type: SubmitObj |
44 | 27 | params: |
45 | | - refTaskId: register-distributedworkload |
| 28 | + refTaskId: register-lw |
46 | 29 | count: 2 |
47 | 30 | params: |
48 | 31 | workers: 15 |
49 | 32 | ttl: 2m |
50 | 33 | - id: job3 |
51 | 34 | type: SubmitObj |
52 | 35 | params: |
53 | | - refTaskId: register-distributedworkload |
| 36 | + refTaskId: register-lw |
54 | 37 | count: 3 |
55 | 38 | params: |
56 | 39 | workers: 9 |
57 | 40 | ttl: 2m |
58 | 41 | - id: job3.1 |
59 | 42 | type: SubmitObj |
60 | 43 | params: |
61 | | - refTaskId: register-distributedworkload |
| 44 | + refTaskId: register-lw |
62 | 45 | count: 1 |
63 | 46 | params: |
64 | 47 | workers: 1 |
65 | 48 | ttl: 2m |
66 | 49 | - id: job4 |
67 | 50 | type: SubmitObj |
68 | 51 | params: |
69 | | - refTaskId: register-distributedworkload |
| 52 | + refTaskId: register-lw |
70 | 53 | count: 4 |
71 | 54 | params: |
72 | 55 | workers: 7 |
73 | 56 | ttl: 2m |
74 | 57 | - id: job5 |
75 | 58 | type: SubmitObj |
76 | 59 | params: |
77 | | - refTaskId: register-distributedworkload |
| 60 | + refTaskId: register-lw |
78 | 61 | count: 5 |
79 | 62 | params: |
80 | 63 | workers: 5 |
81 | 64 | ttl: 2m |
82 | 65 | - id: job5.1 |
83 | 66 | type: SubmitObj |
84 | 67 | params: |
85 | | - refTaskId: register-trainingworkload |
| 68 | + refTaskId: register |
86 | 69 | count: 2 |
87 | 70 | params: |
| 71 | + replicas: 1 |
88 | 72 | ttl: 2m |
89 | 73 | - id: job6 |
90 | 74 | type: SubmitObj |
91 | 75 | params: |
92 | | - refTaskId: register-distributedworkload |
| 76 | + refTaskId: register-lw |
93 | 77 | count: 6 |
94 | 78 | params: |
95 | 79 | workers: 4 |
96 | 80 | ttl: 2m |
97 | 81 | - id: job6.1 |
98 | 82 | type: SubmitObj |
99 | 83 | params: |
100 | | - refTaskId: register-distributedworkload |
| 84 | + refTaskId: register-lw |
101 | 85 | count: 1 |
102 | 86 | params: |
103 | 87 | workers: 1 |
104 | 88 | ttl: 2m |
105 | 89 | - id: job7 |
106 | 90 | type: SubmitObj |
107 | 91 | params: |
108 | | - refTaskId: register-distributedworkload |
| 92 | + refTaskId: register-lw |
109 | 93 | count: 7 |
110 | 94 | params: |
111 | 95 | workers: 3 |
112 | 96 | ttl: 2m |
113 | 97 | - id: job7.1 |
114 | 98 | type: SubmitObj |
115 | 99 | params: |
116 | | - refTaskId: register-distributedworkload |
| 100 | + refTaskId: register-lw |
117 | 101 | count: 1 |
118 | 102 | params: |
119 | 103 | workers: 1 |
120 | 104 | ttl: 2m |
121 | 105 | - id: job7.2 |
122 | 106 | type: SubmitObj |
123 | 107 | params: |
124 | | - refTaskId: register-trainingworkload |
| 108 | + refTaskId: register |
125 | 109 | count: 2 |
126 | 110 | params: |
| 111 | + replicas: 1 |
127 | 112 | ttl: 2m |
128 | 113 | - id: job8 |
129 | 114 | type: SubmitObj |
130 | 115 | params: |
131 | | - refTaskId: register-distributedworkload |
| 116 | + refTaskId: register-lw |
132 | 117 | count: 8 |
133 | 118 | params: |
134 | 119 | workers: 3 |
135 | 120 | ttl: 2m |
136 | 121 | - id: job9 |
137 | 122 | type: SubmitObj |
138 | 123 | params: |
139 | | - refTaskId: register-distributedworkload |
| 124 | + refTaskId: register-lw |
140 | 125 | count: 9 |
141 | 126 | params: |
142 | 127 | workers: 2 |
143 | 128 | ttl: 2m |
144 | 129 | - id: job9.1 |
145 | 130 | type: SubmitObj |
146 | 131 | params: |
147 | | - refTaskId: register-distributedworkload |
| 132 | + refTaskId: register-lw |
148 | 133 | count: 1 |
149 | 134 | params: |
150 | 135 | workers: 4 |
|
0 commit comments