|
7 | 7 | hal.executable @warp_reduction_dispatch { |
8 | 8 | hal.executable.variant @cuda target(<"cuda", "cuda-nvptx-fb">) { |
9 | 9 | hal.executable.export public @warp_reduction_dispatch layout(#pipeline_layout) count(%arg0: !hal.device, %arg1: index, %arg2 : index) -> (index, index, index) { |
10 | | - %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_dag_root(%arg1, %arg2) |
| 10 | + %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_slice(%arg1, %arg2) |
11 | 11 | hal.return %x, %y, %z : index, index, index |
12 | 12 | } |
13 | 13 | builtin.module { |
@@ -61,7 +61,7 @@ hal.executable.variant @cuda target(<"cuda", "cuda-nvptx-fb">) { |
61 | 61 | hal.executable @warp_reduction_broadcast_dispatch { |
62 | 62 | hal.executable.variant @cuda target(<"cuda", "cuda-nvptx-fb">) { |
63 | 63 | hal.executable.export public @warp_reduction_broadcast_dispatch layout(#pipeline_layout) count(%arg0: !hal.device, %arg1: index, %arg2 : index) -> (index, index, index) { |
64 | | - %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_dag_root(%arg1, %arg2) |
| 64 | + %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_slice(%arg1, %arg2) |
65 | 65 | hal.return %x, %y, %z : index, index, index |
66 | 66 | } |
67 | 67 | builtin.module { |
@@ -121,7 +121,7 @@ hal.executable.variant @cuda target(<"cuda", "cuda-nvptx-fb">) { |
121 | 121 | hal.executable @softmax { |
122 | 122 | hal.executable.variant @cuda target(<"cuda", "cuda-nvptx-fb">) { |
123 | 123 | hal.executable.export public @softmax layout(#pipeline_layout) count(%arg0: !hal.device, %arg1: index, %arg2 : index) -> (index, index, index) { |
124 | | - %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_dag_root(%arg1, %arg2) |
| 124 | + %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_slice(%arg1, %arg2) |
125 | 125 | hal.return %x, %y, %z : index, index, index |
126 | 126 | } |
127 | 127 | builtin.module { |
@@ -178,7 +178,7 @@ hal.executable.variant @cuda target(<"cuda", "cuda-nvptx-fb">) { |
178 | 178 | hal.executable @softmax_singlesubgroup { |
179 | 179 | hal.executable.variant @cuda target(<"cuda", "cuda-nvptx-fb">) { |
180 | 180 | hal.executable.export public @softmax_singlesubgroup layout(#pipeline_layout) count(%arg0: !hal.device, %arg1: index, %arg2 : index) -> (index, index, index) { |
181 | | - %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_dag_root(%arg1, %arg2) |
| 181 | + %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_slice(%arg1, %arg2) |
182 | 182 | hal.return %x, %y, %z : index, index, index |
183 | 183 | } |
184 | 184 | builtin.module { |
@@ -233,7 +233,7 @@ hal.executable.variant @cuda target(<"cuda", "cuda-nvptx-fb">) { |
233 | 233 | hal.executable @small_reduction { |
234 | 234 | hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
235 | 235 | hal.executable.export public @small_reduction ordinal(0) layout(#pipeline_layout) count(%arg0: !hal.device, %arg1: index, %arg2: index) -> (index, index, index) { |
236 | | - %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_dag_root(%arg1, %arg2) |
| 236 | + %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_slice(%arg1, %arg2) |
237 | 237 | hal.return %x, %y, %z : index, index, index |
238 | 238 | } |
239 | 239 | builtin.module { |
@@ -271,7 +271,7 @@ hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
271 | 271 | hal.executable @group_reduction { |
272 | 272 | hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
273 | 273 | hal.executable.export public @group_reduction ordinal(0) layout(#pipeline_layout) count(%arg0: !hal.device, %arg1: index, %arg2: index) -> (index, index, index) { |
274 | | - %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_dag_root(%arg1, %arg2) |
| 274 | + %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_slice(%arg1, %arg2) |
275 | 275 | hal.return %x, %y, %z : index, index, index |
276 | 276 | } |
277 | 277 | builtin.module { |
@@ -307,7 +307,7 @@ hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
307 | 307 | hal.executable @group_elementwise_reduction_elementwise { |
308 | 308 | hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
309 | 309 | hal.executable.export public @group_elementwise_reduction_elementwise ordinal(0) layout(#pipeline_layout) count(%arg0: !hal.device, %arg1: index) -> (index, index, index) { |
310 | | - %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_dag_root(%arg1) |
| 310 | + %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_slice(%arg1) |
311 | 311 | hal.return %x, %y, %z : index, index, index |
312 | 312 | } |
313 | 313 | builtin.module { |
@@ -350,7 +350,7 @@ hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
350 | 350 | hal.executable @group_reduction_larger { |
351 | 351 | hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
352 | 352 | hal.executable.export public @group_reduction_larger ordinal(0) layout(#pipeline_layout) count(%arg0: !hal.device, %arg1: index, %arg2: index) -> (index, index, index) { |
353 | | - %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_dag_root(%arg1, %arg2) |
| 353 | + %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_slice(%arg1, %arg2) |
354 | 354 | hal.return %x, %y, %z : index, index, index |
355 | 355 | } |
356 | 356 | builtin.module { |
@@ -387,7 +387,7 @@ hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
387 | 387 | hal.executable @group_reduction_1d { |
388 | 388 | hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
389 | 389 | hal.executable.export public @group_reduction_1d ordinal(0) layout(#pipeline_layout) count(%arg0: !hal.device, %arg1: index, %arg2: index) -> (index, index, index) { |
390 | | - %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_dag_root(%arg1, %arg2) |
| 390 | + %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_slice(%arg1, %arg2) |
391 | 391 | hal.return %x, %y, %z : index, index, index |
392 | 392 | } |
393 | 393 | builtin.module { |
@@ -423,7 +423,7 @@ hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
423 | 423 | hal.executable @group_elementwise_reduction_elementwise_4d { |
424 | 424 | hal.executable.variant public @cuda_nvptx_fb target(<"cuda", "cuda-nvptx-fb">) { |
425 | 425 | hal.executable.export public @group_elementwise_reduction_elementwise_4d ordinal(0) layout(#pipeline_layout) count(%arg0: !hal.device, %arg1: index, %arg2: index, %arg3: index) -> (index, index, index) { |
426 | | - %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_dag_root(%arg1, %arg2, %arg3) |
| 426 | + %x, %y, %z = iree_tensor_ext.dispatch.workgroup_count_from_slice(%arg1, %arg2, %arg3) |
427 | 427 | hal.return %x, %y, %z : index, index, index |
428 | 428 | } |
429 | 429 | builtin.module { |
|
0 commit comments