File tree
9 files changed
+117
-40
lines changed- csrc
- flash_attn/src
9 files changed
+117
-40
lines changedLines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
33 | 33 |
| |
34 | 34 |
| |
35 | 35 |
| |
36 |
| - | |
| 36 | + | |
37 | 37 |
| |
38 | 38 |
| |
39 | 39 |
| |
|
- CHANGELOG.md+7-2
- CMakeLists.txt+24-3
- PUBLICATIONS.md+7
- README.md+9-4
- cmake/version.h.in-38
- cmake/version_extended.h.in+34
- examples/02_dump_reg_shmem/CMakeLists.txt+1
- examples/08_turing_tensorop_gemm/turing_tensorop_gemm.cu+2-2
- examples/56_hopper_ptr_array_batched_gemm/56_hopper_ptr_array_batched_gemm.cu+7-7
- examples/56_hopper_ptr_array_batched_gemm/CMakeLists.txt+10-8
- examples/57_hopper_grouped_gemm/57_hopper_grouped_gemm.cu+96-49
- examples/57_hopper_grouped_gemm/CMakeLists.txt+10
- include/cute/arch/copy_sm90_desc.hpp+1-1
- include/cute/atom/mma_atom.hpp+2
- include/cute/util/print.hpp+2-2
- include/cute/util/type_traits.hpp+3
- include/cutlass/arch/mma_sm90.h+4
- include/cutlass/bfloat16.h+1
- include/cutlass/detail/layout.hpp+35-1
- include/cutlass/epilogue/collective/builders/sm90_builder.inl+12-7
- include/cutlass/epilogue/collective/default_epilogue.hpp+1
- include/cutlass/epilogue/collective/default_epilogue_array.hpp+32-18
- include/cutlass/epilogue/collective/sm90_epilogue_tma_warpspecialized.hpp+76-38
- include/cutlass/epilogue/dispatch_policy.hpp+1-2
- include/cutlass/epilogue/fusion/sm90_callbacks_tma_warpspecialized.hpp+28
- include/cutlass/epilogue/fusion/sm90_visitor_store_tma_warpspecialized.hpp+1
- include/cutlass/epilogue/thread/linear_combination.h+57-12
- include/cutlass/epilogue/threadblock/default_epilogue_tensor_op_row_broadcast.h-183
- include/cutlass/epilogue/threadblock/predicated_tile_iterator_row_broadcast.h-519
- include/cutlass/gemm/collective/builders/sm90_gmma_builder.inl+4-8
- include/cutlass/gemm/collective/sm90_mma_array_tma_gmma_ss_warpspecialized.hpp+45-29
- include/cutlass/gemm/device/gemm_sparse_row_broadcast.h-514
- include/cutlass/gemm/dispatch_policy.hpp+4-7
- include/cutlass/gemm/group_array_problem_shape.hpp+12
- include/cutlass/gemm/kernel/default_gemm_sparse_row_broadcast.h-191
- include/cutlass/gemm/kernel/sm90_gemm_array_tma_warpspecialized_cooperative.hpp+30-35
- include/cutlass/gemm/kernel/sm90_gemm_tma.hpp+5-7
- include/cutlass/gemm/kernel/sm90_gemm_tma_warpspecialized.hpp+5-7
- include/cutlass/gemm/kernel/sm90_gemm_tma_warpspecialized_cooperative.hpp+5-7
- include/cutlass/gemm/kernel/sm90_gemm_tma_warpspecialized_pingpong.hpp+5-7
- include/cutlass/gemm/kernel/sm90_gemm_warpspecialized.hpp+5-7
- include/cutlass/gemm/kernel/sm90_gemm_warpspecialized_cooperative.hpp+5-7
- include/cutlass/gemm/kernel/sm90_gemm_warpspecialized_pingpong.hpp+5-7
- include/cutlass/gemm/kernel/sm90_tile_scheduler_group.hpp+140-86
- include/cutlass/gemm/kernel/sparse_gemm_row_broadcast.h-400
- include/cutlass/gemm/kernel/tile_scheduler_params.h+14-6
- include/cutlass/version.h+80
- pyproject.toml+2-2
- python/cutlass/__init__.py+3-3
- python/cutlass/backend/c_types.py+6-2
- python/cutlass/backend/epilogue.py+23-1
- python/cutlass/backend/evt/frontend/frontend_base.py+2-2
- python/cutlass/backend/evt/passes/graph_drawer.py-16
- python/cutlass/backend/gemm_operation.py+28-18
- python/setup_library.py+1-1
- python/setup_pycute.py+1-1
- test/unit/gemm/device/CMakeLists.txt+1
- test/unit/gemm/device/gemm_f16n_f16n_f16t_tensor_op_f32_sparse_sm80.cu-19
- test/unit/gemm/device/sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_warpspecialized_cooperative_aux_store.cu+685
- test/unit/gemm/device/testbed_sparse.h+7-20
- tools/util/include/cutlass/util/packed_stride.hpp+1-1
Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
521 | 521 |
| |
522 | 522 |
| |
523 | 523 |
| |
524 |
| - | |
| 524 | + | |
525 | 525 |
| |
526 | 526 |
| |
527 | 527 |
| |
|
Lines changed: 18 additions & 12 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
70 | 70 |
| |
71 | 71 |
| |
72 | 72 |
| |
73 |
| - | |
74 |
| - | |
75 |
| - | |
| 73 | + | |
| 74 | + | |
| 75 | + | |
76 | 76 |
| |
77 | 77 |
| |
78 | 78 |
| |
| |||
101 | 101 |
| |
102 | 102 |
| |
103 | 103 |
| |
| 104 | + | |
104 | 105 |
| |
| 106 | + | |
105 | 107 |
| |
106 | 108 |
| |
107 | 109 |
| |
| |||
115 | 117 |
| |
116 | 118 |
| |
117 | 119 |
| |
118 |
| - | |
| 120 | + | |
119 | 121 |
| |
120 | 122 |
| |
121 | 123 |
| |
| |||
140 | 142 |
| |
141 | 143 |
| |
142 | 144 |
| |
143 |
| - | |
| 145 | + | |
144 | 146 |
| |
145 | 147 |
| |
146 | 148 |
| |
| |||
185 | 187 |
| |
186 | 188 |
| |
187 | 189 |
| |
188 |
| - | |
| 190 | + | |
189 | 191 |
| |
190 | 192 |
| |
191 | 193 |
| |
| |||
211 | 213 |
| |
212 | 214 |
| |
213 | 215 |
| |
214 |
| - | |
| 216 | + | |
215 | 217 |
| |
216 | 218 |
| |
217 | 219 |
| |
| |||
244 | 246 |
| |
245 | 247 |
| |
246 | 248 |
| |
247 |
| - | |
| 249 | + | |
248 | 250 |
| |
249 | 251 |
| |
250 | 252 |
| |
| |||
264 | 266 |
| |
265 | 267 |
| |
266 | 268 |
| |
267 |
| - | |
| 269 | + | |
268 | 270 |
| |
269 | 271 |
| |
270 | 272 |
| |
| |||
276 | 278 |
| |
277 | 279 |
| |
278 | 280 |
| |
279 |
| - | |
| 281 | + | |
280 | 282 |
| |
281 | 283 |
| |
282 | 284 |
| |
| |||
292 | 294 |
| |
293 | 295 |
| |
294 | 296 |
| |
295 |
| - | |
| 297 | + | |
296 | 298 |
| |
297 | 299 |
| |
298 |
| - | |
| 300 | + | |
299 | 301 |
| |
| 302 | + | |
| 303 | + | |
| 304 | + | |
| 305 | + | |
300 | 306 |
| |
301 | 307 |
| |
302 | 308 |
|
Lines changed: 16 additions & 15 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
43 | 43 |
| |
44 | 44 |
| |
45 | 45 |
| |
46 |
| - | |
47 |
| - | |
| 46 | + | |
| 47 | + | |
48 | 48 |
| |
49 |
| - | |
| 49 | + | |
50 | 50 |
| |
51 | 51 |
| |
52 | 52 |
| |
| |||
84 | 84 |
| |
85 | 85 |
| |
86 | 86 |
| |
87 |
| - | |
88 |
| - | |
| 87 | + | |
| 88 | + | |
89 | 89 |
| |
90 | 90 |
| |
91 |
| - | |
| 91 | + | |
92 | 92 |
| |
93 | 93 |
| |
94 | 94 |
| |
| |||
114 | 114 |
| |
115 | 115 |
| |
116 | 116 |
| |
117 |
| - | |
| 117 | + | |
118 | 118 |
| |
119 | 119 |
| |
120 | 120 |
| |
| |||
148 | 148 |
| |
149 | 149 |
| |
150 | 150 |
| |
151 |
| - | |
| 151 | + | |
152 | 152 |
| |
153 | 153 |
| |
154 | 154 |
| |
| |||
158 | 158 |
| |
159 | 159 |
| |
160 | 160 |
| |
161 |
| - | |
| 161 | + | |
162 | 162 |
| |
163 | 163 |
| |
164 | 164 |
| |
| |||
180 | 180 |
| |
181 | 181 |
| |
182 | 182 |
| |
| 183 | + | |
183 | 184 |
| |
184 | 185 |
| |
185 | 186 |
| |
186 | 187 |
| |
187 | 188 |
| |
188 | 189 |
| |
189 |
| - | |
| 190 | + | |
190 | 191 |
| |
191 | 192 |
| |
192 | 193 |
| |
| |||
217 | 218 |
| |
218 | 219 |
| |
219 | 220 |
| |
220 |
| - | |
| 221 | + | |
221 | 222 |
| |
222 | 223 |
| |
223 | 224 |
| |
| |||
259 | 260 |
| |
260 | 261 |
| |
261 | 262 |
| |
262 |
| - | |
| 263 | + | |
263 | 264 |
| |
264 | 265 |
| |
265 | 266 |
| |
| |||
287 | 288 |
| |
288 | 289 |
| |
289 | 290 |
| |
290 |
| - | |
| 291 | + | |
291 | 292 |
| |
292 | 293 |
| |
293 | 294 |
| |
| |||
315 | 316 |
| |
316 | 317 |
| |
317 | 318 |
| |
318 |
| - | |
| 319 | + | |
319 | 320 |
| |
320 | 321 |
| |
321 | 322 |
| |
| |||
346 | 347 |
| |
347 | 348 |
| |
348 | 349 |
| |
349 |
| - | |
| 350 | + | |
350 | 351 |
| |
351 | 352 |
| |
352 | 353 |
| |
|
Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
231 | 231 |
| |
232 | 232 |
| |
233 | 233 |
| |
234 |
| - | |
| 234 | + | |
| 235 | + | |
| 236 | + | |
235 | 237 |
| |
236 |
| - | |
| 238 | + | |
237 | 239 |
| |
238 | 240 |
| |
239 | 241 |
| |
|
Lines changed: 8 additions & 7 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
55 | 55 |
| |
56 | 56 |
| |
57 | 57 |
| |
58 |
| - | |
| 58 | + | |
59 | 59 |
| |
60 | 60 |
| |
61 |
| - | |
| 61 | + | |
62 | 62 |
| |
63 | 63 |
| |
64 | 64 |
| |
| |||
133 | 133 |
| |
134 | 134 |
| |
135 | 135 |
| |
136 |
| - | |
| 136 | + | |
137 | 137 |
| |
138 | 138 |
| |
139 | 139 |
| |
| |||
152 | 152 |
| |
153 | 153 |
| |
154 | 154 |
| |
155 |
| - | |
156 |
| - | |
157 |
| - | |
158 |
| - | |
| 155 | + | |
| 156 | + | |
| 157 | + | |
159 | 158 |
| |
160 | 159 |
| |
161 | 160 |
| |
162 | 161 |
| |
163 | 162 |
| |
| 163 | + | |
| 164 | + | |
164 | 165 |
| |
165 | 166 |
| |
166 | 167 |
| |
|
0 commit comments