Skip to content

Commit 5ddc143

Browse files
committed
documentation
1 parent b33860f commit 5ddc143

1 file changed

Lines changed: 1 addition & 2 deletions

File tree

tmp_scripts/utils/sepal_gpu.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -162,10 +162,9 @@ def _cuda_kernel_diffusion_gpu(
162162
results_all = cp.full(n_genes, -999999.0, dtype=cp.float64) # Results for ALL genes
163163

164164
# Calculate shared memory (fixed size per block, independent of n_cells)
165-
tile_size = 1024 # Fixed tile size for scalability
166165
min_blocks = 256 # Hardware-specific minimum
167166
blocks_per_grid = max(n_genes, min_blocks)
168-
shared_mem_size = tile_size * 2 * 8 # 2 double arrays per tile
167+
shared_mem_size = threads_per_block * 2 * 8 # 2 double arrays per thread
169168

170169

171170
# **SINGLE KERNEL LAUNCH FOR ALL GENES**

0 commit comments

Comments (0)