We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 89d3014 commit 14f0a4f (Copy full SHA for 14f0a4f)
xformers/ops/fmha/_triton/splitk_kernels.py
@@ -392,7 +392,7 @@ def _fwd_kernel_splitK(
392
logical_page_idx = logical_block_idx // BLOCKS_IN_PAGE
393
physical_page_idx = tl.load(
394
block_table + stride_blocktablesl * logical_page_idx
395
- ).to(tl.int64) # Cast to int64 to avoid overflow when offset > 2^31
+ ).to(tl.int32)
396
offset = physical_page_idx * PAGE_SIZE + block_offset_in_page * BLOCK_N
397
398
current_block_size = min(hi - start_n, BLOCK_N)
0 commit comments